From 63d3091b24501c8d00f7d9013ea94744793fabc5 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@getlookcrowd.corp.yahoo.com>
Date: Thu, 7 Jun 2012 12:31:49 -0700
Subject: [PATCH 001/434] Move binaries to an actual binary dir.

---
 cloud-init-cfg.py => bin/cloud-init-cfg.py     | 0
 cloud-init-query.py => bin/cloud-init-query.py | 0
 cloud-init.py => bin/cloud-init.py             | 0
 3 files changed, 0 insertions(+), 0 deletions(-)
 rename cloud-init-cfg.py => bin/cloud-init-cfg.py (100%)
 rename cloud-init-query.py => bin/cloud-init-query.py (100%)
 rename cloud-init.py => bin/cloud-init.py (100%)

diff --git a/cloud-init-cfg.py b/bin/cloud-init-cfg.py
similarity index 100%
rename from cloud-init-cfg.py
rename to bin/cloud-init-cfg.py
diff --git a/cloud-init-query.py b/bin/cloud-init-query.py
similarity index 100%
rename from cloud-init-query.py
rename to bin/cloud-init-query.py
diff --git a/cloud-init.py b/bin/cloud-init.py
similarity index 100%
rename from cloud-init.py
rename to bin/cloud-init.py

From 78ce3cbfe03243f37e297d182f0252e802c3e787 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 12:42:38 -0700
Subject: [PATCH 002/434] 1. Adding some new helper files that split off file
 inclusion, templating, importing, constant usage. 1. Move all datasources to
 a new sources directory 1. Rename some files to be more consistent with
 python file/module naming.

---
 cloudinit/constants.py                        | 37 ++++++++
 cloudinit/{ => handlers}/DataSource.py        |  0
 .../{ => handlers}/DataSourceCloudStack.py    |  0
 .../{ => handlers}/DataSourceConfigDrive.py   |  0
 cloudinit/{ => handlers}/DataSourceEc2.py     |  0
 cloudinit/{ => handlers}/DataSourceMAAS.py    |  0
 cloudinit/{ => handlers}/DataSourceNoCloud.py |  0
 cloudinit/{ => handlers}/DataSourceOVF.py     |  0
 .../{CloudConfig => handlers}/__init__.py     |  0
 .../cc_apt_pipelining.py                      |  0
 .../cc_apt_update_upgrade.py                  |  0
 .../{CloudConfig => handlers}/cc_bootcmd.py   |  0
 .../{CloudConfig => handlers}/cc_byobu.py     |  0
 .../{CloudConfig => handlers}/cc_ca_certs.py  |  0
 .../{CloudConfig => handlers}/cc_chef.py      |  0
 .../cc_disable_ec2_metadata.py                |  0
 .../cc_final_message.py                       |  0
 cloudinit/{CloudConfig => handlers}/cc_foo.py |  0
 .../{CloudConfig => handlers}/cc_grub_dpkg.py |  0
 .../cc_keys_to_console.py                     |  0
 .../{CloudConfig => handlers}/cc_landscape.py |  0
 .../{CloudConfig => handlers}/cc_locale.py    |  0
 .../cc_mcollective.py                         |  0
 .../{CloudConfig => handlers}/cc_mounts.py    |  0
 .../cc_phone_home.py                          |  0
 .../{CloudConfig => handlers}/cc_puppet.py    |  0
 .../{CloudConfig => handlers}/cc_resizefs.py  |  0
 .../cc_rightscale_userdata.py                 |  0
 .../{CloudConfig => handlers}/cc_rsyslog.py   |  0
 .../{CloudConfig => handlers}/cc_runcmd.py    |  0
 .../cc_salt_minion.py                         |  0
 .../cc_scripts_per_boot.py                    |  0
 .../cc_scripts_per_instance.py                |  0
 .../cc_scripts_per_once.py                    |  0
 .../cc_scripts_user.py                        |  0
 .../cc_set_hostname.py                        |  0
 .../cc_set_passwords.py                       |  0
 cloudinit/{CloudConfig => handlers}/cc_ssh.py |  0
 .../cc_ssh_import_id.py                       |  0
 .../{CloudConfig => handlers}/cc_timezone.py  |  0
 .../cc_update_etc_hosts.py                    |  0
 .../cc_update_hostname.py                     |  0
 cloudinit/importer.py                         | 11 +++
 cloudinit/includer.py                         | 65 +++++++++++++
 cloudinit/log.py                              | 94 +++++++++++++++++++
 cloudinit/{SshUtil.py => ssh_util.py}         |  0
 cloudinit/templater.py                        | 17 ++++
 .../{UserDataHandler.py => user_data.py}      |  0
 48 files changed, 224 insertions(+)
 create mode 100644 cloudinit/constants.py
 rename cloudinit/{ => handlers}/DataSource.py (100%)
 rename cloudinit/{ => handlers}/DataSourceCloudStack.py (100%)
 rename cloudinit/{ => handlers}/DataSourceConfigDrive.py (100%)
 rename cloudinit/{ => handlers}/DataSourceEc2.py (100%)
 rename cloudinit/{ => handlers}/DataSourceMAAS.py (100%)
 rename cloudinit/{ => handlers}/DataSourceNoCloud.py (100%)
 rename cloudinit/{ => handlers}/DataSourceOVF.py (100%)
 rename cloudinit/{CloudConfig => handlers}/__init__.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_apt_pipelining.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_apt_update_upgrade.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_bootcmd.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_byobu.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_ca_certs.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_chef.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_disable_ec2_metadata.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_final_message.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_foo.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_grub_dpkg.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_keys_to_console.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_landscape.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_locale.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_mcollective.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_mounts.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_phone_home.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_puppet.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_resizefs.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_rightscale_userdata.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_rsyslog.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_runcmd.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_salt_minion.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_scripts_per_boot.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_scripts_per_instance.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_scripts_per_once.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_scripts_user.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_set_hostname.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_set_passwords.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_ssh.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_ssh_import_id.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_timezone.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_update_etc_hosts.py (100%)
 rename cloudinit/{CloudConfig => handlers}/cc_update_hostname.py (100%)
 create mode 100644 cloudinit/importer.py
 create mode 100644 cloudinit/includer.py
 create mode 100644 cloudinit/log.py
 rename cloudinit/{SshUtil.py => ssh_util.py} (100%)
 create mode 100644 cloudinit/templater.py
 rename cloudinit/{UserDataHandler.py => user_data.py} (100%)

diff --git a/cloudinit/constants.py b/cloudinit/constants.py
new file mode 100644
index 00000000..7bc90f27
--- /dev/null
+++ b/cloudinit/constants.py
@@ -0,0 +1,37 @@
+import os
+
+VAR_LIB_DIR = '/var/lib/cloud'  # base directory the paths below are built on
+CUR_INSTANCE_LINK = os.path.join(VAR_LIB_DIR, "instance")
+BOOT_FINISHED = os.path.join(CUR_INSTANCE_LINK, "boot-finished")
+SEED_DIR = os.path.join(VAR_LIB_DIR, "seed")
+
+CFG_ENV_NAME = "CLOUD_CFG"  # NOTE(review): presumably an environment variable name - confirm
+CLOUD_CONFIG = '/etc/cloud/cloud.cfg'
+
+CFG_BUILTIN = {  # NOTE(review): presumably the built-in configuration defaults - confirm
+    'datasource_list': ['NoCloud',
+                        'ConfigDrive',
+                        'OVF',
+                        'MAAS',
+                        'Ec2',
+                        'CloudStack'],
+    'def_log_file': '/var/log/cloud-init.log',
+    'log_cfgs': [],
+    'syslog_fix_perms': 'syslog:adm'
+}
+
+PATH_MAP = {  # logical name -> file or directory name (base directory is not set here)
+   "handlers": "handlers",
+   "scripts": "scripts",
+   "sem": "sem",
+   "boothooks": "boothooks",
+   "userdata_raw": "user-data.txt",
+   "userdata": "user-data.txt.i",
+   "obj_pkl": "obj.pkl",
+   "cloud_config": "cloud-config.txt",
+   "data": "data",
+}
+
+PER_INSTANCE = "once-per-instance"  # the three PER_* values name run frequencies
+PER_ALWAYS = "always"
+PER_ONCE = "once"
diff --git a/cloudinit/DataSource.py b/cloudinit/handlers/DataSource.py
similarity index 100%
rename from cloudinit/DataSource.py
rename to cloudinit/handlers/DataSource.py
diff --git a/cloudinit/DataSourceCloudStack.py b/cloudinit/handlers/DataSourceCloudStack.py
similarity index 100%
rename from cloudinit/DataSourceCloudStack.py
rename to cloudinit/handlers/DataSourceCloudStack.py
diff --git a/cloudinit/DataSourceConfigDrive.py b/cloudinit/handlers/DataSourceConfigDrive.py
similarity index 100%
rename from cloudinit/DataSourceConfigDrive.py
rename to cloudinit/handlers/DataSourceConfigDrive.py
diff --git a/cloudinit/DataSourceEc2.py b/cloudinit/handlers/DataSourceEc2.py
similarity index 100%
rename from cloudinit/DataSourceEc2.py
rename to cloudinit/handlers/DataSourceEc2.py
diff --git a/cloudinit/DataSourceMAAS.py b/cloudinit/handlers/DataSourceMAAS.py
similarity index 100%
rename from cloudinit/DataSourceMAAS.py
rename to cloudinit/handlers/DataSourceMAAS.py
diff --git a/cloudinit/DataSourceNoCloud.py b/cloudinit/handlers/DataSourceNoCloud.py
similarity index 100%
rename from cloudinit/DataSourceNoCloud.py
rename to cloudinit/handlers/DataSourceNoCloud.py
diff --git a/cloudinit/DataSourceOVF.py b/cloudinit/handlers/DataSourceOVF.py
similarity index 100%
rename from cloudinit/DataSourceOVF.py
rename to cloudinit/handlers/DataSourceOVF.py
diff --git a/cloudinit/CloudConfig/__init__.py b/cloudinit/handlers/__init__.py
similarity index 100%
rename from cloudinit/CloudConfig/__init__.py
rename to cloudinit/handlers/__init__.py
diff --git a/cloudinit/CloudConfig/cc_apt_pipelining.py b/cloudinit/handlers/cc_apt_pipelining.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_apt_pipelining.py
rename to cloudinit/handlers/cc_apt_pipelining.py
diff --git a/cloudinit/CloudConfig/cc_apt_update_upgrade.py b/cloudinit/handlers/cc_apt_update_upgrade.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_apt_update_upgrade.py
rename to cloudinit/handlers/cc_apt_update_upgrade.py
diff --git a/cloudinit/CloudConfig/cc_bootcmd.py b/cloudinit/handlers/cc_bootcmd.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_bootcmd.py
rename to cloudinit/handlers/cc_bootcmd.py
diff --git a/cloudinit/CloudConfig/cc_byobu.py b/cloudinit/handlers/cc_byobu.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_byobu.py
rename to cloudinit/handlers/cc_byobu.py
diff --git a/cloudinit/CloudConfig/cc_ca_certs.py b/cloudinit/handlers/cc_ca_certs.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_ca_certs.py
rename to cloudinit/handlers/cc_ca_certs.py
diff --git a/cloudinit/CloudConfig/cc_chef.py b/cloudinit/handlers/cc_chef.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_chef.py
rename to cloudinit/handlers/cc_chef.py
diff --git a/cloudinit/CloudConfig/cc_disable_ec2_metadata.py b/cloudinit/handlers/cc_disable_ec2_metadata.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_disable_ec2_metadata.py
rename to cloudinit/handlers/cc_disable_ec2_metadata.py
diff --git a/cloudinit/CloudConfig/cc_final_message.py b/cloudinit/handlers/cc_final_message.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_final_message.py
rename to cloudinit/handlers/cc_final_message.py
diff --git a/cloudinit/CloudConfig/cc_foo.py b/cloudinit/handlers/cc_foo.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_foo.py
rename to cloudinit/handlers/cc_foo.py
diff --git a/cloudinit/CloudConfig/cc_grub_dpkg.py b/cloudinit/handlers/cc_grub_dpkg.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_grub_dpkg.py
rename to cloudinit/handlers/cc_grub_dpkg.py
diff --git a/cloudinit/CloudConfig/cc_keys_to_console.py b/cloudinit/handlers/cc_keys_to_console.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_keys_to_console.py
rename to cloudinit/handlers/cc_keys_to_console.py
diff --git a/cloudinit/CloudConfig/cc_landscape.py b/cloudinit/handlers/cc_landscape.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_landscape.py
rename to cloudinit/handlers/cc_landscape.py
diff --git a/cloudinit/CloudConfig/cc_locale.py b/cloudinit/handlers/cc_locale.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_locale.py
rename to cloudinit/handlers/cc_locale.py
diff --git a/cloudinit/CloudConfig/cc_mcollective.py b/cloudinit/handlers/cc_mcollective.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_mcollective.py
rename to cloudinit/handlers/cc_mcollective.py
diff --git a/cloudinit/CloudConfig/cc_mounts.py b/cloudinit/handlers/cc_mounts.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_mounts.py
rename to cloudinit/handlers/cc_mounts.py
diff --git a/cloudinit/CloudConfig/cc_phone_home.py b/cloudinit/handlers/cc_phone_home.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_phone_home.py
rename to cloudinit/handlers/cc_phone_home.py
diff --git a/cloudinit/CloudConfig/cc_puppet.py b/cloudinit/handlers/cc_puppet.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_puppet.py
rename to cloudinit/handlers/cc_puppet.py
diff --git a/cloudinit/CloudConfig/cc_resizefs.py b/cloudinit/handlers/cc_resizefs.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_resizefs.py
rename to cloudinit/handlers/cc_resizefs.py
diff --git a/cloudinit/CloudConfig/cc_rightscale_userdata.py b/cloudinit/handlers/cc_rightscale_userdata.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_rightscale_userdata.py
rename to cloudinit/handlers/cc_rightscale_userdata.py
diff --git a/cloudinit/CloudConfig/cc_rsyslog.py b/cloudinit/handlers/cc_rsyslog.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_rsyslog.py
rename to cloudinit/handlers/cc_rsyslog.py
diff --git a/cloudinit/CloudConfig/cc_runcmd.py b/cloudinit/handlers/cc_runcmd.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_runcmd.py
rename to cloudinit/handlers/cc_runcmd.py
diff --git a/cloudinit/CloudConfig/cc_salt_minion.py b/cloudinit/handlers/cc_salt_minion.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_salt_minion.py
rename to cloudinit/handlers/cc_salt_minion.py
diff --git a/cloudinit/CloudConfig/cc_scripts_per_boot.py b/cloudinit/handlers/cc_scripts_per_boot.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_scripts_per_boot.py
rename to cloudinit/handlers/cc_scripts_per_boot.py
diff --git a/cloudinit/CloudConfig/cc_scripts_per_instance.py b/cloudinit/handlers/cc_scripts_per_instance.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_scripts_per_instance.py
rename to cloudinit/handlers/cc_scripts_per_instance.py
diff --git a/cloudinit/CloudConfig/cc_scripts_per_once.py b/cloudinit/handlers/cc_scripts_per_once.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_scripts_per_once.py
rename to cloudinit/handlers/cc_scripts_per_once.py
diff --git a/cloudinit/CloudConfig/cc_scripts_user.py b/cloudinit/handlers/cc_scripts_user.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_scripts_user.py
rename to cloudinit/handlers/cc_scripts_user.py
diff --git a/cloudinit/CloudConfig/cc_set_hostname.py b/cloudinit/handlers/cc_set_hostname.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_set_hostname.py
rename to cloudinit/handlers/cc_set_hostname.py
diff --git a/cloudinit/CloudConfig/cc_set_passwords.py b/cloudinit/handlers/cc_set_passwords.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_set_passwords.py
rename to cloudinit/handlers/cc_set_passwords.py
diff --git a/cloudinit/CloudConfig/cc_ssh.py b/cloudinit/handlers/cc_ssh.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_ssh.py
rename to cloudinit/handlers/cc_ssh.py
diff --git a/cloudinit/CloudConfig/cc_ssh_import_id.py b/cloudinit/handlers/cc_ssh_import_id.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_ssh_import_id.py
rename to cloudinit/handlers/cc_ssh_import_id.py
diff --git a/cloudinit/CloudConfig/cc_timezone.py b/cloudinit/handlers/cc_timezone.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_timezone.py
rename to cloudinit/handlers/cc_timezone.py
diff --git a/cloudinit/CloudConfig/cc_update_etc_hosts.py b/cloudinit/handlers/cc_update_etc_hosts.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_update_etc_hosts.py
rename to cloudinit/handlers/cc_update_etc_hosts.py
diff --git a/cloudinit/CloudConfig/cc_update_hostname.py b/cloudinit/handlers/cc_update_hostname.py
similarity index 100%
rename from cloudinit/CloudConfig/cc_update_hostname.py
rename to cloudinit/handlers/cc_update_hostname.py
diff --git a/cloudinit/importer.py b/cloudinit/importer.py
new file mode 100644
index 00000000..deea0956
--- /dev/null
+++ b/cloudinit/importer.py
@@ -0,0 +1,21 @@
+# vim: tabstop=4 shiftwidth=4 softtabstop=4
+
+import sys
+
+
+def import_module(module_name):
+    """Import a module by its dotted name and hand back the module object.
+
+    The object is looked up in sys.modules instead of being taken from
+    the __import__() return value, which for a dotted name is the
+    top-level package and not the module that was asked for.
+
+    Returns the sys.modules entry for module_name (None if absent).
+    Raises RuntimeError when the import fails with an ImportError.
+    """
+    try:
+        __import__(module_name)
+    except ImportError as failure:
+        message = 'Could not load module %s: %s' % (module_name, failure)
+        raise RuntimeError(message)
+    return sys.modules.get(module_name, None)
diff --git a/cloudinit/includer.py b/cloudinit/includer.py
new file mode 100644
index 00000000..d1022c5a
--- /dev/null
+++ b/cloudinit/includer.py
@@ -0,0 +1,89 @@
+import os
+import re
+
+from cloudinit import downloader as down
+from cloudinit import exceptions as excp
+from cloudinit import log as logging
+from cloudinit import shell as sh
+
+# Matches a whole "#include <name>" or "#opt_include <name>" line; group 1
+# is the directive and group 2 is the remainder of that line.
+INCLUDE_PATT = re.compile("^#(opt_include|include)[ \t](.*)$", re.MULTILINE)
+# Directives for which an IOError while including is ignored.
+OPT_PATS = ['opt_include']
+
+LOG = logging.getLogger(__name__)
+
+
+class Includer(object):
+    """Expands the include directives of a file, recursively.
+
+    Every directive line is replaced by the expanded contents of the file
+    it names; relative names are resolved against the directory of the
+    file that holds the directive.
+    """
+
+    def __init__(self, root_fn, stack_limit=10):
+        """Store the starting file and the maximum include depth."""
+        self.root_fn = root_fn
+        self.stack_limit = stack_limit
+
+    def _read_file(self, fname):
+        """Return the raw contents of fname."""
+        return sh.read_file(fname)
+
+    def _read(self, fname, stack, rel):
+        """Return the contents of fname with all includes expanded.
+
+        stack is the set of canonical names currently being expanded and
+        rel is the directory a relative fname is resolved against.
+
+        Raises excp.StackExceeded once stack holds stack_limit entries and
+        excp.RecursiveInclude when fname is already being expanded.  An
+        IOError is only swallowed for "#opt_include"; else it propagates.
+        """
+        if len(stack) >= self.stack_limit:
+            raise excp.StackExceeded("Stack limit of %s reached while including %s" % (self.stack_limit, fname))
+
+        canon_fname = self._canon_name(fname, rel)
+        if canon_fname in stack:
+            raise excp.RecursiveInclude("File %s recursively included" % (canon_fname))
+
+        new_rel = os.path.dirname(canon_fname)
+
+        def include_cb(match):
+            is_optional = (match.group(1).lower() in OPT_PATS)
+            fn = match.group(2).strip()
+            if not fn:
+                # Should we die??
+                return match.group(0)
+            try:
+                LOG.debug("Including file %s", fn)
+                return self._read(fn, stack, new_rel)
+            except IOError:
+                if is_optional:
+                    return ''
+                raise
+
+        stack.add(canon_fname)
+        try:
+            contents = self._read_file(canon_fname)
+            return INCLUDE_PATT.sub(include_cb, contents)
+        finally:
+            # The entry was added under its canonical name, so it must be
+            # removed under that name as well (the name as given is often
+            # not in the set).  Using finally also drops it when an
+            # include fails, e.g. an optional one that is then skipped.
+            stack.remove(canon_fname)
+
+    def _canon_name(self, fname, rel):
+        """Return the real path of fname (joined onto rel if relative)."""
+        fname = fname.strip()
+        if not fname.startswith("/"):
+            fname = os.path.sep.join([rel, fname])
+        return os.path.realpath(fname)
+
+    def read(self, relative_to="."):
+        """Return the fully expanded contents of root_fn."""
+        stack = set()
+        return self._read(self.root_fn, stack, rel=relative_to)
diff --git a/cloudinit/log.py b/cloudinit/log.py
new file mode 100644
index 00000000..4d270045
--- /dev/null
+++ b/cloudinit/log.py
@@ -0,0 +1,127 @@
+# vim: tabstop=4 shiftwidth=4 softtabstop=4
+
+import logging
+import logging.handlers
+import sys
+
+# Logging levels for easy access
+CRITICAL = logging.CRITICAL
+FATAL = logging.FATAL
+ERROR = logging.ERROR
+WARNING = logging.WARNING
+WARN = logging.WARN
+INFO = logging.INFO
+DEBUG = logging.DEBUG
+NOTSET = logging.NOTSET
+
+# File log rotation settings
+ROTATE_AMOUNT = 10  # Only keep the past 9 + 1 active
+ROTATE_SIZE = 10 * 1024 * 1024  # 10 MB
+
+
+class ConsoleFormatter(logging.Formatter):
+    """Formatter that offers a short '%(minilevelname)s' level prefix."""
+
+    def _get_mini_level(self, record):
+        """Return '<first letter of the level>: ', or '' for INFO/NOTSET."""
+        if record.levelno in [INFO, NOTSET] or not record.levelname:
+            return ''
+        lvlname = record.levelname
+        return lvlname[0].upper() + ": "
+
+    def format(self, record):
+        """Format record with the extra 'minilevelname' key available."""
+        record.message = record.getMessage()
+        # Work on a copy so the extra key is not stored on the record.
+        rdict = dict(record.__dict__)
+        rdict['minilevelname'] = self._get_mini_level(record)
+        # Skipping exception info for the console...
+        return self._fmt % (rdict)
+
+
+def setupLogging(level, filename=None, filelevel=logging.DEBUG):
+    """Attach a stdout handler and, optionally, a rotating file handler.
+
+    level is applied to the console handler and to the 'cloudinit' logger
+    itself; filelevel is applied to the file handler, which is only
+    created when filename is given.
+    """
+    root = getLogger()
+    consolelg = logging.StreamHandler(sys.stdout)
+    consolelg.setFormatter(ConsoleFormatter('%(minilevelname)s%(message)s'))
+    consolelg.setLevel(level)
+    root.addHandler(consolelg)
+    if filename:
+        filelg = logging.handlers.RotatingFileHandler(filename, maxBytes=ROTATE_SIZE, backupCount=ROTATE_AMOUNT)
+        filelg.setFormatter(logging.Formatter('%(levelname)s: @%(name)s : %(message)s'))
+        filelg.setLevel(filelevel)
+        root.addHandler(filelg)
+    # NOTE(review): the logger level is `level`, so records below it never
+    # reach the file handler even when filelevel is lower - confirm intent.
+    root.setLevel(level)
+
+
+def logging_set_from_cfg(cfg):
+    """Configure logging from the first usable entry found in cfg.
+
+    The old 'log_cfg' key (a single configuration) wins when it is set;
+    otherwise every item of 'log_cfgs' is a candidate, with list items
+    joined line by line.  Candidates are fed to logging.config.fileConfig()
+    in order and the first one that loads is used.
+
+    Writes a warning to stderr and returns when there are no candidates;
+    raises Exception when none of the candidates could be loaded.
+    """
+    # Imported here because nothing else in this module needs them; the
+    # cloudinit import is also kept local since other cloudinit modules
+    # import this one (NOTE(review): avoids a possible import cycle).
+    import logging.config
+    from StringIO import StringIO
+
+    from cloudinit import util
+
+    log_cfgs = []
+    logcfg = util.get_cfg_option_str(cfg, "log_cfg", False)
+    if logcfg:
+        # if there is a 'log_cfg' entry in the config, respect
+        # it, it is the old keyname
+        log_cfgs = [logcfg]
+    elif "log_cfgs" in cfg:
+        # A distinct loop name keeps the `cfg` argument intact.
+        for a_cfg in cfg['log_cfgs']:
+            if isinstance(a_cfg, list):
+                log_cfgs.append('\n'.join(a_cfg))
+            else:
+                log_cfgs.append(a_cfg)
+
+    if not log_cfgs:
+        sys.stderr.write("Warning, no logging configured\n")
+        return
+
+    for logcfg in log_cfgs:
+        try:
+            logging.config.fileConfig(StringIO(logcfg))
+            return
+        except Exception:
+            # This candidate is unusable, fall through to the next one.
+            pass
+
+    raise Exception("no valid logging found\n")
+
+
+def getLogger(name='cloudinit'):
+    """Return the logger called name (the 'cloudinit' logger by default)."""
+    return logging.getLogger(name)
+
+
+# Fixes this annoyance...
+# No handlers could be found for logger XXX annoying output...
+try:
+    from logging import NullHandler
+except ImportError:
+    class NullHandler(logging.Handler):
+        def emit(self, record):
+            pass
+
+logger = getLogger()
+logger.addHandler(NullHandler())
diff --git a/cloudinit/SshUtil.py b/cloudinit/ssh_util.py
similarity index 100%
rename from cloudinit/SshUtil.py
rename to cloudinit/ssh_util.py
diff --git a/cloudinit/templater.py b/cloudinit/templater.py
new file mode 100644
index 00000000..b6b320ab
--- /dev/null
+++ b/cloudinit/templater.py
@@ -0,0 +1,24 @@
+import os
+
+from Cheetah.Template import Template
+
+from cloudinit import util
+
+TEMPLATE_DIR = '/etc/cloud/templates/'
+
+
+def render_to_file(template, outfile, searchList):
+    """Render the file TEMPLATE_DIR/template and write the text to outfile.
+
+    searchList is wrapped in a one element list and passed on as
+    Cheetah's searchList argument.
+    """
+    template_path = os.path.join(TEMPLATE_DIR, template)
+    rendered = Template(file=template_path, searchList=[searchList])
+    util.write_file(outfile, rendered.respond())
+
+
+def render_string(template, searchList):
+    """Render the template source text and return the resulting text."""
+    renderer = Template(template, searchList=[searchList])
+    return renderer.respond()
diff --git a/cloudinit/UserDataHandler.py b/cloudinit/user_data.py
similarity index 100%
rename from cloudinit/UserDataHandler.py
rename to cloudinit/user_data.py

From d34de5d4ab24c78704e5f8407d8459eba9ab94f5 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 12:45:28 -0700
Subject: [PATCH 003/434] Darn it. Those shouldn't be there!

---
 cloudinit/{handlers => sources}/DataSource.py            | 0
 cloudinit/{handlers => sources}/DataSourceCloudStack.py  | 0
 cloudinit/{handlers => sources}/DataSourceConfigDrive.py | 0
 cloudinit/{handlers => sources}/DataSourceEc2.py         | 0
 cloudinit/{handlers => sources}/DataSourceMAAS.py        | 0
 cloudinit/{handlers => sources}/DataSourceNoCloud.py     | 0
 cloudinit/{handlers => sources}/DataSourceOVF.py         | 0
 cloudinit/sources/__init__.py                            | 0
 8 files changed, 0 insertions(+), 0 deletions(-)
 rename cloudinit/{handlers => sources}/DataSource.py (100%)
 rename cloudinit/{handlers => sources}/DataSourceCloudStack.py (100%)
 rename cloudinit/{handlers => sources}/DataSourceConfigDrive.py (100%)
 rename cloudinit/{handlers => sources}/DataSourceEc2.py (100%)
 rename cloudinit/{handlers => sources}/DataSourceMAAS.py (100%)
 rename cloudinit/{handlers => sources}/DataSourceNoCloud.py (100%)
 rename cloudinit/{handlers => sources}/DataSourceOVF.py (100%)
 create mode 100644 cloudinit/sources/__init__.py

diff --git a/cloudinit/handlers/DataSource.py b/cloudinit/sources/DataSource.py
similarity index 100%
rename from cloudinit/handlers/DataSource.py
rename to cloudinit/sources/DataSource.py
diff --git a/cloudinit/handlers/DataSourceCloudStack.py b/cloudinit/sources/DataSourceCloudStack.py
similarity index 100%
rename from cloudinit/handlers/DataSourceCloudStack.py
rename to cloudinit/sources/DataSourceCloudStack.py
diff --git a/cloudinit/handlers/DataSourceConfigDrive.py b/cloudinit/sources/DataSourceConfigDrive.py
similarity index 100%
rename from cloudinit/handlers/DataSourceConfigDrive.py
rename to cloudinit/sources/DataSourceConfigDrive.py
diff --git a/cloudinit/handlers/DataSourceEc2.py b/cloudinit/sources/DataSourceEc2.py
similarity index 100%
rename from cloudinit/handlers/DataSourceEc2.py
rename to cloudinit/sources/DataSourceEc2.py
diff --git a/cloudinit/handlers/DataSourceMAAS.py b/cloudinit/sources/DataSourceMAAS.py
similarity index 100%
rename from cloudinit/handlers/DataSourceMAAS.py
rename to cloudinit/sources/DataSourceMAAS.py
diff --git a/cloudinit/handlers/DataSourceNoCloud.py b/cloudinit/sources/DataSourceNoCloud.py
similarity index 100%
rename from cloudinit/handlers/DataSourceNoCloud.py
rename to cloudinit/sources/DataSourceNoCloud.py
diff --git a/cloudinit/handlers/DataSourceOVF.py b/cloudinit/sources/DataSourceOVF.py
similarity index 100%
rename from cloudinit/handlers/DataSourceOVF.py
rename to cloudinit/sources/DataSourceOVF.py
diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
new file mode 100644
index 00000000..e69de29b

From c6861732769b2668ae0726fef226098713724659 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 12:48:22 -0700
Subject: [PATCH 004/434] Add a file that just deals with handling modules and
 part data

---
 cloudinit/handling.py | 101 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 101 insertions(+)
 create mode 100644 cloudinit/handling.py

diff --git a/cloudinit/handling.py b/cloudinit/handling.py
new file mode 100644
index 00000000..553abe4f
--- /dev/null
+++ b/cloudinit/handling.py
@@ -0,0 +1,142 @@
+import os
+import sys
+import traceback
+
+from cloudinit import importer
+from cloudinit import log as logging
+from cloudinit import util
+from cloudinit.constants import (PER_INSTANCE, PER_ALWAYS)
+
+LOG = logging.getLogger(__name__)
+
+
+class InternalPartHandler:
+    """Wraps a plain callable so it can be used as a part handler."""
+
+    # NOTE(review): instances set `frequency`; `freq` looks unused here.
+    freq = PER_INSTANCE
+    mtypes = []
+    handler_version = 1
+    handler = None
+
+    def __init__(self, handler, mtypes, frequency, version=2):
+        """Store the callable, its content types, frequency and version."""
+        self.handler = handler
+        self.mtypes = mtypes
+        self.frequency = frequency
+        self.handler_version = version
+
+    def __repr__(self):
+        # The one element tuple keeps '%' from unpacking a tuple of types.
+        return "InternalPartHandler: [%s]" % (self.mtypes,)
+
+    def list_types(self):
+        """Return the content types this handler was created for."""
+        return self.mtypes
+
+    def handle_part(self, data, ctype, filename, payload, frequency):
+        """Pass one part to the wrapped callable and return its result."""
+        return self.handler(data, ctype, filename, payload, frequency)
+
+
+def handler_register(mod, part_handlers, data, frequency=PER_INSTANCE):
+    """Map every type of mod to it in part_handlers, then begin it.
+
+    A handler lacking a handler_version attribute is marked as version 1.
+    Returns mod.
+    """
+    if not hasattr(mod, "handler_version"):
+        setattr(mod, "handler_version", 1)
+
+    for mtype in mod.list_types():
+        part_handlers[mtype] = mod
+
+    handler_call_begin(mod, data, frequency)
+    return mod
+
+
+def handler_call_begin(mod, data, frequency):
+    """Send the "__begin__" pseudo part to mod."""
+    handler_handle_part(mod, data, "__begin__", None, None, frequency)
+
+
+def handler_call_end(mod, data, frequency):
+    """Send the "__end__" pseudo part to mod."""
+    handler_handle_part(mod, data, "__end__", None, None, frequency)
+
+
+def handler_handle_part(mod, data, ctype, filename, payload, frequency):
+    """Call mod.handle_part() when mod is due to run at this frequency.
+
+    mod runs when its own frequency (PER_INSTANCE if it declares none) is
+    PER_ALWAYS, or when that and the requested frequency are both
+    PER_INSTANCE.  Version 1 handlers are called without the frequency
+    argument.  An error raised by the handler is logged and printed to
+    stderr instead of being propagated.
+    """
+    # only add the handler if the module should run
+    modfreq = getattr(mod, "frequency", PER_INSTANCE)
+    if not (modfreq == PER_ALWAYS or
+            (frequency == PER_INSTANCE and modfreq == PER_INSTANCE)):
+        return
+    try:
+        if mod.handler_version == 1:
+            mod.handle_part(data, ctype, filename, payload)
+        else:
+            mod.handle_part(data, ctype, filename, payload, frequency)
+    except Exception:
+        # Every name used here is imported above, so reporting the failure
+        # cannot itself fail and hide the handler's error.
+        LOG.exception("Failed handling part %s (%s) with %s", filename, ctype, mod)
+        traceback.print_exc(file=sys.stderr)
+
+
+def partwalker_handle_handler(pdata, _ctype, _filename, payload):
+    """Write a part-handler payload out as a module and register it.
+
+    The payload is saved in pdata['handlerdir'] as part-handler-NNN.py
+    (NNN being pdata['handlercount']), imported under that module name
+    and registered.  Import or registration errors are logged and leave
+    pdata['handlercount'] unchanged.
+    """
+    curcount = pdata['handlercount']
+    modname = 'part-handler-%03d' % curcount
+    frequency = pdata['frequency']
+
+    modfname = modname + ".py"
+    util.write_file(os.path.join(pdata['handlerdir'], modfname), payload, 0o600)
+
+    try:
+        mod = importer.import_module(modname)
+        handler_register(mod, pdata['handlers'], pdata['data'], frequency)
+        pdata['handlercount'] = curcount + 1
+    except Exception:
+        LOG.exception("Could not import module %s", modname)
+
+
+def partwalker_callback(pdata, ctype, filename, payload):
+    """Route one user-data part to the handler registered for ctype.
+
+    "text/part-handler" parts are installed as new handlers.  A part
+    whose type has no handler is dropped; for "text/x-not-multipart"
+    a warning showing the start of the payload is logged first.
+    """
+    # data here is the part_handlers array and then the data to pass through
+    if ctype == "text/part-handler":
+        if 'handlercount' not in pdata:
+            pdata['handlercount'] = 0
+        partwalker_handle_handler(pdata, ctype, filename, payload)
+        return
+    if ctype not in pdata['handlers']:
+        if ctype == "text/x-not-multipart":
+            # Extract the first line or 24 bytes for displaying in the log
+            start = payload.split("\n", 1)[0][:24]
+            # start is always a prefix of payload, so being shorter means
+            # that part of the payload was left out.
+            if len(start) < len(payload):
+                details = "starting '%s...'" % start.encode("string-escape")
+            else:
+                details = repr(payload)
+            LOG.warning("Unhandled non-multipart userdata %s", details)
+        return
+    handler_handle_part(pdata['handlers'][ctype], pdata['data'],
+        ctype, filename, payload, pdata['frequency'])

From 7f4fb74d0651f9c65824e30372c265a3cb2474c3 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 12:48:48 -0700
Subject: [PATCH 005/434] Add a file that just deals with url like functions

---
 cloudinit/url_helper.py | 147 ++++++++++++++++++++++++++++++++++++++++
 1 file changed, 147 insertions(+)
 create mode 100644 cloudinit/url_helper.py

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
new file mode 100644
index 00000000..0f0a9d0c
--- /dev/null
+++ b/cloudinit/url_helper.py
@@ -0,0 +1,147 @@
+import errno
+import httplib
+import time
+import urllib
+import urllib2
+
+from StringIO import StringIO
+
+from contextlib import closing
+
+from cloudinit import log as logging
+from cloudinit import shell as sh
+
+LOG = logging.getLogger(__name__)
+
+
+def ok_http_code(st):
+    return 200 <= st < 400  # success (2xx) and redirect (3xx) codes are ok
+
+
+def readurl(url, data=None, timeout=None, retries=0, sec_between=1, read_cb=None, headers=None):
+    """Read url (POSTing data if set), retrying; return (body, status code)."""
+    openargs = {}
+    if timeout is not None:
+        openargs['timeout'] = int(timeout)
+    # urllib2.Request iterates headers.items(), so None must become a dict.
+    req_args = {'headers': headers or {}}
+    if data is not None:
+        req_args['data'] = urllib.urlencode(data)
+    req = urllib2.Request(url, **req_args)
+    attempts = max(retries, 1)
+
+    last_excp = None
+    LOG.debug("Attempting to read from %s with %s attempts to be performed", url, attempts)
+    for i in range(0, attempts):
+        try:
+            with closing(urllib2.urlopen(req, **openargs)) as rh:
+                ofh = StringIO()
+                sh.pipe_in_out(rh, ofh, chunk_cb=read_cb)
+                return (ofh.getvalue(), rh.getcode())
+        except urllib2.HTTPError as e:
+            last_excp = e
+            LOG.exception("Failed at reading from %s.", url)
+        except urllib2.URLError as e:
+            # This can be a message string or
+            # another exception instance (socket.error for remote URLs, OSError for local URLs).
+            if (isinstance(e.reason, OSError) and
+                e.reason.errno == errno.ENOENT):
+                last_excp = e.reason
+            else:
+                last_excp = e
+            LOG.exception("Failed at reading from %s.", url)
+        if i + 1 < attempts:
+            LOG.debug("Please wait %s seconds while we wait to try again.", sec_between)
+            time.sleep(sec_between)
+
+    # Every attempt failed: re-raise the last error seen
+    LOG.warn("Failed downloading from %s after %s attempts", url, i + 1)
+    if last_excp is not None:
+        raise last_excp
+
+
+def wait_for_url(urls, max_wait=None, timeout=None,
+                 status_cb=None, headers_cb=None, sleep_time=1):
+    """
+    urls:      a list of urls to try
+    max_wait:  roughly the maximum time to wait before giving up
+               The max time is *actually* len(urls)*timeout as each url will
+               be tried once and given the timeout provided.
+               None or <= 0 means each url is tried exactly once.
+    timeout:   the timeout provided to urllib2.urlopen
+    status_cb: call method with string message when a url is not available
+    headers_cb: call method with single argument of url to get headers
+                for request.
+    sleep_time: currently unused; the pause between passes is computed.
+
+    Returns the first url that answered with a non-empty body and an ok
+    status code, or False if none did before time ran out.
+
+    the idea of this routine is to wait for the EC2 metadata service to
+    come up.  On both Eucalyptus and EC2 we have seen the case where
+    the instance hit the MD before the MD service was up.  EC2 seems
+    to have permanently fixed this, though.
+
+    In openstack, the metadata service might be painfully slow, and
+    unable to avoid hitting a timeout of even up to 10 seconds or more
+    (LP: #894279) for a simple GET.
+
+    Offset those needs with the need to not hang forever (and block boot)
+    on a system where cloud-init is configured to look for EC2 Metadata
+    service but is not going to find one.  It is possible that the instance
+    data host (169.254.169.254) may be firewalled off entirely for a system,
+    meaning that the connection will block forever unless a timeout is set.
+    """
+    # Imported here because this module does not import socket at file level.
+    import socket
+
+    starttime = time.time()
+    if status_cb is None:
+        status_cb = lambda msg: None
+
+    def timeup(max_wait, starttime):
+        return ((max_wait is None or max_wait <= 0) or
+                (time.time() - starttime > max_wait))
+
+    loop_n = 0
+    while True:
+        sleeptime = int(loop_n / 5) + 1
+        for url in urls:
+            now = time.time()
+            if loop_n != 0:
+                if timeup(max_wait, starttime):
+                    break
+                if timeout and (now + timeout > (starttime + max_wait)):
+                    # shorten timeout to not run way over max_time
+                    timeout = int((starttime + max_wait) - now)
+
+            reason = ""
+            try:
+                headers = headers_cb(url) if headers_cb is not None else {}
+                (resp, status_code) = readurl(url, headers=headers, timeout=timeout)
+                if not resp:
+                    reason = "empty response [%s]" % status_code
+                elif not ok_http_code(status_code):
+                    reason = "bad status code [%s]" % status_code
+                else:
+                    return url
+            except urllib2.HTTPError as e:
+                reason = "http error [%s]" % e.code
+            except urllib2.URLError as e:
+                reason = "url error [%s]" % e.reason
+            except socket.timeout as e:
+                reason = "socket timeout [%s]" % e
+            except Exception as e:
+                reason = "unexpected error [%s]" % e
+
+            status_cb("'%s' failed [%s/%ss]: %s" %
+                      (url, int(time.time() - starttime), max_wait,
+                       reason))
+
+        if timeup(max_wait, starttime):
+            break
+
+        loop_n = loop_n + 1
+        time.sleep(sleeptime)
+
+    return False

From 8acd6d390033ed76fea8aaf873edfb2f79180268 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 12:49:07 -0700
Subject: [PATCH 006/434] Add in a helper that is useful for running
 pep8/pylint

---
 checks.sh | 53 +++++++++++++++++++++++++++++++++++++++++++++++++++++
 pylintrc  | 42 ++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 95 insertions(+)
 create mode 100755 checks.sh
 create mode 100644 pylintrc

diff --git a/checks.sh b/checks.sh
new file mode 100755
index 00000000..f54cad36
--- /dev/null
+++ b/checks.sh
@@ -0,0 +1,53 @@
+#!/bin/bash
+
+set -u
+
+function find_src {
+  # Print every *.py file under bin/ and cloudinit/ on a single line.
+  echo $(find bin cloudinit -type f -name "*.py")
+}
+
+function run_pep8 {
+  # Run pep8 over the sources; its stdout and stderr both go to pep8.log.
+  echo "Running pep8 ..."
+  files=$(find_src)
+  output_filename="pep8.log"
+  opts="--ignore=E202,E501 --repeat"
+  pep8 ${opts} ${files} > "$output_filename" 2>&1
+  if [ "$?" -ne "0" ]; then
+    echo "Some badness was found!"
+  fi
+  echo "Check '$output_filename' for a full report."
+}
+
+function run_pylint {
+  # Run pylint over the sources, log to pylint.log and report on its status.
+  echo "Running pylint ..."
+  opts="--rcfile=pylintrc --output-format=parseable"
+  files=$(find_src)
+  output_filename="pylint.log"
+  pylint ${opts} ${files} > "$output_filename" 2>&1
+  rc=$?
+  if [ $((rc & 1)) -ne 0 ]; then
+    # pylint --long-help (the exit status is a bit mask of these values)
+    # * 0 if everything went fine
+    # * 1 if a fatal message was issued
+    # * 2 if an error message was issued
+    # * 4 if a warning message was issued
+    # * 8 if a refactor message was issued
+    # * 16 if a convention message was issued
+    # * 32 on usage error
+    echo "A fatal pylint error occurred!"
+  elif [ "$rc" -eq 0 ]; then
+    echo "Your code is perfect you code master!"
+  else
+    echo "You are not yet a code master."
+    grep -i "Your code" $output_filename
+  fi
+  echo "Check '$output_filename' for a full report."
+}
+
+
+run_pep8
+run_pylint
+
diff --git a/pylintrc b/pylintrc
new file mode 100644
index 00000000..a7447a19
--- /dev/null
+++ b/pylintrc
@@ -0,0 +1,42 @@
+# The format of this file isn't really documented; just use --generate-rcfile
+
+[Master]
+
+[Messages Control]
+
+# http://pylint-messages.wikidot.com/all-codes
+# NOTE(justinsb): We might want to have a 2nd strict pylintrc in future
+# C0111: Don't require docstrings on every method
+# R0912: Too many branches (huh)
+# R0914: Too many local variables is odd.
+# W0142: *args and **kwargs are fine.
+# W0511: TODOs in code comments are fine.
+# W0613: Unused argument '??' should be ok (they are useful sometimes to know intention of variable)
+# W0622: Redefining id is fine.
+disable=C0111,W0142,W0622,C0301,R0902,R0201,R0914,W0613,R0912,R0801
+
+[Basic]
+
+# Variable names can be 1 to 31 characters long, with lowercase and underscores
+variable-rgx=[a-z_][a-z0-9_]{0,30}$
+
+# Argument names can be 2 to 31 characters long, with lowercase and underscores
+argument-rgx=[a-z_][a-z0-9_]{1,30}$
+
+# Method names should be at least 3 characters long
+# and be lowercased with underscores
+method-rgx=([a-z_][a-z0-9_]{2,50}|setUp|tearDown)$
+
+# Don't require docstrings on tests.
+no-docstring-rgx=((__.*__)|([tT]est.*)|setUp|tearDown)$
+
+[Design]
+
+max-public-methods=100
+min-public-methods=0
+max-args=6
+
+[Variables]
+
+# List of additional names supposed to be defined in builtins. Remember that
+# you should avoid defining new builtins when possible.

From 88795392e3ff8c79ccb9f0e9b5741cb7be9bc15f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 13:46:54 -0700
Subject: [PATCH 007/434] 1. Move cloud init and cloud config objects to a
 cloud file. 2. Cleanup main __init__ file with shell additions, constants
 usage, os.path usage.

---
 cloudinit/__init__.py         | 618 +++-------------------------------
 cloudinit/sources/__init__.py | 214 ++++++++++++
 2 files changed, 265 insertions(+), 567 deletions(-)

diff --git a/cloudinit/__init__.py b/cloudinit/__init__.py
index 85c6fd1b..f223fbe8 100644
--- a/cloudinit/__init__.py
+++ b/cloudinit/__init__.py
@@ -20,627 +20,111 @@
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 #
 
-varlibdir = '/var/lib/cloud'
-cur_instance_link = varlibdir + "/instance"
-boot_finished = cur_instance_link + "/boot-finished"
-system_config = '/etc/cloud/cloud.cfg'
-seeddir = varlibdir + "/seed"
-cfg_env_name = "CLOUD_CFG"
-
-cfg_builtin = """
-log_cfgs: []
-datasource_list: ["NoCloud", "ConfigDrive", "OVF", "MAAS", "Ec2", "CloudStack"]
-def_log_file: /var/log/cloud-init.log
-syslog_fix_perms: syslog:adm
-"""
-logger_name = "cloudinit"
-
-pathmap = {
-   "handlers": "/handlers",
-   "scripts": "/scripts",
-   "sem": "/sem",
-   "boothooks": "/boothooks",
-   "userdata_raw": "/user-data.txt",
-   "userdata": "/user-data.txt.i",
-   "obj_pkl": "/obj.pkl",
-   "cloud_config": "/cloud-config.txt",
-   "data": "/data",
-   None: "",
-}
-
-per_instance = "once-per-instance"
-per_always = "always"
-per_once = "once"
-
-parsed_cfgs = {}
-
 import os
 
-import cPickle
 import sys
 import os.path
 import errno
 import subprocess
 import yaml
-import logging
-import logging.config
-import StringIO
 import glob
 import traceback
 
+import cloudinit.log as logging
+import cloudinit.shell as sh
 import cloudinit.util as util
 
-
-class NullHandler(logging.Handler):
-    def emit(self, record):
-        pass
-
-
-log = logging.getLogger(logger_name)
-log.addHandler(NullHandler())
-
-
-def logging_set_from_cfg_file(cfg_file=system_config):
-    logging_set_from_cfg(util.get_base_cfg(cfg_file, cfg_builtin, parsed_cfgs))
-
-
-def logging_set_from_cfg(cfg):
-    log_cfgs = []
-    logcfg = util.get_cfg_option_str(cfg, "log_cfg", False)
-    if logcfg:
-        # if there is a 'logcfg' entry in the config, respect
-        # it, it is the old keyname
-        log_cfgs = [logcfg]
-    elif "log_cfgs" in cfg:
-        for cfg in cfg['log_cfgs']:
-            if isinstance(cfg, list):
-                log_cfgs.append('\n'.join(cfg))
-            else:
-                log_cfgs.append()
-
-    if not len(log_cfgs):
-        sys.stderr.write("Warning, no logging configured\n")
-        return
-
-    for logcfg in log_cfgs:
-        try:
-            logging.config.fileConfig(StringIO.StringIO(logcfg))
-            return
-        except:
-            pass
-
-    raise Exception("no valid logging found\n")
-
-
-import cloudinit.DataSource as DataSource
-import cloudinit.UserDataHandler as UserDataHandler
-
-
-class CloudInit:
-    cfg = None
-    part_handlers = {}
-    old_conffile = '/etc/ec2-init/ec2-config.cfg'
-    ds_deps = [DataSource.DEP_FILESYSTEM, DataSource.DEP_NETWORK]
-    datasource = None
-    cloud_config_str = ''
-    datasource_name = ''
-
-    builtin_handlers = []
-
-    def __init__(self, ds_deps=None, sysconfig=system_config):
-        self.builtin_handlers = [
-            ['text/x-shellscript', self.handle_user_script, per_always],
-            ['text/cloud-config', self.handle_cloud_config, per_always],
-            ['text/upstart-job', self.handle_upstart_job, per_instance],
-            ['text/cloud-boothook', self.handle_cloud_boothook, per_always],
-        ]
-
-        if ds_deps != None:
-            self.ds_deps = ds_deps
-
-        self.sysconfig = sysconfig
-
-        self.cfg = self.read_cfg()
-
-    def read_cfg(self):
-        if self.cfg:
-            return(self.cfg)
-
-        try:
-            conf = util.get_base_cfg(self.sysconfig, cfg_builtin, parsed_cfgs)
-        except Exception:
-            conf = get_builtin_cfg()
-
-        # support reading the old ConfigObj format file and merging
-        # it into the yaml dictionary
-        try:
-            from configobj import ConfigObj
-            oldcfg = ConfigObj(self.old_conffile)
-            if oldcfg is None:
-                oldcfg = {}
-            conf = util.mergedict(conf, oldcfg)
-        except:
-            pass
-
-        return(conf)
-
-    def restore_from_cache(self):
-        try:
-            # we try to restore from a current link and static path
-            # by using the instance link, if purge_cache was called
-            # the file wont exist
-            cache = get_ipath_cur('obj_pkl')
-            f = open(cache, "rb")
-            data = cPickle.load(f)
-            f.close()
-            self.datasource = data
-            return True
-        except:
-            return False
-
-    def write_to_cache(self):
-        cache = self.get_ipath("obj_pkl")
-        try:
-            os.makedirs(os.path.dirname(cache))
-        except OSError as e:
-            if e.errno != errno.EEXIST:
-                return False
-
-        try:
-            f = open(cache, "wb")
-            cPickle.dump(self.datasource, f)
-            f.close()
-            os.chmod(cache, 0400)
-        except:
-            raise
-
-    def get_data_source(self):
-        if self.datasource is not None:
-            return True
-
-        if self.restore_from_cache():
-            log.debug("restored from cache type %s" % self.datasource)
-            return True
-
-        cfglist = self.cfg['datasource_list']
-        dslist = list_sources(cfglist, self.ds_deps)
-        dsnames = [f.__name__ for f in dslist]
-
-        log.debug("searching for data source in %s" % dsnames)
-        for cls in dslist:
-            ds = cls.__name__
-            try:
-                s = cls(sys_cfg=self.cfg)
-                if s.get_data():
-                    self.datasource = s
-                    self.datasource_name = ds
-                    log.debug("found data source %s" % ds)
-                    return True
-            except Exception as e:
-                log.warn("get_data of %s raised %s" % (ds, e))
-                util.logexc(log)
-        msg = "Did not find data source. searched classes: %s" % dsnames
-        log.debug(msg)
-        raise DataSourceNotFoundException(msg)
-
-    def set_cur_instance(self):
-        try:
-            os.unlink(cur_instance_link)
-        except OSError as e:
-            if e.errno != errno.ENOENT:
-                raise
-
-        iid = self.get_instance_id()
-        os.symlink("./instances/%s" % iid, cur_instance_link)
-        idir = self.get_ipath()
-        dlist = []
-        for d in ["handlers", "scripts", "sem"]:
-            dlist.append("%s/%s" % (idir, d))
-
-        util.ensure_dirs(dlist)
-
-        ds = "%s: %s\n" % (self.datasource.__class__, str(self.datasource))
-        dp = self.get_cpath('data')
-        util.write_file("%s/%s" % (idir, 'datasource'), ds)
-        util.write_file("%s/%s" % (dp, 'previous-datasource'), ds)
-        util.write_file("%s/%s" % (dp, 'previous-instance-id'), "%s\n" % iid)
-
-    def get_userdata(self):
-        return(self.datasource.get_userdata())
-
-    def get_userdata_raw(self):
-        return(self.datasource.get_userdata_raw())
-
-    def get_instance_id(self):
-        return(self.datasource.get_instance_id())
-
-    def update_cache(self):
-        self.write_to_cache()
-        self.store_userdata()
-
-    def store_userdata(self):
-        util.write_file(self.get_ipath('userdata_raw'),
-            self.datasource.get_userdata_raw(), 0600)
-        util.write_file(self.get_ipath('userdata'),
-            self.datasource.get_userdata(), 0600)
-
-    def sem_getpath(self, name, freq):
-        if freq == 'once-per-instance':
-            return("%s/%s" % (self.get_ipath("sem"), name))
-        return("%s/%s.%s" % (get_cpath("sem"), name, freq))
-
-    def sem_has_run(self, name, freq):
-        if freq == per_always:
-            return False
-        semfile = self.sem_getpath(name, freq)
-        if os.path.exists(semfile):
-            return True
-        return False
-
-    def sem_acquire(self, name, freq):
-        from time import time
-        semfile = self.sem_getpath(name, freq)
-
-        try:
-            os.makedirs(os.path.dirname(semfile))
-        except OSError as e:
-            if e.errno != errno.EEXIST:
-                raise e
-
-        if os.path.exists(semfile) and freq != per_always:
-            return False
-
-        # race condition
-        try:
-            f = open(semfile, "w")
-            f.write("%s\n" % str(time()))
-            f.close()
-        except:
-            return(False)
-        return(True)
-
-    def sem_clear(self, name, freq):
-        semfile = self.sem_getpath(name, freq)
-        try:
-            os.unlink(semfile)
-        except OSError as e:
-            if e.errno != errno.ENOENT:
-                return False
-
-        return True
-
-    # acquire lock on 'name' for given 'freq'
-    # if that does not exist, then call 'func' with given 'args'
-    # if 'clear_on_fail' is True and func throws an exception
-    #  then remove the lock (so it would run again)
-    def sem_and_run(self, semname, freq, func, args=None, clear_on_fail=False):
-        if args is None:
-            args = []
-        if self.sem_has_run(semname, freq):
-            log.debug("%s already ran %s", semname, freq)
-            return False
-        try:
-            if not self.sem_acquire(semname, freq):
-                raise Exception("Failed to acquire lock on %s" % semname)
-
-            func(*args)
-        except:
-            if clear_on_fail:
-                self.sem_clear(semname, freq)
-            raise
-
-        return True
-
-    # get_ipath : get the instance path for a name in pathmap
-    # (/var/lib/cloud/instances/<instance>/name)<name>)
-    def get_ipath(self, name=None):
-        return("%s/instances/%s%s"
-               % (varlibdir, self.get_instance_id(), pathmap[name]))
-
-    def consume_userdata(self, frequency=per_instance):
-        self.get_userdata()
-        data = self
-
-        cdir = get_cpath("handlers")
-        idir = self.get_ipath("handlers")
-
-        # add the path to the plugins dir to the top of our list for import
-        # instance dir should be read before cloud-dir
-        sys.path.insert(0, cdir)
-        sys.path.insert(0, idir)
-
-        part_handlers = {}
-        # add handlers in cdir
-        for fname in glob.glob("%s/*.py" % cdir):
-            if not os.path.isfile(fname):
-                continue
-            modname = os.path.basename(fname)[0:-3]
-            try:
-                mod = __import__(modname)
-                handler_register(mod, part_handlers, data, frequency)
-                log.debug("added handler for [%s] from %s" % (mod.list_types(),
-                                                              fname))
-            except:
-                log.warn("failed to initialize handler in %s" % fname)
-                util.logexc(log)
-
-        # add the internal handers if their type hasn't been already claimed
-        for (btype, bhand, bfreq) in self.builtin_handlers:
-            if btype in part_handlers:
-                continue
-            handler_register(InternalPartHandler(bhand, [btype], bfreq),
-                part_handlers, data, frequency)
-
-        # walk the data
-        pdata = {'handlers': part_handlers, 'handlerdir': idir,
-                 'data': data, 'frequency': frequency}
-        UserDataHandler.walk_userdata(self.get_userdata(),
-            partwalker_callback, data=pdata)
-
-        # give callbacks opportunity to finalize
-        called = []
-        for (_mtype, mod) in part_handlers.iteritems():
-            if mod in called:
-                continue
-            handler_call_end(mod, data, frequency)
-
-    def handle_user_script(self, _data, ctype, filename, payload, _frequency):
-        if ctype == "__end__":
-            return
-        if ctype == "__begin__":
-            # maybe delete existing things here
-            return
-
-        filename = filename.replace(os.sep, '_')
-        scriptsdir = get_ipath_cur('scripts')
-        util.write_file("%s/%s" %
-            (scriptsdir, filename), util.dos2unix(payload), 0700)
-
-    def handle_upstart_job(self, _data, ctype, filename, payload, frequency):
-        # upstart jobs are only written on the first boot
-        if frequency != per_instance:
-            return
-
-        if ctype == "__end__" or ctype == "__begin__":
-            return
-        if not filename.endswith(".conf"):
-            filename = filename + ".conf"
-
-        util.write_file("%s/%s" % ("/etc/init", filename),
-            util.dos2unix(payload), 0644)
-
-    def handle_cloud_config(self, _data, ctype, filename, payload, _frequency):
-        if ctype == "__begin__":
-            self.cloud_config_str = ""
-            return
-        if ctype == "__end__":
-            cloud_config = self.get_ipath("cloud_config")
-            util.write_file(cloud_config, self.cloud_config_str, 0600)
-
-            ## this could merge the cloud config with the system config
-            ## for now, not doing this as it seems somewhat circular
-            ## as CloudConfig does that also, merging it with this cfg
-            ##
-            # ccfg = yaml.load(self.cloud_config_str)
-            # if ccfg is None: ccfg = {}
-            # self.cfg = util.mergedict(ccfg, self.cfg)
-
-            return
-
-        self.cloud_config_str += "\n#%s\n%s" % (filename, payload)
-
-    def handle_cloud_boothook(self, _data, ctype, filename, payload,
-                              _frequency):
-        if ctype == "__end__":
-            return
-        if ctype == "__begin__":
-            return
-
-        filename = filename.replace(os.sep, '_')
-        payload = util.dos2unix(payload)
-        prefix = "#cloud-boothook"
-        start = 0
-        if payload.startswith(prefix):
-            start = len(prefix) + 1
-
-        boothooks_dir = self.get_ipath("boothooks")
-        filepath = "%s/%s" % (boothooks_dir, filename)
-        util.write_file(filepath, payload[start:], 0700)
-        try:
-            env = os.environ.copy()
-            env['INSTANCE_ID'] = self.datasource.get_instance_id()
-            subprocess.check_call([filepath], env=env)
-        except subprocess.CalledProcessError as e:
-            log.error("boothooks script %s returned %i" %
-                (filepath, e.returncode))
-        except Exception as e:
-            log.error("boothooks unknown exception %s when running %s" %
-                (e, filepath))
-
-    def get_public_ssh_keys(self):
-        return(self.datasource.get_public_ssh_keys())
-
-    def get_locale(self):
-        return(self.datasource.get_locale())
-
-    def get_mirror(self):
-        return(self.datasource.get_local_mirror())
-
-    def get_hostname(self, fqdn=False):
-        return(self.datasource.get_hostname(fqdn=fqdn))
-
-    def device_name_to_device(self, name):
-        return(self.datasource.device_name_to_device(name))
-
-    # I really don't know if this should be here or not, but
-    # I needed it in cc_update_hostname, where that code had a valid 'cloud'
-    # reference, but did not have a cloudinit handle
-    # (ie, no cloudinit.get_cpath())
-    def get_cpath(self, name=None):
-        return(get_cpath(name))
+from cloudinit.constants import (VAR_LIB_DIR, CFG_BUILTIN, CLOUD_CONFIG,
+                                 BOOT_FINISHED, CUR_INSTANCE_LINK, PATH_MAP)
+
+LOG = logging.getLogger(__name__)
+
+INIT_SUBDIRS = [
+    'scripts',
+    os.path.join('scripts', 'per-instance'),
+    os.path.join('scripts', 'per-once'),
+    os.path.join('scripts', 'per-boot'),
+    'seed',
+    'instances',
+    'handlers',
+    'sem',
+    'data'
+]
+
+
+# TODO: get rid of this global
+parsed_cfgs = {}
 
 
 def initfs():
-    subds = ['scripts/per-instance', 'scripts/per-once', 'scripts/per-boot',
-             'seed', 'instances', 'handlers', 'sem', 'data']
-    dlist = []
-    for subd in subds:
-        dlist.append("%s/%s" % (varlibdir, subd))
-    util.ensure_dirs(dlist)
 
-    cfg = util.get_base_cfg(system_config, cfg_builtin, parsed_cfgs)
+    # TODO don't do this every time this function is called?
+    dlist = []
+    for subd in INIT_SUBDIRS:
+        dlist.append(os.path.join(VAR_LIB_DIR, subd))
+    sh.ensure_dirs(dlist)
+
+    cfg = util.get_base_cfg(CLOUD_CONFIG, get_builtin_cfg(), parsed_cfgs)
     log_file = util.get_cfg_option_str(cfg, 'def_log_file', None)
     perms = util.get_cfg_option_str(cfg, 'syslog_fix_perms', None)
     if log_file:
-        fp = open(log_file, "ab")
-        fp.close()
+        sh.ensure_file(log_file)
     if log_file and perms:
         (u, g) = perms.split(':', 1)
         if u == "-1" or u == "None":
             u = None
         if g == "-1" or g == "None":
             g = None
-        util.chownbyname(log_file, u, g)
+        sh.chownbyname(log_file, u, g)
 
 
 def purge_cache(rmcur=True):
-    rmlist = [boot_finished]
+    rmlist = [BOOT_FINISHED]
     if rmcur:
-        rmlist.append(cur_instance_link)
+        rmlist.append(CUR_INSTANCE_LINK)
     for f in rmlist:
         try:
-            os.unlink(f)
+            sh.unlink(f)
         except OSError as e:
             if e.errno == errno.ENOENT:
                 continue
-            return(False)
+            return False
         except:
-            return(False)
-    return(True)
+            return False
+    return True
 
 
 # get_ipath_cur: get the current instance path for an item
 def get_ipath_cur(name=None):
-    return("%s/%s%s" % (varlibdir, "instance", pathmap[name]))
+    add_on = PATH_MAP.get(name)
+    ipath = os.path.join(VAR_LIB_DIR, 'instance')
+    if add_on:
+        ipath = os.path.join(ipath, add_on)
+    return ipath
 
 
 # get_cpath : get the "clouddir" (/var/lib/cloud/<name>)
 # for a name in dirmap
 def get_cpath(name=None):
-    return("%s%s" % (varlibdir, pathmap[name]))
+    cpath = VAR_LIB_DIR
+    add_on = PATH_MAP.get(name)
+    if add_on:
+        cpath = os.path.join(cpath, add_on)
+    return cpath
 
 
 def get_base_cfg(cfg_path=None):
     if cfg_path is None:
-        cfg_path = system_config
-    return(util.get_base_cfg(cfg_path, cfg_builtin, parsed_cfgs))
+        cfg_path = CLOUD_CONFIG
+    return util.get_base_cfg(cfg_path, get_builtin_cfg(), parsed_cfgs)
 
 
 def get_builtin_cfg():
-    return(yaml.load(cfg_builtin))
-
-
-class DataSourceNotFoundException(Exception):
-    pass
+    return dict(CFG_BUILTIN)
 
 
 def list_sources(cfg_list, depends):
-    return(DataSource.list_sources(cfg_list, depends, ["cloudinit", ""]))
-
-
-def handler_register(mod, part_handlers, data, frequency=per_instance):
-    if not hasattr(mod, "handler_version"):
-        setattr(mod, "handler_version", 1)
-
-    for mtype in mod.list_types():
-        part_handlers[mtype] = mod
-
-    handler_call_begin(mod, data, frequency)
-    return(mod)
-
-
-def handler_call_begin(mod, data, frequency):
-    handler_handle_part(mod, data, "__begin__", None, None, frequency)
-
-
-def handler_call_end(mod, data, frequency):
-    handler_handle_part(mod, data, "__end__", None, None, frequency)
-
-
-def handler_handle_part(mod, data, ctype, filename, payload, frequency):
-    # only add the handler if the module should run
-    modfreq = getattr(mod, "frequency", per_instance)
-    if not (modfreq == per_always or
-            (frequency == per_instance and modfreq == per_instance)):
-        return
-    try:
-        if mod.handler_version == 1:
-            mod.handle_part(data, ctype, filename, payload)
-        else:
-            mod.handle_part(data, ctype, filename, payload, frequency)
-    except:
-        util.logexc(log)
-        traceback.print_exc(file=sys.stderr)
-
-
-def partwalker_handle_handler(pdata, _ctype, _filename, payload):
-    curcount = pdata['handlercount']
-    modname = 'part-handler-%03d' % curcount
-    frequency = pdata['frequency']
-
-    modfname = modname + ".py"
-    util.write_file("%s/%s" % (pdata['handlerdir'], modfname), payload, 0600)
-
-    try:
-        mod = __import__(modname)
-        handler_register(mod, pdata['handlers'], pdata['data'], frequency)
-        pdata['handlercount'] = curcount + 1
-    except:
-        util.logexc(log)
-        traceback.print_exc(file=sys.stderr)
-
-
-def partwalker_callback(pdata, ctype, filename, payload):
-    # data here is the part_handlers array and then the data to pass through
-    if ctype == "text/part-handler":
-        if 'handlercount' not in pdata:
-            pdata['handlercount'] = 0
-        partwalker_handle_handler(pdata, ctype, filename, payload)
-        return
-    if ctype not in pdata['handlers']:
-        if ctype == "text/x-not-multipart":
-            # Extract the first line or 24 bytes for displaying in the log
-            start = payload.split("\n", 1)[0][:24]
-            if start < payload:
-                details = "starting '%s...'" % start.encode("string-escape")
-            else:
-                details = repr(payload)
-            log.warning("Unhandled non-multipart userdata %s", details)
-        return
-    handler_handle_part(pdata['handlers'][ctype], pdata['data'],
-        ctype, filename, payload, pdata['frequency'])
-
-
-class InternalPartHandler:
-    freq = per_instance
-    mtypes = []
-    handler_version = 1
-    handler = None
-
-    def __init__(self, handler, mtypes, frequency, version=2):
-        self.handler = handler
-        self.mtypes = mtypes
-        self.frequency = frequency
-        self.handler_version = version
-
-    def __repr__(self):
-        return("InternalPartHandler: [%s]" % self.mtypes)
-
-    def list_types(self):
-        return(self.mtypes)
-
-    def handle_part(self, data, ctype, filename, payload, frequency):
-        return(self.handler(data, ctype, filename, payload, frequency))
+    return (DataSource.list_sources(cfg_list, depends, ["cloudinit", ""]))
 
 
 def get_cmdline_url(names=('cloud-config-url', 'url'),
diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index e69de29b..e2a9150d 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -0,0 +1,214 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2009-2010 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Hafliger <juerg.haefliger@hp.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+
+DEP_FILESYSTEM = "FILESYSTEM"
+DEP_NETWORK = "NETWORK"
+
+import cloudinit.UserDataHandler as ud
+import cloudinit.util as util
+import socket
+
+
+class DataSource:
+    userdata = None
+    metadata = None
+    userdata_raw = None
+    cfgname = ""
+    # system config (passed in from cloudinit,
+    # cloud-config before input from the DataSource)
+    sys_cfg = {}
+    # datasource config, the cloud-config['datasource']['__name__']
+    ds_cfg = {}  # datasource config
+
+    def __init__(self, sys_cfg=None):
+        if not self.cfgname:
+            name = str(self.__class__).split(".")[-1]
+            if name.startswith("DataSource"):
+                name = name[len("DataSource"):]
+            self.cfgname = name
+        if sys_cfg:
+            self.sys_cfg = sys_cfg
+
+        self.ds_cfg = util.get_cfg_by_path(self.sys_cfg,
+                          ("datasource", self.cfgname), self.ds_cfg)
+
+    def get_userdata(self):
+        if self.userdata == None:
+            self.userdata = ud.preprocess_userdata(self.userdata_raw)
+        return self.userdata
+
+    def get_userdata_raw(self):
+        return(self.userdata_raw)
+
+    # the data sources' config_obj is a cloud-config formated
+    # object that came to it from ways other than cloud-config
+    # because cloud-config content would be handled elsewhere
+    def get_config_obj(self):
+        return({})
+
+    def get_public_ssh_keys(self):
+        keys = []
+        if 'public-keys' not in self.metadata:
+            return([])
+
+        if isinstance(self.metadata['public-keys'], str):
+            return(str(self.metadata['public-keys']).splitlines())
+
+        if isinstance(self.metadata['public-keys'], list):
+            return(self.metadata['public-keys'])
+
+        for _keyname, klist in self.metadata['public-keys'].items():
+            # lp:506332 uec metadata service responds with
+            # data that makes boto populate a string for 'klist' rather
+            # than a list.
+            if isinstance(klist, str):
+                klist = [klist]
+            for pkey in klist:
+                # there is an empty string at the end of the keylist, trim it
+                if pkey:
+                    keys.append(pkey)
+
+        return(keys)
+
+    def device_name_to_device(self, _name):
+        # translate a 'name' to a device
+        # the primary function at this point is on ec2
+        # to consult metadata service, that has
+        #  ephemeral0: sdb
+        # and return 'sdb' for input 'ephemeral0'
+        return(None)
+
+    def get_locale(self):
+        return('en_US.UTF-8')
+
+    def get_local_mirror(self):
+        return None
+
+    def get_instance_id(self):
+        if 'instance-id' not in self.metadata:
+            return "iid-datasource"
+        return(self.metadata['instance-id'])
+
+    def get_hostname(self, fqdn=False):
+        defdomain = "localdomain"
+        defhost = "localhost"
+
+        domain = defdomain
+        if not 'local-hostname' in self.metadata:
+
+            # this is somewhat questionable really.
+            # the cloud datasource was asked for a hostname
+            # and didn't have one. raising error might be more appropriate
+            # but instead, basically look up the existing hostname
+            toks = []
+
+            hostname = socket.gethostname()
+
+            fqdn = util.get_fqdn_from_hosts(hostname)
+
+            if fqdn and fqdn.find(".") > 0:
+                toks = str(fqdn).split(".")
+            elif hostname:
+                toks = [hostname, defdomain]
+            else:
+                toks = [defhost, defdomain]
+
+        else:
+            # if there is an ipv4 address in 'local-hostname', then
+            # make up a hostname (LP: #475354) in format ip-xx.xx.xx.xx
+            lhost = self.metadata['local-hostname']
+            if is_ipv4(lhost):
+                toks = "ip-%s" % lhost.replace(".", "-")
+            else:
+                toks = lhost.split(".")
+
+        if len(toks) > 1:
+            hostname = toks[0]
+            domain = '.'.join(toks[1:])
+        else:
+            hostname = toks[0]
+
+        if fqdn:
+            return "%s.%s" % (hostname, domain)
+        else:
+            return hostname
+
+
+# return a list of classes that have the same depends as 'depends'
+# iterate through cfg_list, loading "DataSourceCollections" modules
+# and calling their "get_datasource_list".
+# return an ordered list of classes that match
+#
+# - modules must be named "DataSource<item>", where 'item' is an entry
+#   in cfg_list
+# - if pkglist is given, it will iterate try loading from that package
+#   ie, pkglist=[ "foo", "" ]
+#     will first try to load foo.DataSource<item>
+#     then DataSource<item>
+def list_sources(cfg_list, depends, pkglist=None):
+    if pkglist is None:
+        pkglist = []
+    retlist = []
+    for ds_coll in cfg_list:
+        for pkg in pkglist:
+            if pkg:
+                pkg = "%s." % pkg
+            try:
+                mod = __import__("%sDataSource%s" % (pkg, ds_coll))
+                if pkg:
+                    mod = getattr(mod, "DataSource%s" % ds_coll)
+                lister = getattr(mod, "get_datasource_list")
+                retlist.extend(lister(depends))
+                break
+            except:
+                raise
+    return(retlist)
+
+
+# depends is a list of dependencies (DEP_FILESYSTEM)
+# dslist is a list of 2 item lists
+# dslist = [
+#   ( class, ( depends-that-this-class-needs ) )
+# }
+# it returns a list of 'class' that matched these deps exactly
+# it is a helper function for DataSourceCollections
+def list_from_depends(depends, dslist):
+    retlist = []
+    depset = set(depends)
+    for elem in dslist:
+        (cls, deps) = elem
+        if depset == set(deps):
+            retlist.append(cls)
+    return(retlist)
+
+
+def is_ipv4(instr):
+    """ determine if input string is a ipv4 address. return boolean"""
+    toks = instr.split('.')
+    if len(toks) != 4:
+        return False
+
+    try:
+        toks = [x for x in toks if (int(x) < 256 and int(x) > 0)]
+    except:
+        return False
+
+    return (len(toks) == 4)

From dad3bab2f79d99d3ec71ab8a5df200bafab608c0 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 13:47:47 -0700
Subject: [PATCH 008/434] Move the contents of this file to __init__ in
 sources.

---
 cloudinit/sources/DataSource.py | 214 --------------------------------
 1 file changed, 214 deletions(-)
 delete mode 100644 cloudinit/sources/DataSource.py

diff --git a/cloudinit/sources/DataSource.py b/cloudinit/sources/DataSource.py
deleted file mode 100644
index e2a9150d..00000000
--- a/cloudinit/sources/DataSource.py
+++ /dev/null
@@ -1,214 +0,0 @@
-# vi: ts=4 expandtab
-#
-#    Copyright (C) 2009-2010 Canonical Ltd.
-#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
-#
-#    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Hafliger <juerg.haefliger@hp.com>
-#
-#    This program is free software: you can redistribute it and/or modify
-#    it under the terms of the GNU General Public License version 3, as
-#    published by the Free Software Foundation.
-#
-#    This program is distributed in the hope that it will be useful,
-#    but WITHOUT ANY WARRANTY; without even the implied warranty of
-#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-#    GNU General Public License for more details.
-#
-#    You should have received a copy of the GNU General Public License
-#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-
-DEP_FILESYSTEM = "FILESYSTEM"
-DEP_NETWORK = "NETWORK"
-
-import cloudinit.UserDataHandler as ud
-import cloudinit.util as util
-import socket
-
-
-class DataSource:
-    userdata = None
-    metadata = None
-    userdata_raw = None
-    cfgname = ""
-    # system config (passed in from cloudinit,
-    # cloud-config before input from the DataSource)
-    sys_cfg = {}
-    # datasource config, the cloud-config['datasource']['__name__']
-    ds_cfg = {}  # datasource config
-
-    def __init__(self, sys_cfg=None):
-        if not self.cfgname:
-            name = str(self.__class__).split(".")[-1]
-            if name.startswith("DataSource"):
-                name = name[len("DataSource"):]
-            self.cfgname = name
-        if sys_cfg:
-            self.sys_cfg = sys_cfg
-
-        self.ds_cfg = util.get_cfg_by_path(self.sys_cfg,
-                          ("datasource", self.cfgname), self.ds_cfg)
-
-    def get_userdata(self):
-        if self.userdata == None:
-            self.userdata = ud.preprocess_userdata(self.userdata_raw)
-        return self.userdata
-
-    def get_userdata_raw(self):
-        return(self.userdata_raw)
-
-    # the data sources' config_obj is a cloud-config formated
-    # object that came to it from ways other than cloud-config
-    # because cloud-config content would be handled elsewhere
-    def get_config_obj(self):
-        return({})
-
-    def get_public_ssh_keys(self):
-        keys = []
-        if 'public-keys' not in self.metadata:
-            return([])
-
-        if isinstance(self.metadata['public-keys'], str):
-            return(str(self.metadata['public-keys']).splitlines())
-
-        if isinstance(self.metadata['public-keys'], list):
-            return(self.metadata['public-keys'])
-
-        for _keyname, klist in self.metadata['public-keys'].items():
-            # lp:506332 uec metadata service responds with
-            # data that makes boto populate a string for 'klist' rather
-            # than a list.
-            if isinstance(klist, str):
-                klist = [klist]
-            for pkey in klist:
-                # there is an empty string at the end of the keylist, trim it
-                if pkey:
-                    keys.append(pkey)
-
-        return(keys)
-
-    def device_name_to_device(self, _name):
-        # translate a 'name' to a device
-        # the primary function at this point is on ec2
-        # to consult metadata service, that has
-        #  ephemeral0: sdb
-        # and return 'sdb' for input 'ephemeral0'
-        return(None)
-
-    def get_locale(self):
-        return('en_US.UTF-8')
-
-    def get_local_mirror(self):
-        return None
-
-    def get_instance_id(self):
-        if 'instance-id' not in self.metadata:
-            return "iid-datasource"
-        return(self.metadata['instance-id'])
-
-    def get_hostname(self, fqdn=False):
-        defdomain = "localdomain"
-        defhost = "localhost"
-
-        domain = defdomain
-        if not 'local-hostname' in self.metadata:
-
-            # this is somewhat questionable really.
-            # the cloud datasource was asked for a hostname
-            # and didn't have one. raising error might be more appropriate
-            # but instead, basically look up the existing hostname
-            toks = []
-
-            hostname = socket.gethostname()
-
-            fqdn = util.get_fqdn_from_hosts(hostname)
-
-            if fqdn and fqdn.find(".") > 0:
-                toks = str(fqdn).split(".")
-            elif hostname:
-                toks = [hostname, defdomain]
-            else:
-                toks = [defhost, defdomain]
-
-        else:
-            # if there is an ipv4 address in 'local-hostname', then
-            # make up a hostname (LP: #475354) in format ip-xx.xx.xx.xx
-            lhost = self.metadata['local-hostname']
-            if is_ipv4(lhost):
-                toks = "ip-%s" % lhost.replace(".", "-")
-            else:
-                toks = lhost.split(".")
-
-        if len(toks) > 1:
-            hostname = toks[0]
-            domain = '.'.join(toks[1:])
-        else:
-            hostname = toks[0]
-
-        if fqdn:
-            return "%s.%s" % (hostname, domain)
-        else:
-            return hostname
-
-
-# return a list of classes that have the same depends as 'depends'
-# iterate through cfg_list, loading "DataSourceCollections" modules
-# and calling their "get_datasource_list".
-# return an ordered list of classes that match
-#
-# - modules must be named "DataSource<item>", where 'item' is an entry
-#   in cfg_list
-# - if pkglist is given, it will iterate try loading from that package
-#   ie, pkglist=[ "foo", "" ]
-#     will first try to load foo.DataSource<item>
-#     then DataSource<item>
-def list_sources(cfg_list, depends, pkglist=None):
-    if pkglist is None:
-        pkglist = []
-    retlist = []
-    for ds_coll in cfg_list:
-        for pkg in pkglist:
-            if pkg:
-                pkg = "%s." % pkg
-            try:
-                mod = __import__("%sDataSource%s" % (pkg, ds_coll))
-                if pkg:
-                    mod = getattr(mod, "DataSource%s" % ds_coll)
-                lister = getattr(mod, "get_datasource_list")
-                retlist.extend(lister(depends))
-                break
-            except:
-                raise
-    return(retlist)
-
-
-# depends is a list of dependencies (DEP_FILESYSTEM)
-# dslist is a list of 2 item lists
-# dslist = [
-#   ( class, ( depends-that-this-class-needs ) )
-# }
-# it returns a list of 'class' that matched these deps exactly
-# it is a helper function for DataSourceCollections
-def list_from_depends(depends, dslist):
-    retlist = []
-    depset = set(depends)
-    for elem in dslist:
-        (cls, deps) = elem
-        if depset == set(deps):
-            retlist.append(cls)
-    return(retlist)
-
-
-def is_ipv4(instr):
-    """ determine if input string is a ipv4 address. return boolean"""
-    toks = instr.split('.')
-    if len(toks) != 4:
-        return False
-
-    try:
-        toks = [x for x in toks if (int(x) < 256 and int(x) > 0)]
-    except:
-        return False
-
-    return (len(toks) == 4)

From b8c07e662287361b363a3331776620c8f390eb23 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 13:48:30 -0700
Subject: [PATCH 009/434] Start moving code from there to here.

---
 cloudinit/handling.py | 147 +++++++++++++++++++++---------------------
 1 file changed, 74 insertions(+), 73 deletions(-)

diff --git a/cloudinit/handling.py b/cloudinit/handling.py
index 553abe4f..8f6424e3 100644
--- a/cloudinit/handling.py
+++ b/cloudinit/handling.py
@@ -7,8 +7,81 @@ from cloudinit.constants import (PER_INSTANCE, PER_ALWAYS)
 LOG = logging.getLogger(__name__)
 
 
+def handler_register(mod, part_handlers, data, frequency=per_instance):
+    if not hasattr(mod, "handler_version"):
+        setattr(mod, "handler_version", 1)
+
+    for mtype in mod.list_types():
+        part_handlers[mtype] = mod
+
+    handler_call_begin(mod, data, frequency)
+    return(mod)
+
+
+def handler_call_begin(mod, data, frequency):
+    handler_handle_part(mod, data, "__begin__", None, None, frequency)
+
+
+def handler_call_end(mod, data, frequency):
+    handler_handle_part(mod, data, "__end__", None, None, frequency)
+
+
+def handler_handle_part(mod, data, ctype, filename, payload, frequency):
+    # only add the handler if the module should run
+    modfreq = getattr(mod, "frequency", per_instance)
+    if not (modfreq == per_always or
+            (frequency == per_instance and modfreq == per_instance)):
+        return
+    try:
+        if mod.handler_version == 1:
+            mod.handle_part(data, ctype, filename, payload)
+        else:
+            mod.handle_part(data, ctype, filename, payload, frequency)
+    except:
+        util.logexc(log)
+        traceback.print_exc(file=sys.stderr)
+
+
+def partwalker_handle_handler(pdata, _ctype, _filename, payload):
+    curcount = pdata['handlercount']
+    modname = 'part-handler-%03d' % curcount
+    frequency = pdata['frequency']
+
+    modfname = modname + ".py"
+    util.write_file("%s/%s" % (pdata['handlerdir'], modfname), payload, 0600)
+
+    try:
+        mod = __import__(modname)
+        handler_register(mod, pdata['handlers'], pdata['data'], frequency)
+        pdata['handlercount'] = curcount + 1
+    except:
+        util.logexc(log)
+        traceback.print_exc(file=sys.stderr)
+
+
+def partwalker_callback(pdata, ctype, filename, payload):
+    # data here is the part_handlers array and then the data to pass through
+    if ctype == "text/part-handler":
+        if 'handlercount' not in pdata:
+            pdata['handlercount'] = 0
+        partwalker_handle_handler(pdata, ctype, filename, payload)
+        return
+    if ctype not in pdata['handlers']:
+        if ctype == "text/x-not-multipart":
+            # Extract the first line or 24 bytes for displaying in the log
+            start = payload.split("\n", 1)[0][:24]
+            if start < payload:
+                details = "starting '%s...'" % start.encode("string-escape")
+            else:
+                details = repr(payload)
+            log.warning("Unhandled non-multipart userdata %s", details)
+        return
+    handler_handle_part(pdata['handlers'][ctype], pdata['data'],
+        ctype, filename, payload, pdata['frequency'])
+
+
 class InternalPartHandler:
-    freq = PER_INSTANCE
+    freq = per_instance
     mtypes = []
     handler_version = 1
     handler = None
@@ -27,75 +100,3 @@ class InternalPartHandler:
 
     def handle_part(self, data, ctype, filename, payload, frequency):
         return(self.handler(data, ctype, filename, payload, frequency))
-
-
-def handler_register(mod, part_handlers, data, frequency=PER_INSTANCE):
-    if not hasattr(mod, "handler_version"):
-        setattr(mod, "handler_version", 1)
-
-    for mtype in mod.list_types():
-        part_handlers[mtype] = mod
-
-    handler_call_begin(mod, data, frequency)
-    return mod
-
-
-def handler_call_begin(mod, data, frequency):
-    handler_handle_part(mod, data, "__begin__", None, None, frequency)
-
-
-def handler_call_end(mod, data, frequency):
-    handler_handle_part(mod, data, "__end__", None, None, frequency)
-
-
-def handler_handle_part(mod, data, ctype, filename, payload, frequency):
-    # only add the handler if the module should run
-    modfreq = getattr(mod, "frequency", PER_INSTANCE)
-    if not (modfreq == PER_ALWAYS or
-            (frequency == PER_INSTANCE and modfreq == PER_INSTANCE)):
-        return
-    try:
-        if mod.handler_version == 1:
-            mod.handle_part(data, ctype, filename, payload)
-        else:
-            mod.handle_part(data, ctype, filename, payload, frequency)
-    except:
-        util.logexc(log)
-        traceback.print_exc(file=sys.stderr)
-
-
-def partwalker_handle_handler(pdata, _ctype, _filename, payload):
-    curcount = pdata['handlercount']
-    modname = 'part-handler-%03d' % curcount
-    frequency = pdata['frequency']
-
-    modfname = modname + ".py"
-    util.write_file(os.path.join(pdata['handlerdir'], modfname), payload, 0600)
-
-    try:
-        mod = importer.import_module(modname)
-        handler_register(mod, pdata['handlers'], pdata['data'], frequency)
-        pdata['handlercount'] = curcount + 1
-    except:
-        LOG.exception("Could not import module %s", modname)
-
-
-def partwalker_callback(pdata, ctype, filename, payload):
-    # data here is the part_handlers array and then the data to pass through
-    if ctype == "text/part-handler":
-        if 'handlercount' not in pdata:
-            pdata['handlercount'] = 0
-        partwalker_handle_handler(pdata, ctype, filename, payload)
-        return
-    if ctype not in pdata['handlers']:
-        if ctype == "text/x-not-multipart":
-            # Extract the first line or 24 bytes for displaying in the log
-            start = payload.split("\n", 1)[0][:24]
-            if start < payload:
-                details = "starting '%s...'" % start.encode("string-escape")
-            else:
-                details = repr(payload)
-            LOG.warning("Unhandled non-multipart userdata %s", details)
-        return
-    handler_handle_part(pdata['handlers'][ctype], pdata['data'],
-        ctype, filename, payload, pdata['frequency'])

From 7fafc515f938a011d6cb1701725d81dfa9c284e0 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 13:48:49 -0700
Subject: [PATCH 010/434] Add this file which will contain the cloud init and
 cloud config classes.

---
 cloudinit/cloud.py | 368 +++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 368 insertions(+)
 create mode 100644 cloudinit/cloud.py

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
new file mode 100644
index 00000000..eb71439b
--- /dev/null
+++ b/cloudinit/cloud.py
@@ -0,0 +1,368 @@
+import os
+
+import cPickle as pickle
+
+
+class CloudInit(object):
+    cfg = None
+    part_handlers = {}
+    old_conffile = '/etc/ec2-init/ec2-config.cfg'
+    ds_deps = [DataSource.DEP_FILESYSTEM, DataSource.DEP_NETWORK]
+    datasource = None
+    cloud_config_str = ''
+    datasource_name = ''
+
+    builtin_handlers = []
+
+    def __init__(self, ds_deps=None, sysconfig=system_config):
+        self.builtin_handlers = [
+            ['text/x-shellscript', self.handle_user_script, per_always],
+            ['text/cloud-config', self.handle_cloud_config, per_always],
+            ['text/upstart-job', self.handle_upstart_job, per_instance],
+            ['text/cloud-boothook', self.handle_cloud_boothook, per_always],
+        ]
+
+        if ds_deps != None:
+            self.ds_deps = ds_deps
+
+        self.sysconfig = sysconfig
+
+        self.cfg = self.read_cfg()
+
+    def read_cfg(self):
+        if self.cfg:
+            return(self.cfg)
+
+        try:
+            conf = util.get_base_cfg(self.sysconfig, cfg_builtin, parsed_cfgs)
+        except Exception:
+            conf = get_builtin_cfg()
+
+        # support reading the old ConfigObj format file and merging
+        # it into the yaml dictionary
+        try:
+            from configobj import ConfigObj
+            oldcfg = ConfigObj(self.old_conffile)
+            if oldcfg is None:
+                oldcfg = {}
+            conf = util.mergedict(conf, oldcfg)
+        except:
+            pass
+
+        return(conf)
+
+    def restore_from_cache(self):
+        try:
+            # we try to restore from a current link and static path
+            # by using the instance link, if purge_cache was called
+            # the file wont exist
+            cache = get_ipath_cur('obj_pkl')
+            f = open(cache, "rb")
+            data = cPickle.load(f)
+            f.close()
+            self.datasource = data
+            return True
+        except:
+            return False
+
+    def write_to_cache(self):
+        cache = self.get_ipath("obj_pkl")
+        try:
+            os.makedirs(os.path.dirname(cache))
+        except OSError as e:
+            if e.errno != errno.EEXIST:
+                return False
+
+        try:
+            f = open(cache, "wb")
+            cPickle.dump(self.datasource, f)
+            f.close()
+            os.chmod(cache, 0400)
+        except:
+            raise
+
+    def get_data_source(self):
+        if self.datasource is not None:
+            return True
+
+        if self.restore_from_cache():
+            log.debug("restored from cache type %s" % self.datasource)
+            return True
+
+        cfglist = self.cfg['datasource_list']
+        dslist = list_sources(cfglist, self.ds_deps)
+        dsnames = [f.__name__ for f in dslist]
+
+        log.debug("searching for data source in %s" % dsnames)
+        for cls in dslist:
+            ds = cls.__name__
+            try:
+                s = cls(sys_cfg=self.cfg)
+                if s.get_data():
+                    self.datasource = s
+                    self.datasource_name = ds
+                    log.debug("found data source %s" % ds)
+                    return True
+            except Exception as e:
+                log.warn("get_data of %s raised %s" % (ds, e))
+                util.logexc(log)
+        msg = "Did not find data source. searched classes: %s" % dsnames
+        log.debug(msg)
+        raise DataSourceNotFoundException(msg)
+
+    def set_cur_instance(self):
+        try:
+            os.unlink(cur_instance_link)
+        except OSError as e:
+            if e.errno != errno.ENOENT:
+                raise
+
+        iid = self.get_instance_id()
+        os.symlink("./instances/%s" % iid, cur_instance_link)
+        idir = self.get_ipath()
+        dlist = []
+        for d in ["handlers", "scripts", "sem"]:
+            dlist.append("%s/%s" % (idir, d))
+
+        util.ensure_dirs(dlist)
+
+        ds = "%s: %s\n" % (self.datasource.__class__, str(self.datasource))
+        dp = self.get_cpath('data')
+        util.write_file("%s/%s" % (idir, 'datasource'), ds)
+        util.write_file("%s/%s" % (dp, 'previous-datasource'), ds)
+        util.write_file("%s/%s" % (dp, 'previous-instance-id'), "%s\n" % iid)
+
+    def get_userdata(self):
+        return(self.datasource.get_userdata())
+
+    def get_userdata_raw(self):
+        return(self.datasource.get_userdata_raw())
+
+    def get_instance_id(self):
+        return(self.datasource.get_instance_id())
+
+    def update_cache(self):
+        self.write_to_cache()
+        self.store_userdata()
+
+    def store_userdata(self):
+        util.write_file(self.get_ipath('userdata_raw'),
+            self.datasource.get_userdata_raw(), 0600)
+        util.write_file(self.get_ipath('userdata'),
+            self.datasource.get_userdata(), 0600)
+
+    def sem_getpath(self, name, freq):
+        if freq == 'once-per-instance':
+            return("%s/%s" % (self.get_ipath("sem"), name))
+        return("%s/%s.%s" % (get_cpath("sem"), name, freq))
+
+    def sem_has_run(self, name, freq):
+        if freq == per_always:
+            return False
+        semfile = self.sem_getpath(name, freq)
+        if os.path.exists(semfile):
+            return True
+        return False
+
+    def sem_acquire(self, name, freq):
+        from time import time
+        semfile = self.sem_getpath(name, freq)
+
+        try:
+            os.makedirs(os.path.dirname(semfile))
+        except OSError as e:
+            if e.errno != errno.EEXIST:
+                raise e
+
+        if os.path.exists(semfile) and freq != per_always:
+            return False
+
+        # race condition
+        try:
+            f = open(semfile, "w")
+            f.write("%s\n" % str(time()))
+            f.close()
+        except:
+            return(False)
+        return(True)
+
+    def sem_clear(self, name, freq):
+        semfile = self.sem_getpath(name, freq)
+        try:
+            os.unlink(semfile)
+        except OSError as e:
+            if e.errno != errno.ENOENT:
+                return False
+
+        return True
+
+    # acquire lock on 'name' for given 'freq'
+    # if that does not exist, then call 'func' with given 'args'
+    # if 'clear_on_fail' is True and func throws an exception
+    #  then remove the lock (so it would run again)
+    def sem_and_run(self, semname, freq, func, args=None, clear_on_fail=False):
+        if args is None:
+            args = []
+        if self.sem_has_run(semname, freq):
+            log.debug("%s already ran %s", semname, freq)
+            return False
+        try:
+            if not self.sem_acquire(semname, freq):
+                raise Exception("Failed to acquire lock on %s" % semname)
+
+            func(*args)
+        except:
+            if clear_on_fail:
+                self.sem_clear(semname, freq)
+            raise
+
+        return True
+
+    # get_ipath : get the instance path for a name in pathmap
+    # (/var/lib/cloud/instances/<instance>/name)<name>)
+    def get_ipath(self, name=None):
+        return("%s/instances/%s%s"
+               % (varlibdir, self.get_instance_id(), pathmap[name]))
+
+    def consume_userdata(self, frequency=per_instance):
+        self.get_userdata()
+        data = self
+
+        cdir = get_cpath("handlers")
+        idir = self.get_ipath("handlers")
+
+        # add the path to the plugins dir to the top of our list for import
+        # instance dir should be read before cloud-dir
+        sys.path.insert(0, cdir)
+        sys.path.insert(0, idir)
+
+        part_handlers = {}
+        # add handlers in cdir
+        for fname in glob.glob("%s/*.py" % cdir):
+            if not os.path.isfile(fname):
+                continue
+            modname = os.path.basename(fname)[0:-3]
+            try:
+                mod = __import__(modname)
+                handler_register(mod, part_handlers, data, frequency)
+                log.debug("added handler for [%s] from %s" % (mod.list_types(),
+                                                              fname))
+            except:
+                log.warn("failed to initialize handler in %s" % fname)
+                util.logexc(log)
+
+        # add the internal handers if their type hasn't been already claimed
+        for (btype, bhand, bfreq) in self.builtin_handlers:
+            if btype in part_handlers:
+                continue
+            handler_register(InternalPartHandler(bhand, [btype], bfreq),
+                part_handlers, data, frequency)
+
+        # walk the data
+        pdata = {'handlers': part_handlers, 'handlerdir': idir,
+                 'data': data, 'frequency': frequency}
+        UserDataHandler.walk_userdata(self.get_userdata(),
+            partwalker_callback, data=pdata)
+
+        # give callbacks opportunity to finalize
+        called = []
+        for (_mtype, mod) in part_handlers.iteritems():
+            if mod in called:
+                continue
+            handler_call_end(mod, data, frequency)
+
+    def handle_user_script(self, _data, ctype, filename, payload, _frequency):
+        if ctype == "__end__":
+            return
+        if ctype == "__begin__":
+            # maybe delete existing things here
+            return
+
+        filename = filename.replace(os.sep, '_')
+        scriptsdir = get_ipath_cur('scripts')
+        util.write_file("%s/%s" %
+            (scriptsdir, filename), util.dos2unix(payload), 0700)
+
+    def handle_upstart_job(self, _data, ctype, filename, payload, frequency):
+        # upstart jobs are only written on the first boot
+        if frequency != per_instance:
+            return
+
+        if ctype == "__end__" or ctype == "__begin__":
+            return
+        if not filename.endswith(".conf"):
+            filename = filename + ".conf"
+
+        util.write_file("%s/%s" % ("/etc/init", filename),
+            util.dos2unix(payload), 0644)
+
+    def handle_cloud_config(self, _data, ctype, filename, payload, _frequency):
+        if ctype == "__begin__":
+            self.cloud_config_str = ""
+            return
+        if ctype == "__end__":
+            cloud_config = self.get_ipath("cloud_config")
+            util.write_file(cloud_config, self.cloud_config_str, 0600)
+
+            ## this could merge the cloud config with the system config
+            ## for now, not doing this as it seems somewhat circular
+            ## as CloudConfig does that also, merging it with this cfg
+            ##
+            # ccfg = yaml.load(self.cloud_config_str)
+            # if ccfg is None: ccfg = {}
+            # self.cfg = util.mergedict(ccfg, self.cfg)
+
+            return
+
+        self.cloud_config_str += "\n#%s\n%s" % (filename, payload)
+
+    def handle_cloud_boothook(self, _data, ctype, filename, payload,
+                              _frequency):
+        if ctype == "__end__":
+            return
+        if ctype == "__begin__":
+            return
+
+        filename = filename.replace(os.sep, '_')
+        payload = util.dos2unix(payload)
+        prefix = "#cloud-boothook"
+        start = 0
+        if payload.startswith(prefix):
+            start = len(prefix) + 1
+
+        boothooks_dir = self.get_ipath("boothooks")
+        filepath = "%s/%s" % (boothooks_dir, filename)
+        util.write_file(filepath, payload[start:], 0700)
+        try:
+            env = os.environ.copy()
+            env['INSTANCE_ID'] = self.datasource.get_instance_id()
+            subprocess.check_call([filepath], env=env)
+        except subprocess.CalledProcessError as e:
+            log.error("boothooks script %s returned %i" %
+                (filepath, e.returncode))
+        except Exception as e:
+            log.error("boothooks unknown exception %s when running %s" %
+                (e, filepath))
+
+    def get_public_ssh_keys(self):
+        return(self.datasource.get_public_ssh_keys())
+
+    def get_locale(self):
+        return(self.datasource.get_locale())
+
+    def get_mirror(self):
+        return(self.datasource.get_local_mirror())
+
+    def get_hostname(self, fqdn=False):
+        return(self.datasource.get_hostname(fqdn=fqdn))
+
+    def device_name_to_device(self, name):
+        return(self.datasource.device_name_to_device(name))
+
+    # I really don't know if this should be here or not, but
+    # I needed it in cc_update_hostname, where that code had a valid 'cloud'
+    # reference, but did not have a cloudinit handle
+    # (ie, no cloudinit.get_cpath())
+    def get_cpath(self, name=None):
+        return(get_cpath(name))
+

From 01915e468722939eea4a10b6e03e935f92058f3a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 13:49:07 -0700
Subject: [PATCH 011/434] Add in a utility class that will handle all
 shell-like actions.

---
 cloudinit/shell.py | 183 +++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 183 insertions(+)
 create mode 100644 cloudinit/shell.py

diff --git a/cloudinit/shell.py b/cloudinit/shell.py
new file mode 100644
index 00000000..17dae817
--- /dev/null
+++ b/cloudinit/shell.py
@@ -0,0 +1,183 @@
+import os
+import shutil
+import subprocess
+
+from StringIO import StringIO
+
+from cloudinit import exceptions as excp
+from cloudinit import log as logging
+
+try:
+    import selinux
+    HAVE_LIBSELINUX = True
+except ImportError:
+    HAVE_LIBSELINUX = False
+
+
+LOG = logging.getLogger(__name__)
+
+
+class SeLinuxGuard(object):
+    def __init__(self, path, recursive=False):
+        self.path = path
+        self.recursive = recursive
+        self.engaged = False
+        if HAVE_LIBSELINUX and selinux.is_selinux_enabled():
+            self.engaged = True
+
+    def __enter__(self):
+        return self.engaged
+
+    def __exit__(self, type, value, traceback):
+        if self.engaged:
+            LOG.debug("Disengaging selinux mode for %s: %s", self.path, self.recursive)
+            selinux.restorecon(self.path, recursive=self.recursive)
+
+
+def read_file(fname, read_cb=None):
+    LOG.debug("Reading from %s", fname)
+    with open(fname, 'rb') as fh:
+        ofh = StringIO()
+        pipe_in_out(fh, ofh, chunk_cb=read_cb)
+        return ofh.getvalue()
+
+
+def pipe_in_out(in_fh, out_fh, chunk_size=1024, chunk_cb=None):
+    bytes_piped = 0
+    LOG.debug("Transferring the contents of %s to %s in chunks of size %s.", in_fh, out_fh, chunk_size)
+    while True:
+        data = in_fh.read(chunk_size)
+        if data == '':
+            break
+        else:
+            out_fh.write(data)
+            bytes_piped += len(data)
+            if chunk_cb:
+                chunk_cb(bytes_piped)
+    out_fh.flush()
+    return bytes_piped
+
+
+def chownbyname(fname, user=None, group=None):
+    uid = -1
+    gid = -1
+    if user == None and group == None:
+        return
+    if user:
+        # TODO: why is this late imported
+        import pwd
+        uid = pwd.getpwnam(user).pw_uid
+    if group:
+        # TODO: why is this late imported
+        import grp
+        gid = grp.getgrnam(group).gr_gid
+
+    os.chown(fname, uid, gid)
+
+
+def ensure_dirs(dirlist, mode=0755):
+    for d in dirlist:
+        ensure_dir(d, mode)
+
+
+def ensure_dir(path, mode=0755):
+    if not os.path.isdir(path):
+        fixmodes = []
+        LOG.debug("Ensuring directory exists at path %s", dir_name)
+        try:
+            os.makedirs(path)
+        except OSError as e:
+            if e.errno != errno.EEXIST:
+                raise e
+        if mode is not None:
+            os.chmod(path, mode)
+
+def del_file(path):
+    LOG.debug("Attempting to remove %s", path)
+    os.unlink(path)
+
+
+def ensure_file(path):
+    if not os.path.isfile(path):
+        write_file(path, content='')
+
+
+def write_file(filename, content, mode=0644, omode="wb"):
+    """
+    Writes a file with the given content and sets the file mode as specified.
+    Resotres the SELinux context if possible.
+
+    @param filename: The full path of the file to write.
+    @param content: The content to write to the file.
+    @param mode: The filesystem mode to set on the file.
+    @param omode: The open mode used when opening the file (r, rb, a, etc.)
+    """
+    try:
+        os.makedirs(os.path.dirname(filename))
+    except OSError as e:
+        if e.errno != errno.EEXIST:
+            raise e
+
+    LOG.debug("Writing to %s (%o) %s bytes", filename, mode, len(content))
+    with open(filename, omode) as fh:
+        with SeLinuxGuard(filename):
+            fh.write(content)
+            if mode is not None:
+                os.chmod(filename, mode)
+
+def delete_dir_contents(dirname):
+    """
+    Deletes all contents of a directory without deleting the directory itself.
+
+    @param dirname: The directory whose contents should be deleted.
+    """
+    for node in os.listdir(dirname):
+        node_fullpath = os.path.join(dirname, node)
+        if os.path.isdir(node_fullpath):
+            shutil.rmtree(node_fullpath)
+        else:
+            os.unlink(node_fullpath)
+
+
+def subp(args, input_data=None, allowed_rc=None):
+    if allowed_rc is None:
+        allowed_rc = [0]
+    try:
+        sp = subprocess.Popen(args, stdout=subprocess.PIPE,
+            stderr=subprocess.PIPE, stdin=subprocess.PIPE)
+        (out, err) = sp.communicate(input_data)
+    except OSError as e:
+        raise excp.ProcessExecutionError(cmd=args, reason=e)
+    rc = sp.returncode
+    if rc not in allowed_rc:
+        raise excp.ProcessExecutionError(stdout=out, stderr=err,
+                                         exit_code=rc,
+                                         cmd=args)
+    # Just ensure blank instead of none??
+    if not out:
+        out = ''
+    if not err:
+        err = ''
+    return (out, err)
+
+
+# shellify, takes a list of commands
+#  for each entry in the list
+#    if it is an array, shell protect it (with single ticks)
+#    if it is a string, do nothing
+def shellify(cmdlist, add_header=True):
+    content = ''
+    if add_header:
+        content += "#!/bin/sh\n"
+    escaped = "%s%s%s%s" % ("'", '\\', "'", "'")
+    for args in cmdlist:
+        # if the item is a list, wrap all items in single tick
+        # if its not, then just write it directly
+        if isinstance(args, list):
+            fixed = []
+            for f in args:
+                fixed.append("'%s'" % str(f).replace("'", escaped))
+            content = "%s%s\n" % (content, ' '.join(fixed))
+        else:
+            content = "%s%s\n" % (content, str(args))
+    return content

From b18d8f4fb3a24b8031c1d9f54d201384358e5126 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 7 Jun 2012 13:50:38 -0700
Subject: [PATCH 012/434] Add a standard exception holding file.

---
 cloudinit/exceptions.py | 62 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 62 insertions(+)
 create mode 100644 cloudinit/exceptions.py

diff --git a/cloudinit/exceptions.py b/cloudinit/exceptions.py
new file mode 100644
index 00000000..235ded7a
--- /dev/null
+++ b/cloudinit/exceptions.py
@@ -0,0 +1,62 @@
+# vim: tabstop=4 shiftwidth=4 softtabstop=4
+
+
+class ProcessExecutionError(IOError):
+
+    message_tmpl = ('%(description)s\nCommand: %(cmd)s\n'
+                    'Exit code: %(exit_code)s\nStdout: %(stdout)r\n'
+                    'Stderr: %(stderr)r')
+
+    def __init__(self, stdout=None, stderr=None,
+                 exit_code=None, cmd=None,
+                 description=None, reason=None):
+        if not cmd:
+            self.cmd = '-'
+        else:
+            self.cmd = cmd
+
+        if not description:
+            self.description = 'Unexpected error while running command.'
+        else:
+            self.description = description
+
+        if not isinstance(exit_code, (long, int)):
+            self.exit_code = '-'
+        else:
+            self.exit_code = exit_code
+
+        if not stderr:
+            self.stderr = ''
+        else:
+            self.stderr = stderr
+
+        if not stdout:
+            self.stdout = ''
+        else:
+            self.stdout = stdout
+
+        message = self.message_tmpl % {
+            'description': self.description,
+            'cmd': self.cmd,
+            'exit_code': self.exit_code,
+            'stdout': self.stdout,
+            'stderr': self.stderr,
+        }
+        IOError.__init__(self, message)
+        self.reason = reason
+
+
+class MountFailedError(Exception):
+    pass
+
+
+class StackExceeded(Exception):
+    pass
+
+
+class RecursiveInclude(Exception):
+    pass
+
+
+class DataSourceNotFoundException(Exception):
+    pass

From 90316284cfa0d44c112b81bb663a378508eac824 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 17:53:42 -0700
Subject: [PATCH 013/434] Moving exceptions to modules where they are used.
 Seems to make sense.

---
 cloudinit/exceptions.py | 62 -----------------------------------------
 1 file changed, 62 deletions(-)
 delete mode 100644 cloudinit/exceptions.py

diff --git a/cloudinit/exceptions.py b/cloudinit/exceptions.py
deleted file mode 100644
index 235ded7a..00000000
--- a/cloudinit/exceptions.py
+++ /dev/null
@@ -1,62 +0,0 @@
-# vim: tabstop=4 shiftwidth=4 softtabstop=4
-
-
-class ProcessExecutionError(IOError):
-
-    message_tmpl = ('%(description)s\nCommand: %(cmd)s\n'
-                    'Exit code: %(exit_code)s\nStdout: %(stdout)r\n'
-                    'Stderr: %(stderr)r')
-
-    def __init__(self, stdout=None, stderr=None,
-                 exit_code=None, cmd=None,
-                 description=None, reason=None):
-        if not cmd:
-            self.cmd = '-'
-        else:
-            self.cmd = cmd
-
-        if not description:
-            self.description = 'Unexpected error while running command.'
-        else:
-            self.description = description
-
-        if not isinstance(exit_code, (long, int)):
-            self.exit_code = '-'
-        else:
-            self.exit_code = exit_code
-
-        if not stderr:
-            self.stderr = ''
-        else:
-            self.stderr = stderr
-
-        if not stdout:
-            self.stdout = ''
-        else:
-            self.stdout = stdout
-
-        message = self.message_tmpl % {
-            'description': self.description,
-            'cmd': self.cmd,
-            'exit_code': self.exit_code,
-            'stdout': self.stdout,
-            'stderr': self.stderr,
-        }
-        IOError.__init__(self, message)
-        self.reason = reason
-
-
-class MountFailedError(Exception):
-    pass
-
-
-class StackExceeded(Exception):
-    pass
-
-
-class RecursiveInclude(Exception):
-    pass
-
-
-class DataSourceNotFoundException(Exception):
-    pass

From 2e233898d8f55427c02c4f55ccdd8d86ac0f3f19 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 17:54:21 -0700
Subject: [PATCH 014/434] Moved this to a file called parts which handles this
 type of functionality.

---
 cloudinit/handling.py | 102 ------------------------------------------
 1 file changed, 102 deletions(-)
 delete mode 100644 cloudinit/handling.py

diff --git a/cloudinit/handling.py b/cloudinit/handling.py
deleted file mode 100644
index 8f6424e3..00000000
--- a/cloudinit/handling.py
+++ /dev/null
@@ -1,102 +0,0 @@
-import os
-
-from cloudinit import importer
-from cloudinit import log as logging
-from cloudinit.constants import (PER_INSTANCE, PER_ALWAYS)
-
-LOG = logging.getLogger(__name__)
-
-
-def handler_register(mod, part_handlers, data, frequency=per_instance):
-    if not hasattr(mod, "handler_version"):
-        setattr(mod, "handler_version", 1)
-
-    for mtype in mod.list_types():
-        part_handlers[mtype] = mod
-
-    handler_call_begin(mod, data, frequency)
-    return(mod)
-
-
-def handler_call_begin(mod, data, frequency):
-    handler_handle_part(mod, data, "__begin__", None, None, frequency)
-
-
-def handler_call_end(mod, data, frequency):
-    handler_handle_part(mod, data, "__end__", None, None, frequency)
-
-
-def handler_handle_part(mod, data, ctype, filename, payload, frequency):
-    # only add the handler if the module should run
-    modfreq = getattr(mod, "frequency", per_instance)
-    if not (modfreq == per_always or
-            (frequency == per_instance and modfreq == per_instance)):
-        return
-    try:
-        if mod.handler_version == 1:
-            mod.handle_part(data, ctype, filename, payload)
-        else:
-            mod.handle_part(data, ctype, filename, payload, frequency)
-    except:
-        util.logexc(log)
-        traceback.print_exc(file=sys.stderr)
-
-
-def partwalker_handle_handler(pdata, _ctype, _filename, payload):
-    curcount = pdata['handlercount']
-    modname = 'part-handler-%03d' % curcount
-    frequency = pdata['frequency']
-
-    modfname = modname + ".py"
-    util.write_file("%s/%s" % (pdata['handlerdir'], modfname), payload, 0600)
-
-    try:
-        mod = __import__(modname)
-        handler_register(mod, pdata['handlers'], pdata['data'], frequency)
-        pdata['handlercount'] = curcount + 1
-    except:
-        util.logexc(log)
-        traceback.print_exc(file=sys.stderr)
-
-
-def partwalker_callback(pdata, ctype, filename, payload):
-    # data here is the part_handlers array and then the data to pass through
-    if ctype == "text/part-handler":
-        if 'handlercount' not in pdata:
-            pdata['handlercount'] = 0
-        partwalker_handle_handler(pdata, ctype, filename, payload)
-        return
-    if ctype not in pdata['handlers']:
-        if ctype == "text/x-not-multipart":
-            # Extract the first line or 24 bytes for displaying in the log
-            start = payload.split("\n", 1)[0][:24]
-            if start < payload:
-                details = "starting '%s...'" % start.encode("string-escape")
-            else:
-                details = repr(payload)
-            log.warning("Unhandled non-multipart userdata %s", details)
-        return
-    handler_handle_part(pdata['handlers'][ctype], pdata['data'],
-        ctype, filename, payload, pdata['frequency'])
-
-
-class InternalPartHandler:
-    freq = per_instance
-    mtypes = []
-    handler_version = 1
-    handler = None
-
-    def __init__(self, handler, mtypes, frequency, version=2):
-        self.handler = handler
-        self.mtypes = mtypes
-        self.frequency = frequency
-        self.handler_version = version
-
-    def __repr__(self):
-        return("InternalPartHandler: [%s]" % self.mtypes)
-
-    def list_types(self):
-        return(self.mtypes)
-
-    def handle_part(self, data, ctype, filename, payload, frequency):
-        return(self.handler(data, ctype, filename, payload, frequency))

From be1fd842796ad29776111a79089d309a6d6214b3 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 17:54:45 -0700
Subject: [PATCH 015/434] Seems like the util function extraction was not
 actually needed.

---
 cloudinit/includer.py | 65 -------------------------------------------
 1 file changed, 65 deletions(-)
 delete mode 100644 cloudinit/includer.py

diff --git a/cloudinit/includer.py b/cloudinit/includer.py
deleted file mode 100644
index d1022c5a..00000000
--- a/cloudinit/includer.py
+++ /dev/null
@@ -1,65 +0,0 @@
-import os
-import re
-
-from cloudinit import downloader as down
-from cloudinit import exceptions as excp
-from cloudinit import log as logging
-from cloudinit import shell as sh
-
-INCLUDE_PATT = re.compile("^#(opt_include|include)[ \t](.*)$", re.MULTILINE)
-OPT_PATS = ['opt_include']
-
-LOG = logging.getLogger(__name__)
-
-
-class Includer(object):
-
-    def __init__(self, root_fn, stack_limit=10):
-        self.root_fn = root_fn
-        self.stack_limit = stack_limit
-
-    def _read_file(self, fname):
-        return sh.read_file(fname)
-
-    def _read(self, fname, stack, rel):
-        if len(stack) >= self.stack_limit:
-            raise excp.StackExceeded("Stack limit of %s reached while including %s" % (self.stack_limit, fname))
-
-        canon_fname = self._canon_name(fname, rel)
-        if canon_fname in stack:
-            raise excp.RecursiveInclude("File %s recursively included" % (canon_fname))
-
-        stack.add(canon_fname)
-        new_rel = os.path.dirname(canon_fname)
-        contents = self._read_file(canon_fname)
-
-        def include_cb(match):
-            is_optional = (match.group(1).lower() in OPT_PATS)
-            fn = match.group(2).strip()
-            if not fn:
-                # Should we die??
-                return match.group(0)
-            else:
-                try:
-                    LOG.debug("Including file %s", fn)
-                    return self._read(fn, stack, new_rel)
-                except IOError:
-                    if is_optional:
-                        return ''
-                    else:
-                        raise
-
-        adjusted_contents = INCLUDE_PATT.sub(include_cb, contents)
-        stack.remove(fname)
-        return adjusted_contents
-
-    def _canon_name(self, fname, rel):
-        fname = fname.strip()
-        if not fname.startswith("/"):
-            fname = os.path.sep.join([rel, fname])
-        return os.path.realpath(fname)
-
-    def read(self, relative_to="."):
-        stack = set()
-        return self._read(self.root_fn, stack, rel=relative_to)
-    

From 01bc41f1cf90aee1250f4ad11ff797adb82bae2b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 17:55:02 -0700
Subject: [PATCH 016/434] Putting back into utils for now (until that gets too
 big).

---
 cloudinit/shell.py | 183 ---------------------------------------------
 1 file changed, 183 deletions(-)
 delete mode 100644 cloudinit/shell.py

diff --git a/cloudinit/shell.py b/cloudinit/shell.py
deleted file mode 100644
index 17dae817..00000000
--- a/cloudinit/shell.py
+++ /dev/null
@@ -1,183 +0,0 @@
-import os
-import shutil
-import subprocess
-
-from StringIO import StringIO
-
-from cloudinit import exceptions as excp
-from cloudinit import log as logging
-
-try:
-    import selinux
-    HAVE_LIBSELINUX = True
-except ImportError:
-    HAVE_LIBSELINUX = False
-
-
-LOG = logging.getLogger(__name__)
-
-
-class SeLinuxGuard(object):
-    def __init__(self, path, recursive=False):
-        self.path = path
-        self.recursive = recursive
-        self.engaged = False
-        if HAVE_LIBSELINUX and selinux.is_selinux_enabled():
-            self.engaged = True
-
-    def __enter__(self):
-        return self.engaged
-
-    def __exit__(self, type, value, traceback):
-        if self.engaged:
-            LOG.debug("Disengaging selinux mode for %s: %s", self.path, self.recursive)
-            selinux.restorecon(self.path, recursive=self.recursive)
-
-
-def read_file(fname, read_cb=None):
-    LOG.debug("Reading from %s", fname)
-    with open(fname, 'rb') as fh:
-        ofh = StringIO()
-        pipe_in_out(fh, ofh, chunk_cb=read_cb)
-        return ofh.getvalue()
-
-
-def pipe_in_out(in_fh, out_fh, chunk_size=1024, chunk_cb=None):
-    bytes_piped = 0
-    LOG.debug("Transferring the contents of %s to %s in chunks of size %s.", in_fh, out_fh, chunk_size)
-    while True:
-        data = in_fh.read(chunk_size)
-        if data == '':
-            break
-        else:
-            out_fh.write(data)
-            bytes_piped += len(data)
-            if chunk_cb:
-                chunk_cb(bytes_piped)
-    out_fh.flush()
-    return bytes_piped
-
-
-def chownbyname(fname, user=None, group=None):
-    uid = -1
-    gid = -1
-    if user == None and group == None:
-        return
-    if user:
-        # TODO: why is this late imported
-        import pwd
-        uid = pwd.getpwnam(user).pw_uid
-    if group:
-        # TODO: why is this late imported
-        import grp
-        gid = grp.getgrnam(group).gr_gid
-
-    os.chown(fname, uid, gid)
-
-
-def ensure_dirs(dirlist, mode=0755):
-    for d in dirlist:
-        ensure_dir(d, mode)
-
-
-def ensure_dir(path, mode=0755):
-    if not os.path.isdir(path):
-        fixmodes = []
-        LOG.debug("Ensuring directory exists at path %s", dir_name)
-        try:
-            os.makedirs(path)
-        except OSError as e:
-            if e.errno != errno.EEXIST:
-                raise e
-        if mode is not None:
-            os.chmod(path, mode)
-
-def del_file(path):
-    LOG.debug("Attempting to remove %s", path)
-    os.unlink(path)
-
-
-def ensure_file(path):
-    if not os.path.isfile(path):
-        write_file(path, content='')
-
-
-def write_file(filename, content, mode=0644, omode="wb"):
-    """
-    Writes a file with the given content and sets the file mode as specified.
-    Resotres the SELinux context if possible.
-
-    @param filename: The full path of the file to write.
-    @param content: The content to write to the file.
-    @param mode: The filesystem mode to set on the file.
-    @param omode: The open mode used when opening the file (r, rb, a, etc.)
-    """
-    try:
-        os.makedirs(os.path.dirname(filename))
-    except OSError as e:
-        if e.errno != errno.EEXIST:
-            raise e
-
-    LOG.debug("Writing to %s (%o) %s bytes", filename, mode, len(content))
-    with open(filename, omode) as fh:
-        with SeLinuxGuard(filename):
-            fh.write(content)
-            if mode is not None:
-                os.chmod(filename, mode)
-
-def delete_dir_contents(dirname):
-    """
-    Deletes all contents of a directory without deleting the directory itself.
-
-    @param dirname: The directory whose contents should be deleted.
-    """
-    for node in os.listdir(dirname):
-        node_fullpath = os.path.join(dirname, node)
-        if os.path.isdir(node_fullpath):
-            shutil.rmtree(node_fullpath)
-        else:
-            os.unlink(node_fullpath)
-
-
-def subp(args, input_data=None, allowed_rc=None):
-    if allowed_rc is None:
-        allowed_rc = [0]
-    try:
-        sp = subprocess.Popen(args, stdout=subprocess.PIPE,
-            stderr=subprocess.PIPE, stdin=subprocess.PIPE)
-        (out, err) = sp.communicate(input_data)
-    except OSError as e:
-        raise excp.ProcessExecutionError(cmd=args, reason=e)
-    rc = sp.returncode
-    if rc not in allowed_rc:
-        raise excp.ProcessExecutionError(stdout=out, stderr=err,
-                                         exit_code=rc,
-                                         cmd=args)
-    # Just ensure blank instead of none??
-    if not out:
-        out = ''
-    if not err:
-        err = ''
-    return (out, err)
-
-
-# shellify, takes a list of commands
-#  for each entry in the list
-#    if it is an array, shell protect it (with single ticks)
-#    if it is a string, do nothing
-def shellify(cmdlist, add_header=True):
-    content = ''
-    if add_header:
-        content += "#!/bin/sh\n"
-    escaped = "%s%s%s%s" % ("'", '\\', "'", "'")
-    for args in cmdlist:
-        # if the item is a list, wrap all items in single tick
-        # if its not, then just write it directly
-        if isinstance(args, list):
-            fixed = []
-            for f in args:
-                fixed.append("'%s'" % str(f).replace("'", escaped))
-            content = "%s%s\n" % (content, ' '.join(fixed))
-        else:
-            content = "%s%s\n" % (content, str(args))
-    return content

From a7ffaeccc9c99aa4bb58c76e6274224a3089b6f3 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 17:55:23 -0700
Subject: [PATCH 017/434] Renamed this, since it's more of settings, not all
 constants.

---
 cloudinit/{constants.py => settings.py} | 3 +++
 1 file changed, 3 insertions(+)
 rename cloudinit/{constants.py => settings.py} (91%)

diff --git a/cloudinit/constants.py b/cloudinit/settings.py
similarity index 91%
rename from cloudinit/constants.py
rename to cloudinit/settings.py
index 7bc90f27..830d970d 100644
--- a/cloudinit/constants.py
+++ b/cloudinit/settings.py
@@ -7,6 +7,7 @@ SEED_DIR = os.path.join(VAR_LIB_DIR, "seed")
 
 CFG_ENV_NAME = "CLOUD_CFG"
 CLOUD_CONFIG = '/etc/cloud/cloud.cfg'
+OLD_CLOUD_CONFIG = '/etc/ec2-init/ec2-config.cfg'
 
 CFG_BUILTIN = {
     'datasource_list': ['NoCloud',
@@ -35,3 +36,5 @@ PATH_MAP = {
 PER_INSTANCE = "once-per-instance"
 PER_ALWAYS = "always"
 PER_ONCE = "once"
+
+TEMPLATE_DIR = '/etc/cloud/templates/'

From 393b3681798a88bb2393da5636ea465418b8e0ca Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 17:55:52 -0700
Subject: [PATCH 018/434] This now only holds some simple top level functions.
 TODO: maybe just move them to utils?

---
 cloudinit/__init__.py | 53 +++++++++++--------------------------------
 1 file changed, 13 insertions(+), 40 deletions(-)

diff --git a/cloudinit/__init__.py b/cloudinit/__init__.py
index f223fbe8..2c291ff5 100644
--- a/cloudinit/__init__.py
+++ b/cloudinit/__init__.py
@@ -23,18 +23,17 @@
 import os
 
 import sys
-import os.path
 import errno
 import subprocess
 import yaml
 import glob
-import traceback
 
-import cloudinit.log as logging
-import cloudinit.shell as sh
-import cloudinit.util as util
+from cloudinit import log as logging
+from cloudinit import sources
+from cloudinit import url_helper as uhelp
+from cloudinit import util
 
-from cloudinit.constants import (VAR_LIB_DIR, CFG_BUILTIN, CLOUD_CONFIG,
+from cloudinit.settings import (VAR_LIB_DIR, CFG_BUILTIN, CLOUD_CONFIG,
                                  BOOT_FINISHED, CUR_INSTANCE_LINK, PATH_MAP)
 
 LOG = logging.getLogger(__name__)
@@ -62,20 +61,20 @@ def initfs():
     dlist = []
     for subd in INIT_SUBDIRS:
         dlist.append(os.path.join(VAR_LIB_DIR, subd))
-    sh.ensure_dirs(dlist)
+    util.ensure_dirs(dlist)
 
     cfg = util.get_base_cfg(CLOUD_CONFIG, get_builtin_cfg(), parsed_cfgs)
     log_file = util.get_cfg_option_str(cfg, 'def_log_file', None)
     perms = util.get_cfg_option_str(cfg, 'syslog_fix_perms', None)
     if log_file:
-        sh.ensure_file(log_file)
+        util.ensure_file(log_file)
     if log_file and perms:
         (u, g) = perms.split(':', 1)
         if u == "-1" or u == "None":
             u = None
         if g == "-1" or g == "None":
             g = None
-        sh.chownbyname(log_file, u, g)
+        util.chownbyname(log_file, u, g)
 
 
 def purge_cache(rmcur=True):
@@ -83,36 +82,10 @@ def purge_cache(rmcur=True):
     if rmcur:
         rmlist.append(CUR_INSTANCE_LINK)
     for f in rmlist:
-        try:
-            sh.unlink(f)
-        except OSError as e:
-            if e.errno == errno.ENOENT:
-                continue
-            return False
-        except:
-            return False
+        util.unlink(f)
     return True
 
 
-# get_ipath_cur: get the current instance path for an item
-def get_ipath_cur(name=None):
-    add_on = PATH_MAP.get(name)
-    ipath = os.path.join(VAR_LIB_DIR, 'instance')
-    if add_on:
-        ipath = os.path.join(ipath, add_on)
-    return ipath
-
-
-# get_cpath : get the "clouddir" (/var/lib/cloud/<name>)
-# for a name in dirmap
-def get_cpath(name=None):
-    cpath = VAR_LIB_DIR
-    add_on = PATH_MAP.get(name)
-    if add_on:
-        cpath = os.path.join(cpath, add_on)
-    return cpath
-
-
 def get_base_cfg(cfg_path=None):
     if cfg_path is None:
         cfg_path = CLOUD_CONFIG
@@ -124,7 +97,7 @@ def get_builtin_cfg():
 
 
 def list_sources(cfg_list, depends):
-    return (DataSource.list_sources(cfg_list, depends, ["cloudinit", ""]))
+    return (sources.list_sources(cfg_list, depends, ["cloudinit", ""]))
 
 
 def get_cmdline_url(names=('cloud-config-url', 'url'),
@@ -140,11 +113,11 @@ def get_cmdline_url(names=('cloud-config-url', 'url'),
         if key in data:
             url = data[key]
             break
-    if url == None:
+
+    if url is None:
         return (None, None, None)
 
-    contents = util.readurl(url)
-
+    contents = uhelp.readurl(url)
     if contents.startswith(starts):
         return (key, url, contents)
 

From a61b86853477d3c23e0e34c48e9c7d9e06ac760e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 17:56:15 -0700
Subject: [PATCH 019/434] This now holds the following classes:

CloudInit - cut up to only provide some basic init processes
CloudPartData - provided to handlers so that they can fetch needed data without providing the whole enchilada of cloud init.
CloudPaths - holds the paths that should be used, for instances, for non-instances and such.
CloudSemaphores - holds the concept of cloud-init's semaphores, but cleaned up, using a context manager to help here.
CloudHandlers - holds the user data handlers to be activated
CloudConfig - the cloud config object (to be cleaned up)
---
 cloudinit/cloud.py | 663 +++++++++++++++++++++++++--------------------
 1 file changed, 366 insertions(+), 297 deletions(-)

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index eb71439b..cfb1c011 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -1,368 +1,437 @@
-import os
+from time import time
 
 import cPickle as pickle
+import contextlib
+import os
+import sys
+import weakref
+
+
+from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS,
+                                OLD_CLOUD_CONFIG, CLOUD_CONFIG,
+                                CFG_BUILTIN, CUR_INSTANCE_LINK)
+from cloudinit import (get_builtin_cfg, get_base_cfg)
+from cloudinit import log as logging
+from cloudinit import parts
+from cloudinit import sources
+from cloudinit import util
+from cloudinit import user_data
+
+LOG = logging.getLogger(__name__)
+
+
+class CloudSemaphores(object):
+    def __init__(self, paths):
+        self.paths = paths
+
+    # acquire lock on 'name' for given 'freq' and run function 'func'
+    # if 'clear_on_fail' is True and 'func' throws an exception
+    # then remove the lock (so it would run again)
+    def run_functor(self, name, freq, functor, args=None, clear_on_fail=False):
+        if not args:
+            args = []
+        if self.has_run(name, freq):
+            LOG.debug("%s already ran %s", name, freq)
+            return False
+        with self.lock(name, freq, clear_on_fail) as lock:
+            if not lock:
+                raise RuntimeError("Failed to acquire lock on %s" % name)
+            else:
+                LOG.debug("Running %s with args %s using lock %s", func, args, lock)
+                func(*args)
+        return True
+
+    @contextlib.contextmanager
+    def lock(self, name, freq, clear_on_fail=False):
+        try:
+            yield self._acquire(name, freq)
+        except:
+            if clear_on_fail:
+                self.clear(name, freq)
+            raise
+
+    def clear(self, name, freq):
+        sem_file = self._getpath(name, freq)
+        try:
+            util.del_file(sem_file)
+        except IOError:
+            return False
+        return True
+
+    def _acquire(self, name, freq):
+        if self.has_run(name, freq):
+            return None
+        # This is a race condition since nothing atomic is happening
+        # here, but this should be ok due to the nature of when
+        # and where cloud-init runs... (file writing is not a lock..)
+        sem_file = self._getpath(name, freq)
+        contents = "%s\n" % str(time())
+        try:
+            util.write_file(sem_file, contents)
+        except (IOError, OSError):
+            return None
+        return sem_file
+
+    def has_run(self, name, freq):
+        if freq == PER_ALWAYS:
+            return False
+        sem_file = self._get_path(name, freq)
+        if os.path.exists(sem_file):
+            return True
+        return False
+
+    def _get_path(self, name, freq):
+        sem_path = self.init.get_ipath("sem")
+        if freq == PER_INSTANCE:
+            return os.path.join(sem_path, name)
+        return os.path.join(sem_path, "%s.%s" % (name, freq))
+
+
+class CloudPaths(object):
+    def __init__(self, init):
+        self.config = CLOUD_CONFIG
+        self.old_config = OLD_CLOUD_CONFIG
+        self.var_dir = VAR_LIB_DIR
+        self.instance_link = CUR_INSTANCE_LINK
+        self.init = weakref.proxy(init)
+        self.upstart_conf_d = "/etc/init"
+
+    def _get_path_key(self, name):
+        return PATH_MAP.get(name)
+
+    # get_ipath_cur: get the current instance path for an item
+    def get_ipath_cur(self, name=None):
+        add_on = self._get_path_key(name)
+        ipath = os.path.join(self.var_dir, 'instance')
+        if add_on:
+            ipath = os.path.join(ipath, add_on)
+        return ipath
+
+    # get_cpath : get the "clouddir" (/var/lib/cloud/<name>)
+    # for a name in dirmap
+    def get_cpath(self, name=None):
+        cpath = self.var_dir
+        add_on = self._get_path_key(name)
+        if add_on:
+            cpath = os.path.join(cpath, add_on)
+        return cpath
+
+    # get_ipath : get the instance path for a name in pathmap
+    # (/var/lib/cloud/instances/<instance>/<name>)
+    def get_ipath(self, name=None):
+        iid = self.init.datasource.get_instance_id()
+        ipath = os.path.join(self.var_dir, 'instances', iid)
+        add_on = self._get_path_key(name)
+        if add_on:
+            ipath = os.path.join(ipath, add_on)
+        return ipath
+
+
+class CloudPartData(object):
+    def __init__(self, datasource, paths):
+        self.datasource = datasource
+        self.paths = paths
+
+    def get_userdata(self):
+        return self.datasource.get_userdata()
+
+    def get_public_ssh_keys(self):
+        return self.datasource.get_public_ssh_keys()
+
+    def get_locale(self):
+        return self.datasource.get_locale()
+
+    def get_mirror(self):
+        return self.datasource.get_local_mirror()
+
+    def get_hostname(self, fqdn=False):
+        return self.datasource.get_hostname(fqdn=fqdn)
+
+    def device_name_to_device(self, name):
+        return self.datasource.device_name_to_device(name)
+
+    def get_ipath_cur(self, name=None):
+        return self.paths.get_ipath_cur(name)
+
+    def get_cpath(self, name=None):
+        return self.paths.get_cpath(name)
+
+    def get_ipath(self, name=None):
+        return self.paths.get_ipath(name)
 
 
 class CloudInit(object):
-    cfg = None
-    part_handlers = {}
-    old_conffile = '/etc/ec2-init/ec2-config.cfg'
-    ds_deps = [DataSource.DEP_FILESYSTEM, DataSource.DEP_NETWORK]
-    datasource = None
-    cloud_config_str = ''
-    datasource_name = ''
-
-    builtin_handlers = []
-
-    def __init__(self, ds_deps=None, sysconfig=system_config):
-        self.builtin_handlers = [
-            ['text/x-shellscript', self.handle_user_script, per_always],
-            ['text/cloud-config', self.handle_cloud_config, per_always],
-            ['text/upstart-job', self.handle_upstart_job, per_instance],
-            ['text/cloud-boothook', self.handle_cloud_boothook, per_always],
-        ]
-
-        if ds_deps != None:
+    def __init__(self, ds_deps=None):
+        self.datasource = None
+        if ds_deps:
             self.ds_deps = ds_deps
+        else:
+            self.ds_deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
+        self.paths = CloudPaths(self)
+        self.sems = CloudSemaphores(self.paths)
+        self.cfg = self._read_cfg()
 
-        self.sysconfig = sysconfig
-
-        self.cfg = self.read_cfg()
-
-    def read_cfg(self):
-        if self.cfg:
-            return(self.cfg)
-
-        try:
-            conf = util.get_base_cfg(self.sysconfig, cfg_builtin, parsed_cfgs)
-        except Exception:
-            conf = get_builtin_cfg()
-
+    def _read_cfg_old(self):
         # support reading the old ConfigObj format file and merging
         # it into the yaml dictionary
         try:
             from configobj import ConfigObj
-            oldcfg = ConfigObj(self.old_conffile)
-            if oldcfg is None:
-                oldcfg = {}
-            conf = util.mergedict(conf, oldcfg)
-        except:
-            pass
+        except ImportError:
+            ConfigObj = None
+        if not ConfigObj:
+            return {}
+        old_cfg = ConfigObj(self.paths.old_config_fn)
+        return dict(old_cfg)
 
-        return(conf)
+    def read_cfg(self):
+        if not self.cfg:
+            self.cfg = self._read_cfg()
+        return self.cfg
 
+    def _read_cfg(self):
+        starting_config = get_builtin_cfg()
+        try:
+            conf = get_base_cfg(self.paths.config, starting_config)
+        except Exception:
+            conf = starting_config
+        old_conf = self._read_cfg_old()
+        conf = util.mergedict(conf, old_conf)
+        return conf
+    
     def restore_from_cache(self):
+        pickled_fn = self.paths.get_ipath_cur('obj_pkl')
         try:
             # we try to restore from a current link and static path
             # by using the instance link, if purge_cache was called
             # the file wont exist
-            cache = get_ipath_cur('obj_pkl')
-            f = open(cache, "rb")
-            data = cPickle.load(f)
-            f.close()
-            self.datasource = data
+            self.datasource = pickle.loads(util.load_file(pickled_fn))
             return True
-        except:
+        except Exception as e:
+            LOG.debug("Failed loading pickled datasource from %s due to %s", pickled_fn, e)
             return False
-
+    
     def write_to_cache(self):
-        cache = self.get_ipath("obj_pkl")
+        pickled_fn = self.paths.get_ipath_cur("obj_pkl")
         try:
-            os.makedirs(os.path.dirname(cache))
-        except OSError as e:
-            if e.errno != errno.EEXIST:
-                return False
-
-        try:
-            f = open(cache, "wb")
-            cPickle.dump(self.datasource, f)
-            f.close()
-            os.chmod(cache, 0400)
-        except:
-            raise
-
+            contents = pickle.dumps(self.datasource)
+            util.write_file(pickled_fn, contents, mode=0400)
+        except Exception as e:
+            LOG.debug("Failed pickling datasource to %s due to %s", pickled_fn, e)
+            return False
+    
     def get_data_source(self):
-        if self.datasource is not None:
+        if self.datasource:
             return True
-
         if self.restore_from_cache():
-            log.debug("restored from cache type %s" % self.datasource)
+            LOG.debug("Restored from cache datasource: %s" % self.datasource)
             return True
-
-        cfglist = self.cfg['datasource_list']
-        dslist = list_sources(cfglist, self.ds_deps)
-        dsnames = [f.__name__ for f in dslist]
-
-        log.debug("searching for data source in %s" % dsnames)
-        for cls in dslist:
-            ds = cls.__name__
-            try:
-                s = cls(sys_cfg=self.cfg)
-                if s.get_data():
-                    self.datasource = s
-                    self.datasource_name = ds
-                    log.debug("found data source %s" % ds)
-                    return True
-            except Exception as e:
-                log.warn("get_data of %s raised %s" % (ds, e))
-                util.logexc(log)
-        msg = "Did not find data source. searched classes: %s" % dsnames
-        log.debug(msg)
-        raise DataSourceNotFoundException(msg)
-
+        (ds, dsname) = sources.find_source(self.cfg, self.ds_deps)
+        LOG.debug("Loaded datasource %s:%s", dsname, ds)
+        self.datasource = ds
+        return True
+    
     def set_cur_instance(self):
-        try:
-            os.unlink(cur_instance_link)
-        except OSError as e:
-            if e.errno != errno.ENOENT:
-                raise
+        # Ensure we are hooked into the right symlink for the current instance
+        idir = self.paths.get_ipath()
+        util.del_file(self.paths.instance_link)
+        util.sym_link(idir, self.paths.instance_link)
 
-        iid = self.get_instance_id()
-        os.symlink("./instances/%s" % iid, cur_instance_link)
-        idir = self.get_ipath()
         dlist = []
         for d in ["handlers", "scripts", "sem"]:
-            dlist.append("%s/%s" % (idir, d))
-
+            dlist.append(os.path.join(idir, d))
         util.ensure_dirs(dlist)
 
-        ds = "%s: %s\n" % (self.datasource.__class__, str(self.datasource))
-        dp = self.get_cpath('data')
-        util.write_file("%s/%s" % (idir, 'datasource'), ds)
-        util.write_file("%s/%s" % (dp, 'previous-datasource'), ds)
-        util.write_file("%s/%s" % (dp, 'previous-instance-id'), "%s\n" % iid)
-
-    def get_userdata(self):
-        return(self.datasource.get_userdata())
-
-    def get_userdata_raw(self):
-        return(self.datasource.get_userdata_raw())
-
-    def get_instance_id(self):
-        return(self.datasource.get_instance_id())
+        # Write out information on what is being used for the current instance
+        # and what may have been used for a previous instance...
+        dp = self.paths.get_cpath('data')
+        ds = "%s: %s\n" % (self.datasource.__class__, self.datasource)
+        previous_ds = ''
+        ds_fn = os.path.join(idir, 'datasource')
+        try:
+            previous_ds = util.load_file(ds_fn).strip()
+        except IOError as e:
+            pass
+        if not previous_ds:
+            # TODO: ?? is this right
+            previous_ds = ds
+        util.write_file(ds_fn, ds)
+        util.write_file(os.path.join(dp, 'previous-datasource'), previous_ds)
+        iid = self.datasource.get_instance_id()
+        previous_iid = ''
+        p_iid_fn = os.path.join(dp, 'previous-instance-id')
+        try:
+            previous_iid = util.load_file(p_iid_fn).strip()
+        except IOError as e:
+            pass
+        if not previous_iid:
+            # TODO: ?? is this right
+            previous_iid = iid
+        util.write_file(p_iid_fn, "%s\n" % previous_iid)
 
     def update_cache(self):
         self.write_to_cache()
         self.store_userdata()
 
     def store_userdata(self):
-        util.write_file(self.get_ipath('userdata_raw'),
-            self.datasource.get_userdata_raw(), 0600)
-        util.write_file(self.get_ipath('userdata'),
-            self.datasource.get_userdata(), 0600)
+        raw_ud = "%s" % (self.datasource.get_userdata_raw())
+        util.write_file(self.paths.get_ipath('userdata_raw'), raw_ud, 0600)
+        ud = "%s" % (self.datasource.get_userdata())
+        util.write_file(self.paths.get_ipath('userdata'), ud, 0600)
 
-    def sem_getpath(self, name, freq):
-        if freq == 'once-per-instance':
-            return("%s/%s" % (self.get_ipath("sem"), name))
-        return("%s/%s.%s" % (get_cpath("sem"), name, freq))
-
-    def sem_has_run(self, name, freq):
-        if freq == per_always:
-            return False
-        semfile = self.sem_getpath(name, freq)
-        if os.path.exists(semfile):
-            return True
-        return False
-
-    def sem_acquire(self, name, freq):
-        from time import time
-        semfile = self.sem_getpath(name, freq)
-
-        try:
-            os.makedirs(os.path.dirname(semfile))
-        except OSError as e:
-            if e.errno != errno.EEXIST:
-                raise e
-
-        if os.path.exists(semfile) and freq != per_always:
-            return False
-
-        # race condition
-        try:
-            f = open(semfile, "w")
-            f.write("%s\n" % str(time()))
-            f.close()
-        except:
-            return(False)
-        return(True)
-
-    def sem_clear(self, name, freq):
-        semfile = self.sem_getpath(name, freq)
-        try:
-            os.unlink(semfile)
-        except OSError as e:
-            if e.errno != errno.ENOENT:
-                return False
-
-        return True
-
-    # acquire lock on 'name' for given 'freq'
-    # if that does not exist, then call 'func' with given 'args'
-    # if 'clear_on_fail' is True and func throws an exception
-    #  then remove the lock (so it would run again)
-    def sem_and_run(self, semname, freq, func, args=None, clear_on_fail=False):
-        if args is None:
-            args = []
-        if self.sem_has_run(semname, freq):
-            log.debug("%s already ran %s", semname, freq)
-            return False
-        try:
-            if not self.sem_acquire(semname, freq):
-                raise Exception("Failed to acquire lock on %s" % semname)
-
-            func(*args)
-        except:
-            if clear_on_fail:
-                self.sem_clear(semname, freq)
-            raise
-
-        return True
-
-    # get_ipath : get the instance path for a name in pathmap
-    # (/var/lib/cloud/instances/<instance>/name)<name>)
-    def get_ipath(self, name=None):
-        return("%s/instances/%s%s"
-               % (varlibdir, self.get_instance_id(), pathmap[name]))
-
-    def consume_userdata(self, frequency=per_instance):
-        self.get_userdata()
-        data = self
-
-        cdir = get_cpath("handlers")
-        idir = self.get_ipath("handlers")
-
-        # add the path to the plugins dir to the top of our list for import
+    def consume_userdata(self, frequency=PER_INSTANCE):
+        cdir = self.paths.get_cpath("handlers")
+        idir = self.paths.get_ipath("handlers")
+    
+        # Add the path to the plugins dir to the top of our list for import
         # instance dir should be read before cloud-dir
         sys.path.insert(0, cdir)
         sys.path.insert(0, idir)
 
-        part_handlers = {}
-        # add handlers in cdir
-        for fname in glob.glob("%s/*.py" % cdir):
+        # Data will be a little proxy that modules can use
+        data = CloudPartData(self.datasource, self.paths)
+
+        # This keeps track of all the active handlers
+        handlers = CloudHandlers(self)
+
+        # Add handlers in cdir
+        for fname in glob.glob(os.path.join(cdir, "*.py")):
             if not os.path.isfile(fname):
                 continue
             modname = os.path.basename(fname)[0:-3]
             try:
-                mod = __import__(modname)
-                handler_register(mod, part_handlers, data, frequency)
-                log.debug("added handler for [%s] from %s" % (mod.list_types(),
-                                                              fname))
+                mod = parts.fixup_module(importer.import_module(modname))
+                types = handlers.register(mod)
+                LOG.debug("Added handler for [%s] from %s", types, fname)
             except:
-                log.warn("failed to initialize handler in %s" % fname)
-                util.logexc(log)
+                LOG.exception("Failed to register handler in %s", fname)
 
-        # add the internal handers if their type hasn't been already claimed
-        for (btype, bhand, bfreq) in self.builtin_handlers:
-            if btype in part_handlers:
-                continue
-            handler_register(InternalPartHandler(bhand, [btype], bfreq),
-                part_handlers, data, frequency)
+        def_handlers = handlers.register_defaults()
+        if def_handlers:
+            LOG.debug("Registered default handlers for [%s]", def_handlers)
 
-        # walk the data
-        pdata = {'handlers': part_handlers, 'handlerdir': idir,
-                 'data': data, 'frequency': frequency}
-        UserDataHandler.walk_userdata(self.get_userdata(),
-            partwalker_callback, data=pdata)
-
-        # give callbacks opportunity to finalize
+        # Init the handlers first
+        # Ensure userdata fetched before activation
         called = []
-        for (_mtype, mod) in part_handlers.iteritems():
+        for (_mtype, mod) in handlers.iteritems():
             if mod in called:
                 continue
-            handler_call_end(mod, data, frequency)
+            parts.call_begin(mod, data, frequency)
+            called.append(mod)
 
-    def handle_user_script(self, _data, ctype, filename, payload, _frequency):
-        if ctype == "__end__":
-            return
-        if ctype == "__begin__":
-            # maybe delete existing things here
-            return
+        # Walk the user data
+        part_data = {
+            'handlers': handlers,
+            'handlerdir': idir,
+            'data': data, 
+            'frequency': frequency,
+            'handlercount': 0,
+        }
+        user_data.walk(data.get_userdata(), parts.walker_callback, data=part_data)
 
-        filename = filename.replace(os.sep, '_')
-        scriptsdir = get_ipath_cur('scripts')
-        util.write_file("%s/%s" %
-            (scriptsdir, filename), util.dos2unix(payload), 0700)
+        # Give callbacks opportunity to finalize
+        called = []
+        for (_mtype, mod) in handlers.iteritems():
+            if mod in called:
+                continue
+            parts.call_end(mod, data, frequency)
+            called.append(mod)
 
-    def handle_upstart_job(self, _data, ctype, filename, payload, frequency):
-        # upstart jobs are only written on the first boot
-        if frequency != per_instance:
-            return
 
-        if ctype == "__end__" or ctype == "__begin__":
-            return
-        if not filename.endswith(".conf"):
-            filename = filename + ".conf"
+class CloudHandlers(object):
 
-        util.write_file("%s/%s" % ("/etc/init", filename),
-            util.dos2unix(payload), 0644)
+    def __init__(self, paths):
+        self.paths = paths
+        self.registered = {}
 
-    def handle_cloud_config(self, _data, ctype, filename, payload, _frequency):
-        if ctype == "__begin__":
-            self.cloud_config_str = ""
-            return
-        if ctype == "__end__":
-            cloud_config = self.get_ipath("cloud_config")
-            util.write_file(cloud_config, self.cloud_config_str, 0600)
+    def __contains__(self, item):
+        return self.is_registered(item)
 
-            ## this could merge the cloud config with the system config
-            ## for now, not doing this as it seems somewhat circular
-            ## as CloudConfig does that also, merging it with this cfg
-            ##
-            # ccfg = yaml.load(self.cloud_config_str)
-            # if ccfg is None: ccfg = {}
-            # self.cfg = util.mergedict(ccfg, self.cfg)
+    def __getitem__(self, key):
+        return self._get_handler(key)
 
-            return
+    def is_registered(self, content_type):
+        return content_type in self.registered
 
-        self.cloud_config_str += "\n#%s\n%s" % (filename, payload)
+    def register(self, mod):
+        types = set()
+        for t in mod.list_types():
+            self.registered[t] = handler
+            types.add(t)
+        return types
 
-    def handle_cloud_boothook(self, _data, ctype, filename, payload,
-                              _frequency):
-        if ctype == "__end__":
-            return
-        if ctype == "__begin__":
-            return
+    def _get_handler(self, content_type):
+        return self.registered[content_type]
 
-        filename = filename.replace(os.sep, '_')
-        payload = util.dos2unix(payload)
-        prefix = "#cloud-boothook"
-        start = 0
-        if payload.startswith(prefix):
-            start = len(prefix) + 1
+    def items(self):
+        return self.registered.items()
 
-        boothooks_dir = self.get_ipath("boothooks")
-        filepath = "%s/%s" % (boothooks_dir, filename)
-        util.write_file(filepath, payload[start:], 0700)
+    def iteritems(self):
+        return self.registered.iteritems()
+
+    def _get_default_handlers(self):
+        def_handlers = []
+        if self.paths.get_ipath("cloud_config"):
+            def_handlers.append(parts.CloudConfigPartHandler(self.paths.get_ipath("cloud_config")))
+        if self.paths.get_ipath_cur('scripts'):
+            def_handlers.append(parts.ShellScriptPartHandler(self.paths.get_ipath_cur('scripts')))
+        if self.paths.get_ipath("boothooks"):
+            def_handlers.append(parts.BootHookPartHandler(self.paths.get_ipath("boothooks")))
+        if self.paths.upstart_conf_d:
+            def_handlers.append(parts.UpstartJobPartHandler(self.paths.upstart_conf_d))
+        return def_handlers
+
+    def register_defaults(self):
+        registered = set()
+        for h in self._get_default_handlers():
+            for t in h.list_types():
+                if not self.is_registered(t)
+                    self.register_handler(t, h)
+                    registered.add(t)
+        return registered
+
+
+class CloudConfig(object):
+    cfgfile = None
+    cfg = None
+
+    def __init__(self, cfgfile, cloud=None, ds_deps=None):
+        if cloud == None:
+            self.cloud = cloudinit.CloudInit(ds_deps)
+            self.cloud.get_data_source()
+        else:
+            self.cloud = cloud
+        self.cfg = self.get_config_obj(cfgfile)
+
+    def get_config_obj(self, cfgfile):
         try:
-            env = os.environ.copy()
-            env['INSTANCE_ID'] = self.datasource.get_instance_id()
-            subprocess.check_call([filepath], env=env)
-        except subprocess.CalledProcessError as e:
-            log.error("boothooks script %s returned %i" %
-                (filepath, e.returncode))
-        except Exception as e:
-            log.error("boothooks unknown exception %s when running %s" %
-                (e, filepath))
+            cfg = util.read_conf(cfgfile)
+        except:
+            # TODO: this 'log' could/should be passed in
+            cloudinit.log.critical("Failed loading of cloud config '%s'. "
+                                   "Continuing with empty config\n" % cfgfile)
+            cloudinit.log.debug(traceback.format_exc() + "\n")
+            cfg = None
+        if cfg is None:
+            cfg = {}
 
-    def get_public_ssh_keys(self):
-        return(self.datasource.get_public_ssh_keys())
+        try:
+            ds_cfg = self.cloud.datasource.get_config_obj()
+        except:
+            ds_cfg = {}
 
-    def get_locale(self):
-        return(self.datasource.get_locale())
+        cfg = util.mergedict(cfg, ds_cfg)
+        return(util.mergedict(cfg, self.cloud.cfg))
 
-    def get_mirror(self):
-        return(self.datasource.get_local_mirror())
+    def handle(self, name, args, freq=None):
+        try:
+            mod = __import__("cc_" + name.replace("-", "_"), globals())
+            def_freq = getattr(mod, "frequency", per_instance)
+            handler = getattr(mod, "handle")
 
-    def get_hostname(self, fqdn=False):
-        return(self.datasource.get_hostname(fqdn=fqdn))
-
-    def device_name_to_device(self, name):
-        return(self.datasource.device_name_to_device(name))
-
-    # I really don't know if this should be here or not, but
-    # I needed it in cc_update_hostname, where that code had a valid 'cloud'
-    # reference, but did not have a cloudinit handle
-    # (ie, no cloudinit.get_cpath())
-    def get_cpath(self, name=None):
-        return(get_cpath(name))
+            if not freq:
+                freq = def_freq
 
+            self.cloud.sem_and_run("config-" + name, freq, handler,
+                [name, self.cfg, self.cloud, cloudinit.log, args])
+        except:
+            raise

From 30aa87777af4424d47e59013644ab8b8c1db22fc Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 17:58:37 -0700
Subject: [PATCH 020/434] Working on making this have the old setup (where
 strings are taken in for config) as well as file names (for those that have
 files).

---
 cloudinit/log.py | 44 +++++++++++++++++---------------------------
 1 file changed, 17 insertions(+), 27 deletions(-)

diff --git a/cloudinit/log.py b/cloudinit/log.py
index 4d270045..2dda405d 100644
--- a/cloudinit/log.py
+++ b/cloudinit/log.py
@@ -2,8 +2,13 @@
 
 import logging
 import logging.handlers
+import logging.config
+
+import os
 import sys
 
+from StringIO import StringIO
+
 # Logging levels for easy access
 CRITICAL = logging.CRITICAL
 FATAL = logging.FATAL
@@ -14,10 +19,6 @@ INFO = logging.INFO
 DEBUG = logging.DEBUG
 NOTSET = logging.NOTSET
 
-# File log rotation settings
-ROTATE_AMOUNT = 10  # Only keep the past 9 + 1 active
-ROTATE_SIZE = 10 * 1024 * 1024  # 10 MB
-
 
 class ConsoleFormatter(logging.Formatter):
 
@@ -31,50 +32,39 @@ class ConsoleFormatter(logging.Formatter):
         record.message = record.getMessage()
         rdict = dict(record.__dict__)
         rdict['minilevelname'] = self._get_mini_level(record)
-        # Skipping exception info for the console...
         return self._fmt % (rdict)
 
 
-def setupLogging(level, filename=None, filelevel=logging.DEBUG):
-    root = getLogger()
-    consolelg = logging.StreamHandler(sys.stdout)
-    consolelg.setFormatter(ConsoleFormatter('%(minilevelname)s%(message)s'))
-    consolelg.setLevel(level)
-    root.addHandler(consolelg)
-    if filename:
-        filelg = logging.handlers.RotatingFileHandler(filename, maxBytes=ROTATE_SIZE, backupCount=ROTATE_AMOUNT)
-        filelg.setFormatter(logging.Formatter('%(levelname)s: @%(name)s : %(message)s'))
-        filelg.setLevel(filelevel)
-        root.addHandler(filelg)
-    root.setLevel(level)
-
-
-def logging_set_from_cfg(cfg):
+def setupLogging(cfg):
     log_cfgs = []
-    logcfg = util.get_cfg_option_str(cfg, "log_cfg", False)
-    if logcfg:
+    log_cfg = cfg.get('logcfg')
+    if log_cfg:
         # if there is a 'logcfg' entry in the config, respect
         # it, it is the old keyname
-        log_cfgs = [logcfg]
+        log_cfgs = [log_cfg]
     elif "log_cfgs" in cfg:
         for cfg in cfg['log_cfgs']:
             if isinstance(cfg, list):
                 log_cfgs.append('\n'.join(cfg))
             else:
-                log_cfgs.append()
+                log_cfgs.append(cfg)
 
     if not len(log_cfgs):
         sys.stderr.write("Warning, no logging configured\n")
         return
 
+    am_worked = 0
     for logcfg in log_cfgs:
         try:
-            logging.config.fileConfig(StringIO.StringIO(logcfg))
-            return
+            if not os.path.isfile(logcfg):
+                logcfg = StringIO(logcfg)
+            logging.config.fileConfig(logcfg)
+            am_worked += 1
         except:
             pass
 
-    raise Exception("no valid logging found\n")
+    if not am_worked:
+        sys.stderr.write("Warning, no logging configured\n")
 
 
 def getLogger(name='cloudinit'):

From ff9b73c1936854daac61ad2fd167418be042e320 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 17:59:31 -0700
Subject: [PATCH 021/434] Ensure files end with ".tmpl" if they don't
 initially.

---
 cloudinit/templater.py | 11 +++++++----
 1 file changed, 7 insertions(+), 4 deletions(-)

diff --git a/cloudinit/templater.py b/cloudinit/templater.py
index b6b320ab..5a3563a2 100644
--- a/cloudinit/templater.py
+++ b/cloudinit/templater.py
@@ -2,14 +2,17 @@ import os
 
 from Cheetah.Template import Template
 
+from cloudinit import settings
 from cloudinit import util
 
-TEMPLATE_DIR = '/etc/cloud/templates/'
-
 
 def render_to_file(template, outfile, searchList):
-    contents = Template(file=os.path.join(TEMPLATE_DIR, template),
-                 searchList=[searchList]).respond()
+    fn = template
+    (base, ext) = os.path.splitext(fn)
+    if ext != ".tmpl":
+        fn = "%s.tmpl" % (fn)
+    fn = os.path.join(settings.TEMPLATE_DIR, fn)
+    contents = Template(file=fn, searchList=[searchList]).respond()
     util.write_file(outfile, contents)
 
 

From 285660490d126b8a6e1917b7d90187e15fcbf26e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:00:52 -0700
Subject: [PATCH 022/434] Cleaning this up, logic should be more sound around
 attempts and retries now.

---
 cloudinit/url_helper.py | 30 +++++++++++++-----------------
 1 file changed, 13 insertions(+), 17 deletions(-)

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 0f0a9d0c..ed78c92e 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -1,15 +1,11 @@
 import errno
-import httplib
 import time
 import urllib
 import urllib2
 
-from StringIO import StringIO
-
 from contextlib import closing
 
 from cloudinit import log as logging
-from cloudinit import shell as sh
 
 LOG = logging.getLogger(__name__)
 
@@ -18,7 +14,7 @@ def ok_http_code(st):
     return st in xrange(200, 400)
 
 
-def readurl(url, data=None, timeout=None, retries=0, sec_between=1, read_cb=None, headers=None):
+def readurl(url, data=None, timeout=None, retries=0, sec_between=1, headers=None):
     openargs = {}
     if timeout is not None:
         openargs['timeout'] = int(timeout)
@@ -31,14 +27,13 @@ def readurl(url, data=None, timeout=None, retries=0, sec_between=1, read_cb=None
     if retries <= 0:
         retries = 1
 
+    attempts = retries + 1
     last_excp = None
-    LOG.debug("Attempting to read from %s with %s attempts to be performed", url, retries)
-    for i in range(0, retries):
+    LOG.debug("Attempting to read from %s with %s attempts to be performed", url, attempts)
+    for i in range(0, attempts):
         try:
             with closing(urllib2.urlopen(req, **openargs)) as rh:
-                ofh = StringIO()
-                sh.pipe_in_out(rh, ofh, chunk_cb=read_cb)
-                return (ofh.getvalue(), rh.getcode())
+                return (rh.read(), rh.getcode())
         except urllib2.HTTPError as e:
             last_excp = e
             LOG.exception("Failed at reading from %s.", url)
@@ -51,11 +46,12 @@ def readurl(url, data=None, timeout=None, retries=0, sec_between=1, read_cb=None
             else:
                 last_excp = e
             LOG.exception("Failed at reading from %s.", url)
-        LOG.debug("Please wait %s seconds while we wait to try again.", sec_between)
-        time.sleep(sec_between)
+        if i + 1 < attempts:
+            LOG.debug("Please wait %s seconds while we wait to try again.", sec_between)
+            time.sleep(sec_between)
 
     # Didn't work out
-    LOG.warn("Failed downloading from %s after %s attempts", url, i + 1)
+    LOG.warn("Failed downloading from %s after %s attempts", url, attempts)
     if last_excp is not None:
         raise last_excp
 
@@ -118,11 +114,11 @@ def wait_for_url(urls, max_wait=None, timeout=None,
                 else:
                     headers = {}
 
-                (resp, status_code) = readurl(url, headers=headers, timeout=timeout)
+                (resp, sc) = readurl(url, headers=headers, timeout=timeout)
                 if not resp:
-                    reason = "empty response [%s]" % status_code
-                elif not ok_http_code(status_code):
-                    reason = "bad status code [%s]" % status_code
+                    reason = "empty response [%s]" % sc
+                elif not ok_http_code(sc):
+                    reason = "bad status code [%s]" % sc
                 else:
                     return url
             except urllib2.HTTPError as e:

From beeb6594241cf6c9b5ac3a6c4b612b5336ba4df9 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:01:24 -0700
Subject: [PATCH 023/434] Large amounts of refactoring.

There is now a class that processes the user data down to a MIME message, plus a few small utility functions for walking the message and determining content types.

Large amount of content type cleanups & constant creation.
---
 cloudinit/user_data.py | 395 +++++++++++++++++++++--------------------
 1 file changed, 202 insertions(+), 193 deletions(-)

diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index ec914480..f35e5d38 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -18,19 +18,23 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import email
+import hashlib
+import os
+import urllib
 
+import email
 from email.mime.multipart import MIMEMultipart
 from email.mime.text import MIMEText
 from email.mime.base import MIMEBase
+
 import yaml
-import cloudinit
-import cloudinit.util as util
-import hashlib
-import urllib
+
+from cloudinit import url_helper
+from cloudinit import util
 
 
-starts_with_mappings = {
+# Different file beginnings to there content type
+INCLUSION_TYPES_MAP = {
     '#include': 'text/x-include-url',
     '#include-once': 'text/x-include-once-url',
     '#!': 'text/x-shellscript',
@@ -41,170 +45,210 @@ starts_with_mappings = {
     '#cloud-config-archive': 'text/cloud-config-archive',
 }
 
+# Various special content types
+TYPE_NEEDED = ["text/plain", "text/x-not-multipart"]
+INCLUDE_TYPES = ['text/x-include-url', 'text/x-include-once-url']
+ARCHIVE_TYPES = ["text/cloud-config-archive"]
+UNDEF_TYPE = "text/plain"
+ARCHIVE_UNDEF_TYPE = "text/cloud-config"
+NOT_MULTIPART_TYPE = "text/x-not-multipart"
+OCTET_TYPE = 'application/octet-stream'
 
-# if 'string' is compressed return decompressed otherwise return it
-def decomp_str(string):
-    import StringIO
-    import gzip
-    try:
-        uncomp = gzip.GzipFile(None, "rb", 1, StringIO.StringIO(string)).read()
-        return(uncomp)
-    except:
-        return(string)
+# Sorted longest first
+INCLUSION_SRCH = sorted(INCLUSION_TYPES_MAP.keys(), key=(lambda e: 0 - len(e)))
+
+# Msg header used to track attachments
+ATTACHMENT_FIELD = 'Number-Attachments'
+
+# This will be used to create a filename from a url (or like) entry
+# When we want to make sure a entry isn't included more than once across sessions.
+INCLUDE_ONCE_HASHER = 'md5'
+
+# For those pieces without filenames
+PART_FN_TPL = 'part-%03d'
 
 
-def do_include(content, appendmsg):
-    import os
-    # is just a list of urls, one per line
-    # also support '#include <url here>'
-    includeonce = False
-    for line in content.splitlines():
-        if line == "#include":
-            continue
-        if line == "#include-once":
-            includeonce = True
-            continue
-        if line.startswith("#include-once"):
-            line = line[len("#include-once"):].lstrip()
-            includeonce = True
-        elif line.startswith("#include"):
-            line = line[len("#include"):].lstrip()
-        if line.startswith("#"):
-            continue
-        if line.strip() == "":
-            continue
+class UserDataProcessor(object):
+    def __init__(self, paths):
+        self.paths = paths
 
-        # urls cannot not have leading or trailing white space
-        msum = hashlib.md5()  # pylint: disable=E1101
-        msum.update(line.strip())
-        includeonce_filename = "%s/urlcache/%s" % (
-            cloudinit.get_ipath_cur("data"), msum.hexdigest())
-        try:
-            if includeonce and os.path.isfile(includeonce_filename):
-                with open(includeonce_filename, "r") as fp:
-                    content = fp.read()
-            else:
-                content = urllib.urlopen(line).read()
-                if includeonce:
-                    util.write_file(includeonce_filename, content, mode=0600)
-        except Exception:
-            raise
+    def process(self, blob):
+        base_msg = convert_string(blob)
+        process_msg = MIMEMultipart()
+        self._process_msg(base_msg, process_msg)
+        return process_msg
 
-        process_includes(message_from_string(decomp_str(content)), appendmsg)
-
-
-def explode_cc_archive(archive, appendmsg):
-    for ent in yaml.load(archive):
-        # ent can be one of:
-        #  dict { 'filename' : 'value', 'content' : 'value', 'type' : 'value' }
-        #    filename and type not be present
-        # or
-        #  scalar(payload)
-
-        def_type = "text/cloud-config"
-        if isinstance(ent, str):
-            ent = {'content': ent}
-
-        content = ent.get('content', '')
-        mtype = ent.get('type', None)
-        if mtype == None:
-            mtype = type_from_startswith(content, def_type)
-
-        maintype, subtype = mtype.split('/', 1)
-        if maintype == "text":
-            msg = MIMEText(content, _subtype=subtype)
-        else:
-            msg = MIMEBase(maintype, subtype)
-            msg.set_payload(content)
-
-        if 'filename' in ent:
-            msg.add_header('Content-Disposition', 'attachment',
-                           filename=ent['filename'])
-
-        for header in ent.keys():
-            if header in ('content', 'filename', 'type'):
+    def _process_msg(self, base_msg, append_msg):
+        for part in base_msg.walk():
+            # multipart/* are just containers
+            if part.get_content_maintype() == 'multipart':
                 continue
-            msg.add_header(header, ent['header'])
+    
+            ctype = None
+            ctype_orig = part.get_content_type()
+            payload = part.get_payload(decode=True)
+    
+            if not ctype_orig:
+                ctype_orig = UNDEF_TYPE
+    
+            if ctype_orig in TYPE_NEEDED:
+                ctype = type_from_starts_with(payload)
+    
+            if ctype is None:
+                ctype = ctype_orig
+    
+            if ctype in INCLUDE_TYPES:
+                self._do_include(payload, append_msg)
+                continue
+    
+            if ctype in ARCHIVE_TYPES:
+                self._explode_archive(payload, append_msg)
+                continue
+    
+            if 'Content-Type' in base_msg:
+                base_msg.replace_header('Content-Type', ctype)
+            else:
+                base_msg['Content-Type'] = ctype
+    
+            self._attach_part(append_msg, part)
 
-        _attach_part(appendmsg, msg)
+    def _get_include_once_filename(self, entry):
+        msum = hashlib.new(INCLUDE_ONCE_HASHER)
+        msum.update(entry)
+        entry_fn = msum.hexdigest()[0:64]  # Don't get to long now
+        return os.path.join(self.paths.get_ipath_cur('data'), 'urlcache', entry_fn)
+
+    def _do_include(self, content, append_msg):
+        # is just a list of urls, one per line
+        # also support '#include <url here>'
+        for line in content.splitlines():
+            includeonce = False
+            if line in ("#include", "#include-once"):
+                continue
+            if line.startswith("#include-once"):
+                line = line[len("#include-once"):].lstrip()
+                includeonce = True
+            elif line.startswith("#include"):
+                line = line[len("#include"):].lstrip()
+            if line.startswith("#"):
+                continue
+            include_url = line.strip()
+            if not include_url:
+                continue
+
+            includeonce_filename = self._get_include_once_filename(include_url)
+            if includeonce and os.path.isfile(includeonce_filename):
+                content = util.load_file(includeonce_filename)
+            else:
+                (content, st) = url_helper.readurl(include_url)
+                if includeonce and url_helper.ok_http_code(st):
+                    util.write_file(includeonce_filename, content, mode=0600)
+                if not url_helper.ok_http_code(st):
+                    content = ''
+
+            new_msg = convert_string(content)
+            self._process_msg(new_msg, append_msg)
+
+    def _explode_archive(self, archive, append_msg):
+        try:
+            entries = yaml.load(archive)
+        except:
+            entries = []
+        if not isinstance(entries, (list, set)):
+            # TODO raise?
+            entries = []
+
+        for ent in entries:
+            # ent can be one of:
+            #  dict { 'filename' : 'value', 'content' : 'value', 'type' : 'value' }
+            #    filename and type not be present
+            # or
+            #  scalar(payload)
+            if isinstance(ent, str):
+                ent = {'content': ent}
+            if not isinstance(ent, (dict)):
+                # TODO raise?
+                continue
+
+            content = ent.get('content', '')
+            mtype = ent.get('type')
+            if not mtype:
+                mtype = type_from_starts_with(content, ARCHIVE_UNDEF_TYPE)
+
+            maintype, subtype = mtype.split('/', 1)
+            if maintype == "text":
+                msg = MIMEText(content, _subtype=subtype)
+            else:
+                msg = MIMEBase(maintype, subtype)
+                msg.set_payload(content)
+
+            if 'filename' in ent:
+                msg.add_header('Content-Disposition', 'attachment', filename=ent['filename'])
+
+            for header in ent.keys():
+                if header in ('content', 'filename', 'type'):
+                    continue
+                msg.add_header(header, ent['header'])
+
+            self._attach_part(append_msg, msg)
+
+    def _multi_part_count(self, outer_msg, new_count=None):
+        """
+        Return the number of attachments to this MIMEMultipart by looking
+        at its 'Number-Attachments' header.
+        """
+        if ATTACHMENT_FIELD not in outer_msg:
+            outer_msg[ATTACHMENT_FIELD] = str(0)
+    
+        if new_count is not None:
+            outer_msg.replace_header(ATTACHMENT_FIELD, str(new_count))
+    
+        fetched_count = 0
+        try:
+            fetched_count = int(outer_msg.get(ATTACHMENT_FIELD))
+        except (ValueError, TypeError):
+            outer_msg.replace_header(ATTACHMENT_FIELD, str(fetched_count))
+        return fetched_count
+
+    def _attach_part(self, outer_msg, part):
+        """
+        Attach an part to an outer message. outermsg must be a MIMEMultipart.
+        Modifies a header in the message to keep track of number of attachments.
+        """
+        cur = self._multi_part_count(outer_msg)
+        if not part.get_filename():
+            part.add_header('Content-Disposition', 'attachment', filename=PART_FN_TPL % (cur + 1))
+        outer_msg.attach(part)
+        self._multi_part_count(outer_msg, cur + 1)
 
 
-def multi_part_count(outermsg, newcount=None):
-    """
-    Return the number of attachments to this MIMEMultipart by looking
-    at its 'Number-Attachments' header.
-    """
-    nfield = 'Number-Attachments'
-    if nfield not in outermsg:
-        outermsg[nfield] = "0"
-
-    if newcount != None:
-        outermsg.replace_header(nfield, str(newcount))
-
-    return(int(outermsg.get('Number-Attachments', 0)))
-
-
-def _attach_part(outermsg, part):
-    """
-    Attach an part to an outer message. outermsg must be a MIMEMultipart.
-    Modifies a header in outermsg to keep track of number of attachments.
-    """
-    cur = multi_part_count(outermsg)
-    if not part.get_filename(None):
-        part.add_header('Content-Disposition', 'attachment',
-            filename='part-%03d' % (cur + 1))
-    outermsg.attach(part)
-    multi_part_count(outermsg, cur + 1)
-
-
-def type_from_startswith(payload, default=None):
-    # slist is sorted longest first
-    slist = sorted(starts_with_mappings.keys(), key=lambda e: 0 - len(e))
-    for sstr in slist:
-        if payload.startswith(sstr):
-            return(starts_with_mappings[sstr])
-    return default
-
-
-def process_includes(msg, appendmsg=None):
-    if appendmsg == None:
-        appendmsg = MIMEMultipart()
-
-    for part in msg.walk():
+# Callback is a function that will be called with 
+# (data, content_type, filename, payload)
+def walk(ud_msg, callback, data):
+    partnum = 0
+    for part in ud_msg.walk():
         # multipart/* are just containers
         if part.get_content_maintype() == 'multipart':
             continue
 
-        ctype = None
-        ctype_orig = part.get_content_type()
-
-        payload = part.get_payload(decode=True)
-
-        if ctype_orig in ("text/plain", "text/x-not-multipart"):
-            ctype = type_from_startswith(payload)
-
+        ctype = part.get_content_type()
         if ctype is None:
-            ctype = ctype_orig
+            ctype = OCTET_TYPE
 
-        if ctype in ('text/x-include-url', 'text/x-include-once-url'):
-            do_include(payload, appendmsg)
-            continue
+        filename = part.get_filename()
+        if not filename:
+            filename = PART_FN_TPL % partnum
 
-        if ctype == "text/cloud-config-archive":
-            explode_cc_archive(payload, appendmsg)
-            continue
-
-        if 'Content-Type' in msg:
-            msg.replace_header('Content-Type', ctype)
-        else:
-            msg['Content-Type'] = ctype
-
-        _attach_part(appendmsg, part)
+        callback(data, ctype, filename, part.get_payload(decode=True))
+        partnum = partnum + 1
 
 
-def message_from_string(data, headers=None):
-    if headers is None:
+def convert_string(self, raw_data, headers=None):
+    if not data:
+        data = ''
+    if not headers:
         headers = {}
+    data = util.decomp_str(raw_data)
     if "mime-version:" in data[0:4096].lower():
         msg = email.message_from_string(data)
         for (key, val) in headers.items():
@@ -213,50 +257,15 @@ def message_from_string(data, headers=None):
             else:
                 msg[key] = val
     else:
-        mtype = headers.get("Content-Type", "text/x-not-multipart")
+        mtype = headers.get("Content-Type", NOT_MULTIPART_TYPE)
         maintype, subtype = mtype.split("/", 1)
         msg = MIMEBase(maintype, subtype, *headers)
         msg.set_payload(data)
-
-    return(msg)
+    return msg
 
 
-# this is heavily wasteful, reads through userdata string input
-def preprocess_userdata(data):
-    newmsg = MIMEMultipart()
-    process_includes(message_from_string(decomp_str(data)), newmsg)
-    return(newmsg.as_string())
-
-
-# callback is a function that will be called with (data, content_type,
-# filename, payload)
-def walk_userdata(istr, callback, data=None):
-    partnum = 0
-    for part in message_from_string(istr).walk():
-        # multipart/* are just containers
-        if part.get_content_maintype() == 'multipart':
-            continue
-
-        ctype = part.get_content_type()
-        if ctype is None:
-            ctype = 'application/octet-stream'
-
-        filename = part.get_filename()
-        if not filename:
-            filename = 'part-%03d' % partnum
-
-        callback(data, ctype, filename, part.get_payload(decode=True))
-
-        partnum = partnum + 1
-
-
-if __name__ == "__main__":
-    def main():
-        import sys
-        data = decomp_str(file(sys.argv[1]).read())
-        newmsg = MIMEMultipart()
-        process_includes(message_from_string(data), newmsg)
-        print newmsg
-        print "#found %s parts" % multi_part_count(newmsg)
-
-    main()
+def type_from_starts_with(payload, default=None):
+    for text in INCLUSION_SRCH:
+        if payload.startswith(text):
+            return INCLUSION_TYPES_MAP[text]
+    return default

From e07f581f4f3bb3869f36f3629da625a2f8076f70 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:02:29 -0700
Subject: [PATCH 024/434] Moved the shell functionality back in here.

---
 cloudinit/util.py | 951 +++++++++++++++++++++-------------------------
 1 file changed, 437 insertions(+), 514 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 47397418..265a3a97 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -18,24 +18,24 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import yaml
+from StringIO import StringIO
+
+import contextlib
+import grp
+import gzip
 import os
-import os.path
+import platform
+import pwd
 import shutil
-import errno
 import subprocess
-from Cheetah.Template import Template
-import urllib2
-import urllib
-import logging
-import re
-import socket
-import sys
-import time
-import tempfile
-import traceback
 import urlparse
 
+import yaml
+
+from cloudinit import log as logging
+from cloudinit import url_helper as uhelp
+
+
 try:
     import selinux
     HAVE_LIBSELINUX = True
@@ -43,53 +43,153 @@ except ImportError:
     HAVE_LIBSELINUX = False
 
 
+LOG = logging.getLogger(__name__)
+
+# Helps cleanup filenames to ensure they aren't FS incompatible
+FN_REPLACEMENTS = {
+    os.sep: '_',
+}
+
+
+class ProcessExecutionError(IOError):
+
+    MESSAGE_TMPL = ('%(description)s\nCommand: %(cmd)s\n'
+                    'Exit code: %(exit_code)s\nStdout: %(stdout)r\n'
+                    'Stderr: %(stderr)r')
+
+    def __init__(self, stdout=None, stderr=None,
+                 exit_code=None, cmd=None,
+                 description=None, reason=None):
+        if not cmd:
+            self.cmd = '-'
+        else:
+            self.cmd = cmd
+
+        if not description:
+            self.description = 'Unexpected error while running command.'
+        else:
+            self.description = description
+
+        if not isinstance(exit_code, (long, int)):
+            self.exit_code = '-'
+        else:
+            self.exit_code = exit_code
+
+        if not stderr:
+            self.stderr = ''
+        else:
+            self.stderr = stderr
+
+        if not stdout:
+            self.stdout = ''
+        else:
+            self.stdout = stdout
+
+        message = self.MESSAGE_TMPL % {
+            'description': self.description,
+            'cmd': self.cmd,
+            'exit_code': self.exit_code,
+            'stdout': self.stdout,
+            'stderr': self.stderr,
+        }
+        IOError.__init__(self, message)
+        self.reason = reason
+
+
+class _SeLinuxGuard(object):
+    def __init__(self, path, recursive=False):
+        self.path = path
+        self.recursive = recursive
+        self.engaged = False
+        if HAVE_LIBSELINUX and selinux.is_selinux_enabled():
+            self.engaged = True
+
+    def __enter__(self):
+        return self.engaged
+
+    def __exit__(self, type, value, traceback):
+        if self.engaged:
+            LOG.debug("Disengaging selinux mode for %s: %s", self.path, self.recursive)
+            selinux.restorecon(self.path, recursive=self.recursive)
+
+
+def translate_bool(val):
+    if not val:
+        return False
+    if val is isinstance(val, bool):
+        return val
+    if str(val).lower().strip() in ['true', '1', 'on', 'yes']:
+        return True
+    return False
+
+
 def read_conf(fname):
     try:
-        stream = open(fname, "r")
-        conf = yaml.load(stream)
-        stream.close()
-        return conf
+        mp = yaml.load(load_file(fname))
+        if not isinstance(mp, (dict)):
+            return {}
+        return mp
     except IOError as e:
         if e.errno == errno.ENOENT:
             return {}
         raise
 
 
-def get_base_cfg(cfgfile, cfg_builtin="", parsed_cfgs=None):
-    kerncfg = {}
-    syscfg = {}
+def clean_filename(fn):
+    for (k, v) in FN_REPLACEMENTS.items():
+        fn = fn.replace(k, v)
+    return fn.strip()
+
+
+def decomp_str(data):
+    try:
+        uncomp = gzip.GzipFile(None, "rb", 1, StringIO(data)).read()
+        return uncomp
+    except:
+        return data
+
+
+def is_ipv4(instr):
+    """ determine if input string is a ipv4 address. return boolean"""
+    toks = instr.split('.')
+    if len(toks) != 4:
+        return False
+
+    try:
+        toks = [x for x in toks if (int(x) < 256 and int(x) > 0)]
+    except:
+        return False
+
+    return (len(toks) == 4)
+
+
+def get_base_cfg(cfgfile, cfg_builtin=None, parsed_cfgs=None):
     if parsed_cfgs and cfgfile in parsed_cfgs:
-        return(parsed_cfgs[cfgfile])
+        return parsed_cfgs[cfgfile]
 
     syscfg = read_conf_with_confd(cfgfile)
-
     kern_contents = read_cc_from_cmdline()
+    kerncfg = {}
     if kern_contents:
         kerncfg = yaml.load(kern_contents)
 
     # kernel parameters override system config
     combined = mergedict(kerncfg, syscfg)
-
     if cfg_builtin:
-        builtin = yaml.load(cfg_builtin)
-        fin = mergedict(combined, builtin)
+        fin = mergedict(combined, cfg_builtin)
     else:
         fin = combined
 
-    if parsed_cfgs != None:
+    # Cache it?
+    if parsed_cfgs:
         parsed_cfgs[cfgfile] = fin
-    return(fin)
+    return fin
 
 
 def get_cfg_option_bool(yobj, key, default=False):
     if key not in yobj:
         return default
-    val = yobj[key]
-    if val is True:
-        return True
-    if str(val).lower() in ['true', '1', 'on', 'yes']:
-        return True
-    return False
+    return translate_bool(yobj[key])
 
 
 def get_cfg_option_str(yobj, key, default=None):
@@ -98,6 +198,15 @@ def get_cfg_option_str(yobj, key, default=None):
     return yobj[key]
 
 
+def system_info():
+    return {
+        'platform': platform.platform(),
+        'release': platform.release(),
+        'python': platform.python_version(),
+        'uname': platform.uname(),
+    }
+
+
 def get_cfg_option_list_or_str(yobj, key, default=None):
     """
     Gets the C{key} config option from C{yobj} as a list of strings. If the
@@ -127,7 +236,7 @@ def get_cfg_by_path(yobj, keyp, default=None):
         if tok not in cur:
             return(default)
         cur = cur[tok]
-    return(cur)
+    return cur
 
 
 def mergedict(src, cand):
@@ -141,50 +250,29 @@ def mergedict(src, cand):
                 src[k] = v
             else:
                 src[k] = mergedict(src[k], v)
+    else:
+        if not isinstance(src, dict):
+            raise TypeError("Attempting to merge a non dictionary source type: %s" % (type(src)))
+        if not isinstance(cand, dict):
+            raise TypeError("Attempting to merge a non dictionary candiate type: %s" % (type(cand)))
     return src
 
 
-def delete_dir_contents(dirname):
-    """
-    Deletes all contents of a directory without deleting the directory itself.
-
-    @param dirname: The directory whose contents should be deleted.
-    """
-    for node in os.listdir(dirname):
-        node_fullpath = os.path.join(dirname, node)
-        if os.path.isdir(node_fullpath):
-            shutil.rmtree(node_fullpath)
-        else:
-            os.unlink(node_fullpath)
-
-
-def write_file(filename, content, mode=0644, omode="wb"):
-    """
-    Writes a file with the given content and sets the file mode as specified.
-    Resotres the SELinux context if possible.
-
-    @param filename: The full path of the file to write.
-    @param content: The content to write to the file.
-    @param mode: The filesystem mode to set on the file.
-    @param omode: The open mode used when opening the file (r, rb, a, etc.)
-    """
+@contextlib.contextmanager
+def tempdir(**kwargs):
+    # This seems like it was only added in python 3.2
+    # Make it since its useful...
+    # See: http://bugs.python.org/file12970/tempdir.patch
+    tdir = tempfile.mkdtemp(**kwargs)
     try:
-        os.makedirs(os.path.dirname(filename))
-    except OSError as e:
-        if e.errno != errno.EEXIST:
-            raise e
-
-    f = open(filename, omode)
-    if mode is not None:
-        os.chmod(filename, mode)
-    f.write(content)
-    f.close()
-    restorecon_if_possible(filename)
+        yield tdir
+    finally:
+        del_dir(tdir)
 
 
-def restorecon_if_possible(path, recursive=False):
-    if HAVE_LIBSELINUX and selinux.is_selinux_enabled():
-        selinux.restorecon(path, recursive=recursive)
+def del_dir(path):
+    LOG.debug("Recursively deleting %s", path)
+    shutil.rmtree(path)
 
 
 # get keyid from keyserver
@@ -202,7 +290,8 @@ def getkeybyid(keyid, keyserver):
     [ -n "${armour}" ] && echo "${armour}"
     """
     args = ['sh', '-c', shcmd, "export-gpg-keyid", keyid, keyserver]
-    return(subp(args)[0])
+    (stdout, stderr) = subp(args)
+    return stdout
 
 
 def runparts(dirp, skip_no_exist=True):
@@ -210,38 +299,19 @@ def runparts(dirp, skip_no_exist=True):
         return
 
     failed = 0
+    attempted = 0
     for exe_name in sorted(os.listdir(dirp)):
         exe_path = os.path.join(dirp, exe_name)
         if os.path.isfile(exe_path) and os.access(exe_path, os.X_OK):
-            popen = subprocess.Popen([exe_path])
-            popen.communicate()
-            if popen.returncode is not 0:
+            attempted += 1
+            try:
+                subp([exe_path])
+            except ProcessExecutionError as e:
+                LOG.exception("Failed running %s [%i]", exe_path, e.exit_code)
                 failed += 1
-                sys.stderr.write("failed: %s [%i]\n" %
-                    (exe_path, popen.returncode))
-    if failed:
-        raise RuntimeError('runparts: %i failures' % failed)
 
-
-def subp(args, input_=None):
-    sp = subprocess.Popen(args, stdout=subprocess.PIPE,
-        stderr=subprocess.PIPE, stdin=subprocess.PIPE)
-    out, err = sp.communicate(input_)
-    if sp.returncode is not 0:
-        raise subprocess.CalledProcessError(sp.returncode, args, (out, err))
-    return(out, err)
-
-
-def render_to_file(template, outfile, searchList):
-    t = Template(file='/etc/cloud/templates/%s.tmpl' % template,
-                 searchList=[searchList])
-    f = open(outfile, 'w')
-    f.write(t.respond())
-    f.close()
-
-
-def render_string(template, searchList):
-    return(Template(template, searchList=[searchList]).respond())
+    if failed and attempted:
+        raise RuntimeError('runparts: %i failures in %i attempted commands' % (failed, attempted))
 
 
 # read_optional_seed
@@ -254,13 +324,12 @@ def read_optional_seed(fill, base="", ext="", timeout=5):
         fill['user-data'] = ud
         fill['meta-data'] = md
         return True
-    except OSError, e:
+    except OSError as e:
         if e.errno == errno.ENOENT:
             return False
         raise
 
 
-# raise OSError with enoent if not found
 def read_seeded(base="", ext="", timeout=5, retries=10, file_retries=0):
     if base.startswith("/"):
         base = "file://%s" % base
@@ -276,89 +345,14 @@ def read_seeded(base="", ext="", timeout=5, retries=10, file_retries=0):
         ud_url = "%s%s%s" % (base, "user-data", ext)
         md_url = "%s%s%s" % (base, "meta-data", ext)
 
-    no_exc = object()
-    raise_err = no_exc
-    for attempt in range(0, retries + 1):
-        try:
-            md_str = readurl(md_url, timeout=timeout)
-            ud = readurl(ud_url, timeout=timeout)
-            md = yaml.load(md_str)
-
-            return(md, ud)
-        except urllib2.HTTPError as e:
-            raise_err = e
-        except urllib2.URLError as e:
-            raise_err = e
-            if (isinstance(e.reason, OSError) and
-                e.reason.errno == errno.ENOENT):
-                raise_err = e.reason
-
-        if attempt == retries:
-            break
-
-        #print "%s failed, sleeping" % attempt
-        time.sleep(1)
-
-    raise(raise_err)
-
-
-def logexc(log, lvl=logging.DEBUG):
-    log.log(lvl, traceback.format_exc())
-
-
-class RecursiveInclude(Exception):
-    pass
-
-
-def read_file_with_includes(fname, rel=".", stack=None, patt=None):
-    if stack is None:
-        stack = []
-    if not fname.startswith("/"):
-        fname = os.sep.join((rel, fname))
-
-    fname = os.path.realpath(fname)
-
-    if fname in stack:
-        raise(RecursiveInclude("%s recursively included" % fname))
-    if len(stack) > 10:
-        raise(RecursiveInclude("%s included, stack size = %i" %
-                               (fname, len(stack))))
-
-    if patt == None:
-        patt = re.compile("^#(opt_include|include)[ \t].*$", re.MULTILINE)
-
-    try:
-        fp = open(fname)
-        contents = fp.read()
-        fp.close()
-    except:
-        raise
-
-    rel = os.path.dirname(fname)
-    stack.append(fname)
-
-    cur = 0
-    while True:
-        match = patt.search(contents[cur:])
-        if not match:
-            break
-        loc = match.start() + cur
-        endl = match.end() + cur
-
-        (key, cur_fname) = contents[loc:endl].split(None, 2)
-        cur_fname = cur_fname.strip()
-
-        try:
-            inc_contents = read_file_with_includes(cur_fname, rel, stack, patt)
-        except IOError, e:
-            if e.errno == errno.ENOENT and key == "#opt_include":
-                inc_contents = ""
-            else:
-                raise
-        contents = contents[0:loc] + inc_contents + contents[endl + 1:]
-        cur = loc + len(inc_contents)
-    stack.pop()
-    return(contents)
+    (md_str, msc) = uhelp.readurl(md_url, timeout=timeout, retries=retries)
+    (ud, usc) = uhelp.readurl(ud_url, timeout=timeout, retries=retries)
+    md = None
+    if md_str and uhelp.ok_http_code(msc):
+        md = yaml.load(md_str)
+    if not uhelp.ok_http_code(usc):
+        ud = None
+    return (md, ud)
 
 
 def read_conf_d(confd):
@@ -369,46 +363,32 @@ def read_conf_d(confd):
     confs = [f for f in confs if f.endswith(".cfg")]
 
     # remove anything not a file
-    confs = [f for f in confs if os.path.isfile("%s/%s" % (confd, f))]
+    confs = [f for f in confs if os.path.isfile(os.path.join(confd, f))]
 
     cfg = {}
     for conf in confs:
-        cfg = mergedict(cfg, read_conf("%s/%s" % (confd, conf)))
+        cfg = mergedict(cfg, read_conf(os.path.join(confd, conf)))
 
-    return(cfg)
+    return cfg
 
 
 def read_conf_with_confd(cfgfile):
     cfg = read_conf(cfgfile)
+
     confd = False
     if "conf_d" in cfg:
         if cfg['conf_d'] is not None:
             confd = cfg['conf_d']
             if not isinstance(confd, str):
-                raise Exception("cfgfile %s contains 'conf_d' "
+                raise RuntimeError("cfgfile %s contains 'conf_d' "
                                 "with non-string" % cfgfile)
     elif os.path.isdir("%s.d" % cfgfile):
         confd = "%s.d" % cfgfile
 
     if not confd:
-        return(cfg)
+        return cfg
 
-    confd_cfg = read_conf_d(confd)
-
-    return(mergedict(confd_cfg, cfg))
-
-
-def get_cmdline():
-    if 'DEBUG_PROC_CMDLINE' in os.environ:
-        cmdline = os.environ["DEBUG_PROC_CMDLINE"]
-    else:
-        try:
-            cmdfp = open("/proc/cmdline")
-            cmdline = cmdfp.read().strip()
-            cmdfp.close()
-        except:
-            cmdline = ""
-    return(cmdline)
+    return mergedict(read_conf_d(confd), cfg)
 
 
 def read_cc_from_cmdline(cmdline=None):
@@ -439,147 +419,15 @@ def read_cc_from_cmdline(cmdline=None):
 
         begin = cmdline.find(tag_begin, end + end_l)
 
-    return('\n'.join(tokens))
+    return '\n'.join(tokens)
 
 
-def ensure_dirs(dirlist, mode=0755):
-    fixmodes = []
-    for d in dirlist:
-        try:
-            if mode != None:
-                os.makedirs(d)
-            else:
-                os.makedirs(d, mode)
-        except OSError as e:
-            if e.errno != errno.EEXIST:
-                raise
-            if mode != None:
-                fixmodes.append(d)
-
-    for d in fixmodes:
-        os.chmod(d, mode)
-
-
-def chownbyname(fname, user=None, group=None):
-    uid = -1
-    gid = -1
-    if user == None and group == None:
-        return
-    if user:
-        import pwd
-        uid = pwd.getpwnam(user).pw_uid
-    if group:
-        import grp
-        gid = grp.getgrnam(group).gr_gid
-
-    os.chown(fname, uid, gid)
-
-
-def readurl(url, data=None, timeout=None):
-    openargs = {}
-    if timeout != None:
-        openargs['timeout'] = timeout
-
-    if data is None:
-        req = urllib2.Request(url)
-    else:
-        encoded = urllib.urlencode(data)
-        req = urllib2.Request(url, encoded)
-
-    response = urllib2.urlopen(req, **openargs)
-    return(response.read())
-
-
-# shellify, takes a list of commands
-#  for each entry in the list
-#    if it is an array, shell protect it (with single ticks)
-#    if it is a string, do nothing
-def shellify(cmdlist):
-    content = "#!/bin/sh\n"
-    escaped = "%s%s%s%s" % ("'", '\\', "'", "'")
-    for args in cmdlist:
-        # if the item is a list, wrap all items in single tick
-        # if its not, then just write it directly
-        if isinstance(args, list):
-            fixed = []
-            for f in args:
-                fixed.append("'%s'" % str(f).replace("'", escaped))
-            content = "%s%s\n" % (content, ' '.join(fixed))
-        else:
-            content = "%s%s\n" % (content, str(args))
-    return content
-
-
-def dos2unix(string):
+def dos2unix(contents):
     # find first end of line
-    pos = string.find('\n')
-    if pos <= 0 or string[pos - 1] != '\r':
-        return(string)
-    return(string.replace('\r\n', '\n'))
-
-
-def is_container():
-    # is this code running in a container of some sort
-
-    for helper in ('running-in-container', 'lxc-is-container'):
-        try:
-            # try to run a helper program. if it returns true
-            # then we're inside a container. otherwise, no
-            sp = subprocess.Popen(helper, stdout=subprocess.PIPE,
-                                  stderr=subprocess.PIPE)
-            sp.communicate(None)
-            return(sp.returncode == 0)
-        except OSError as e:
-            if e.errno != errno.ENOENT:
-                raise
-
-    # this code is largely from the logic in
-    # ubuntu's /etc/init/container-detect.conf
-    try:
-        # Detect old-style libvirt
-        # Detect OpenVZ containers
-        pid1env = get_proc_env(1)
-        if "container" in pid1env:
-            return True
-
-        if "LIBVIRT_LXC_UUID" in pid1env:
-            return True
-
-    except IOError as e:
-        if e.errno != errno.ENOENT:
-            pass
-
-    # Detect OpenVZ containers
-    if os.path.isdir("/proc/vz") and not os.path.isdir("/proc/bc"):
-        return True
-
-    try:
-        # Detect Vserver containers
-        with open("/proc/self/status") as fp:
-            lines = fp.read().splitlines()
-            for line in lines:
-                if line.startswith("VxID:"):
-                    (_key, val) = line.strip().split(":", 1)
-                    if val != "0":
-                        return True
-    except IOError as e:
-        if e.errno != errno.ENOENT:
-            pass
-
-    return False
-
-
-def get_proc_env(pid):
-    # return the environment in a dict that a given process id was started with
-    env = {}
-    with open("/proc/%s/environ" % pid) as fp:
-        toks = fp.read().split("\0")
-        for tok in toks:
-            if tok == "":
-                continue
-            (name, val) = tok.split("=", 1)
-            env[name] = val
-    return env
+    pos = contents.find('\n')
+    if pos <= 0 or contents[pos - 1] != '\r':
+        return contents
+    return contents.replace('\r\n', '\n')
 
 
 def get_hostname_fqdn(cfg, cloud):
@@ -603,7 +451,7 @@ def get_hostname_fqdn(cfg, cloud):
                 hostname = cfg['hostname']
             else:
                 hostname = cloud.get_hostname()
-    return(hostname, fqdn)
+    return (hostname, fqdn)
 
 
 def get_fqdn_from_hosts(hostname, filename="/etc/hosts"):
@@ -612,26 +460,22 @@ def get_fqdn_from_hosts(hostname, filename="/etc/hosts"):
     # did not have did not have 'bind' in the order attribute
     fqdn = None
     try:
-        with open(filename, "r") as hfp:
-            for line in hfp.readlines():
-                hashpos = line.find("#")
-                if hashpos >= 0:
-                    line = line[0:hashpos]
-                toks = line.split()
-
-                # if there there is less than 3 entries (ip, canonical, alias)
-                # then ignore this line
-                if len(toks) < 3:
-                    continue
-
-                if hostname in toks[2:]:
-                    fqdn = toks[1]
-                    break
-            hfp.close()
+        for line in load_file(filename).splitlines():
+            hashpos = line.find("#")
+            if hashpos >= 0:
+                line = line[0:hashpos]
+            toks = line.split()
+        
+            # if there are fewer than 3 entries (ip, canonical, alias)
+            # then ignore this line
+            if len(toks) < 3:
+                continue
+        
+            if hostname in toks[2:]:
+                fqdn = toks[1]
+                break
     except IOError as e:
-        if e.errno == errno.ENOENT:
-            pass
-
+        pass
     return fqdn
 
 
@@ -646,7 +490,7 @@ def is_resolvable(name):
 
 def is_resolvable_url(url):
     """ determine if this url is resolvable (existing or ip) """
-    return(is_resolvable(urlparse.urlparse(url).hostname))
+    return (is_resolvable(urlparse.urlparse(url).hostname))
 
 
 def search_for_mirror(candidates):
@@ -656,8 +500,7 @@ def search_for_mirror(candidates):
             if is_resolvable_url(cand):
                 return cand
         except Exception:
-            raise
-
+            pass
     return None
 
 
@@ -669,7 +512,7 @@ def close_stdin():
     if _CLOUD_INIT_SAVE_STDIN is set in environment to a non empty or '0' value
     then input will not be closed (only useful potentially for debugging).
     """
-    if os.environ.get("_CLOUD_INIT_SAVE_STDIN") in ("", "0", False):
+    if os.environ.get("_CLOUD_INIT_SAVE_STDIN") in ("", "0", 'False'):
         return
     with open(os.devnull) as fp:
         os.dup2(fp.fileno(), sys.stdin.fileno())
@@ -685,163 +528,244 @@ def find_devs_with(criteria):
     """
     try:
         (out, _err) = subp(['blkid', '-t%s' % criteria, '-odevice'])
-    except subprocess.CalledProcessError:
-        return([])
-    return(str(out).splitlines())
+    except ProcessExecutionError:
+        return []
+    return (out.splitlines())
 
 
-class mountFailedError(Exception):
-    pass
+def load_file(fname, read_cb=None):
+    LOG.debug("Reading from %s", fname)
+    with open(fname, 'rb') as fh:
+        ofh = StringIO()
+        pipe_in_out(fh, ofh, chunk_cb=read_cb)
+        return ofh.getvalue()
 
 
-def mount_callback_umount(device, callback, data=None):
-    """
-    mount the device, call method 'callback' passing the directory
-    in which it was mounted, then unmount.  Return whatever 'callback'
-    returned.  If data != None, also pass data to callback.
-    """
-
-    def _cleanup(umount, tmpd):
-        if umount:
-            try:
-                subp(["umount", '-l', umount])
-            except subprocess.CalledProcessError:
-                raise
-        if tmpd:
-            os.rmdir(tmpd)
-
-    # go through mounts to see if it was already mounted
-    fp = open("/proc/mounts")
-    mounts = fp.readlines()
-    fp.close()
-
-    tmpd = None
-
-    mounted = {}
-    for mpline in mounts:
-        (dev, mp, fstype, _opts, _freq, _passno) = mpline.split()
-        mp = mp.replace("\\040", " ")
-        mounted[dev] = (dev, fstype, mp, False)
-
-    umount = False
-    if device in mounted:
-        mountpoint = "%s/" % mounted[device][2]
+def get_cmdline():
+    if 'DEBUG_PROC_CMDLINE' in os.environ:
+        cmdline = os.environ["DEBUG_PROC_CMDLINE"]
     else:
-        tmpd = tempfile.mkdtemp()
-
-        mountcmd = ["mount", "-o", "ro", device, tmpd]
-
         try:
-            (_out, _err) = subp(mountcmd)
-            umount = tmpd
-        except subprocess.CalledProcessError as exc:
-            _cleanup(umount, tmpd)
-            raise mountFailedError(exc.output[1])
+            cmdline = load_file("/proc/cmdline").strip()
+        except:
+            cmdline = ""
+    return cmdline
 
-        mountpoint = "%s/" % tmpd
+
+def pipe_in_out(in_fh, out_fh, chunk_size=1024, chunk_cb=None):
+    bytes_piped = 0
+    LOG.debug("Transferring the contents of %s to %s in chunks of size %s.", in_fh, out_fh, chunk_size)
+    while True:
+        data = in_fh.read(chunk_size)
+        if data == '':
+            break
+        else:
+            out_fh.write(data)
+            bytes_piped += len(data)
+            if chunk_cb:
+                chunk_cb(bytes_piped)
+    out_fh.flush()
+    return bytes_piped
+
+
+def chownbyid(fname, uid=None, gid=None):
+    if uid is None and gid is None:  # nothing requested; leave ownership alone
+        return
+    LOG.debug("Changing the ownership of %s to %s:%s", fname, uid, gid)
+    os.chown(fname, -1 if uid is None else uid, -1 if gid is None else gid)
+
+
+def chownbyname(fname, user=None, group=None):
+    uid = -1
+    gid = -1
+    if user:
+        uid = pwd.getpwnam(user).pw_uid
+    if group:
+        gid = grp.getgrnam(group).gr_gid
+    chownbyid(fname, uid, gid)
+
+
+def ensure_dirs(dirlist, mode=0755):
+    for d in dirlist:
+        ensure_dir(d, mode)
+
+
+def ensure_dir(path, mode=0755):
+    """Create path (with parents) and chmod it; do nothing if it is a dir."""
+    if not os.path.isdir(path):
+        LOG.debug("Ensuring directory exists at path %s (perms=%s)", path, mode)
+        try:
+            os.makedirs(path)
+        except OSError as e:
+            if e.errno != errno.EEXIST:  # "already exists" is not an error here
+                raise
+        if mode is not None:
+            os.chmod(path, mode)
+
+
+def sym_link(source, link):
+    LOG.debug("Creating symbolic link from %r => %r" % (link, source))
+    os.symlink(source, link)
+
+
+def del_file(path):
+    LOG.debug("Attempting to remove %s", path)
+    try:
+        os.unlink(path)
+    except OSError as e:
+        if e.errno != errno.ENOENT:
+            raise e
+
+
+def ensure_file(path):
+    write_file(path, content='', omode="ab")
+
+
+def write_file(filename, content, mode=0644, omode="wb"):
+    """
+    Writes a file with the given content and sets the file mode as specified.
+    Restores the SELinux context if possible.
+
+    @param filename: The full path of the file to write.
+    @param content: The content to write to the file.
+    @param mode: The filesystem mode to set on the file.
+    @param omode: The open mode used when opening the file (r, rb, a, etc.)
+    """
+    ensure_dir(os.path.dirname(filename))
+    LOG.debug("Writing to %s - %s (perms=%s) %s bytes", filename, omode, mode, len(content))
+    with open(filename, omode) as fh:
+        with _SeLinuxGuard(filename):
+            fh.write(content)
+            fh.flush()
+            if mode is not None:
+                os.chmod(filename, mode)
+
+
+def delete_dir_contents(dirname):
+    """
+    Deletes all contents of a directory without deleting the directory itself.
+
+    @param dirname: The directory whose contents should be deleted.
+    """
+    for node in os.listdir(dirname):
+        node_fullpath = os.path.join(dirname, node)
+        if os.path.isdir(node_fullpath):
+            del_dir(node_fullpath)
+        else:
+            del_file(node_fullpath)
+
+
+def subp(args, input_data=None, allowed_rc=None, env=None):
+    if allowed_rc is None:
+        allowed_rc = [0]
+    try:
+        LOG.debug("Running command %s with allowed return codes %s", args, allowed_rc)
+        sp = subprocess.Popen(args, stdout=subprocess.PIPE,
+            stderr=subprocess.PIPE, stdin=subprocess.PIPE,
+            env=env)
+        (out, err) = sp.communicate(input_data)
+    except OSError as e:
+        raise ProcessExecutionError(cmd=args, reason=e)
+    rc = sp.returncode
+    if rc not in allowed_rc:
+        raise ProcessExecutionError(stdout=out, stderr=err,
+                                         exit_code=rc,
+                                         cmd=args)
+    # Just ensure blank instead of none??
+    if not out:
+        out = ''
+    if not err:
+        err = ''
+    return (out, err)
+
+
+# shellify, takes a list of commands
+#  for each entry in the list
+#    if it is an array, shell protect it (with single ticks)
+#    if it is a string, do nothing
+def shellify(cmdlist, add_header=True):
+    content = ''
+    if add_header:
+        content += "#!/bin/sh\n"
+    escaped = "%s%s%s%s" % ("'", '\\', "'", "'")
+    for args in cmdlist:
+        # if the item is a list, wrap all items in single tick
+        # if its not, then just write it directly
+        if isinstance(args, list):
+            fixed = []
+            for f in args:
+                fixed.append("'%s'" % str(f).replace("'", escaped))
+            content = "%s%s\n" % (content, ' '.join(fixed))
+        else:
+            content = "%s%s\n" % (content, str(args))
+    return content
+
+
+def is_container():
+    # is this code running in a container of some sort
+
+    for helper in ('running-in-container', 'lxc-is-container'):
+        try:
+            # try to run a helper program. if it returns true/zero
+            # then we're inside a container. otherwise, no
+            cmd = [helper]
+            (stdout, stderr) = subp(cmd, allowed_rc=[0])
+            return True
+        except IOError as e:
+            pass
+            # Is this really needed?
+            # if e.errno != errno.ENOENT:
+            #     raise
+
+    # this code is largely from the logic in
+    # ubuntu's /etc/init/container-detect.conf
+    try:
+        # Detect old-style libvirt
+        # Detect OpenVZ containers
+        pid1env = get_proc_env(1)
+        if "container" in pid1env:
+            return True
+        if "LIBVIRT_LXC_UUID" in pid1env:
+            return True
+    except IOError as e:
+        pass
+
+    # Detect OpenVZ containers
+    if os.path.isdir("/proc/vz") and not os.path.isdir("/proc/bc"):
+        return True
 
     try:
-        if data == None:
-            ret = callback(mountpoint)
-        else:
-            ret = callback(mountpoint, data)
-
-    except Exception as exc:
-        _cleanup(umount, tmpd)
-        raise exc
-
-    _cleanup(umount, tmpd)
-
-    return(ret)
-
-
-def wait_for_url(urls, max_wait=None, timeout=None,
-                 status_cb=None, headers_cb=None):
-    """
-    urls:      a list of urls to try
-    max_wait:  roughly the maximum time to wait before giving up
-               The max time is *actually* len(urls)*timeout as each url will
-               be tried once and given the timeout provided.
-    timeout:   the timeout provided to urllib2.urlopen
-    status_cb: call method with string message when a url is not available
-    headers_cb: call method with single argument of url to get headers
-                for request.
-
-    the idea of this routine is to wait for the EC2 metdata service to
-    come up.  On both Eucalyptus and EC2 we have seen the case where
-    the instance hit the MD before the MD service was up.  EC2 seems
-    to have permenantely fixed this, though.
-
-    In openstack, the metadata service might be painfully slow, and
-    unable to avoid hitting a timeout of even up to 10 seconds or more
-    (LP: #894279) for a simple GET.
-
-    Offset those needs with the need to not hang forever (and block boot)
-    on a system where cloud-init is configured to look for EC2 Metadata
-    service but is not going to find one.  It is possible that the instance
-    data host (169.254.169.254) may be firewalled off Entirely for a sytem,
-    meaning that the connection will block forever unless a timeout is set.
-    """
-    starttime = time.time()
-
-    sleeptime = 1
-
-    def nullstatus_cb(msg):
-        return
-
-    if status_cb == None:
-        status_cb = nullstatus_cb
-
-    def timeup(max_wait, starttime):
-        return((max_wait <= 0 or max_wait == None) or
-               (time.time() - starttime > max_wait))
-
-    loop_n = 0
-    while True:
-        sleeptime = int(loop_n / 5) + 1
-        for url in urls:
-            now = time.time()
-            if loop_n != 0:
-                if timeup(max_wait, starttime):
-                    break
-                if timeout and (now + timeout > (starttime + max_wait)):
-                    # shorten timeout to not run way over max_time
-                    timeout = int((starttime + max_wait) - now)
-
-            reason = ""
-            try:
-                if headers_cb != None:
-                    headers = headers_cb(url)
-                else:
-                    headers = {}
-
-                req = urllib2.Request(url, data=None, headers=headers)
-                resp = urllib2.urlopen(req, timeout=timeout)
-                if resp.read() != "":
-                    return url
-                reason = "empty data [%s]" % resp.getcode()
-            except urllib2.HTTPError as e:
-                reason = "http error [%s]" % e.code
-            except urllib2.URLError as e:
-                reason = "url error [%s]" % e.reason
-            except socket.timeout as e:
-                reason = "socket timeout [%s]" % e
-            except Exception as e:
-                reason = "unexpected error [%s]" % e
-
-            status_cb("'%s' failed [%s/%ss]: %s" %
-                      (url, int(time.time() - starttime), max_wait,
-                       reason))
-
-        if timeup(max_wait, starttime):
-            break
-
-        loop_n = loop_n + 1
-        time.sleep(sleeptime)
+        # Detect Vserver containers
+        lines = load_file("/proc/self/status").splitlines()
+        for line in lines:
+            if line.startswith("VxID:"):
+                (_key, val) = line.strip().split(":", 1)
+                if val != "0":
+                    return True
+    except IOError as e:
+        pass
 
     return False
 
 
+def get_proc_env(pid):
+    # return the environment in a dict that a given process id was started with
+    env = {}
+    fn = os.path.join("/proc/", str(pid), "environ")
+    try:
+        contents = load_file(fn)
+        toks = contents.split("\0")  # entries are NUL-separated NAME=value
+        for tok in toks:
+            if tok == "":
+                continue
+            (name, _sep, val) = tok.partition("=")  # tolerate a missing '='
+            if name:  # skip malformed entries that have no variable name
+                env[name] = val
+    except IOError:
+        pass  # unreadable environ file: return what was collected (if any)
+    return env
+
+
 def keyval_str_to_dict(kvstring):
     ret = {}
     for tok in kvstring.split():
@@ -851,5 +775,4 @@ def keyval_str_to_dict(kvstring):
             key = tok
             val = True
         ret[key] = val
-
-    return(ret)
+    return ret

From 3e7e8f0612aa0db5406e8100308cf945ee91be1b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:02:45 -0700
Subject: [PATCH 025/434] Moved some of the mounting logic here. Also
 introduced a context manager which will help unmount.

---
 cloudinit/mounting.py | 51 +++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 51 insertions(+)
 create mode 100644 cloudinit/mounting.py

diff --git a/cloudinit/mounting.py b/cloudinit/mounting.py
new file mode 100644
index 00000000..b72f729a
--- /dev/null
+++ b/cloudinit/mounting.py
@@ -0,0 +1,51 @@
+import contextlib
+
+from cloudinit import util
+
+
+class MountFailedError(Exception):
+    pass
+
+
+@contextlib.contextmanager
+def unmounter(umount):  # lazily unmounts 'umount' on exit; falsy means no-op
+    try:
+        yield umount
+    finally:
+        if umount:
+            util.subp(["umount", '-l', umount])
+
+
+def mount_callback_umount(device, callback, data=None):
+    """
+    mount the device, call method 'callback' passing the directory
+    in which it was mounted, then unmount.  Return whatever 'callback'
+    returned.  If data != None, also pass data to callback.
+    """
+
+    # go through mounts to see if it was already mounted
+    mounts = util.load_file("/proc/mounts").splitlines()
+    mounted = {}
+    for mpline in mounts:
+        (dev, mp, fstype, _opts, _freq, _passno) = mpline.split()
+        mp = mp.replace("\\040", " ")
+        mounted[dev] = (dev, fstype, mp, False)
+
+    with util.tempdir() as tmpd:
+        umount = False  # only unmount what this call itself mounted
+        if device in mounted:
+            mountpoint = "%s/" % mounted[device][2]
+        else:
+            try:
+                mountcmd = ["mount", "-o", "ro", device, tmpd]
+                util.subp(mountcmd)
+                umount = tmpd
+            except IOError as exc:  # NOTE(review): assumes subp errors are IOError
+                raise MountFailedError("%s" % (exc))
+            mountpoint = "%s/" % tmpd
+        with unmounter(umount):
+            if data is None:
+                ret = callback(mountpoint)
+            else:
+                ret = callback(mountpoint, data)
+            return ret

From 9418e6cdfff8c32c121779db120a91aef89f61bb Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:03:22 -0700
Subject: [PATCH 026/434] This file now holds the default part handlers (shell
 script, cloud-config, upstart-jobs, boot-hook) as classes as well as some
 utility methods to fixup imported modules (ensuring they have the right
 members/properties) and moving the walking handler callbacks and other part
 running functionality here.

---
 cloudinit/parts.py | 200 +++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 200 insertions(+)
 create mode 100644 cloudinit/parts.py

diff --git a/cloudinit/parts.py b/cloudinit/parts.py
new file mode 100644
index 00000000..9cd24c5a
--- /dev/null
+++ b/cloudinit/parts.py
@@ -0,0 +1,200 @@
+import os
+
+from cloudinit import util
+from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
+from cloudinit import log as logging
+
+LOG = logging.getLogger(__name__)
+
+CONTENT_END = "__end__"
+CONTENT_START = "__begin__"
+PART_CONTENT_TYPES = ["text/part-handler"]
+PART_HANDLER_FN_TMPL = 'part-handler-%03d'
+
+
+class PartHandler(object):
+    def __init__(self, frequency, version=2):
+        self.handler_version = version
+        self.frequency = frequency
+
+    def __repr__(self):
+        return "%s: [%s]" % (self.__class__.__name__, self.list_types())
+
+    def list_types(self):
+        raise NotImplementedError()
+
+    def handle_part(self, data, ctype, filename, payload, frequency):
+        return self._handle_part(data, ctype, filename, payload, frequency)
+
+    def _handle_part(self, data, ctype, filename, payload, frequency):
+        raise NotImplementedError()
+
+
+class BootHookPartHandler(PartHandler):
+    def __init__(self, boothook_dir, instance_id):
+        PartHandler.__init__(self, PER_ALWAYS)
+        self.boothook_dir = boothook_dir
+        self.instance_id = instance_id
+
+    def list_types(self):
+        return ['text/cloud-boothook']
+    
+    def _handle_part(self, _data, ctype, filename, payload, _frequency):
+        if ctype in [CONTENT_START, CONTENT_END]:
+            return
+
+        filename = util.clean_filename(filename)
+        payload = util.dos2unix(payload)
+        prefix = "#cloud-boothook"
+        start = 0
+        if payload.startswith(prefix):
+            start = len(prefix) + 1
+
+        filepath = os.path.join(self.boothook_dir, filename)
+        util.write_file(filepath, payload[start:], 0700)
+        try:
+            env = os.environ.copy()
+            env['INSTANCE_ID'] = str(self.instance_id)
+            util.subp([filepath], env=env)
+        except util.ProcessExecutionError as e:
+            LOG.error("Boothooks script %s returned %s", filepath, e.exit_code)
+        except Exception as e:
+            LOG.error("Boothooks unknown exception %s when running %s", e, filepath)
+
+
+class UpstartJobPartHandler(PartHandler):
+    """Writes 'text/upstart-job' parts into upstart_dir as '.conf' files."""
+    def __init__(self, upstart_dir):
+        PartHandler.__init__(self, PER_INSTANCE)
+        self.upstart_dir = upstart_dir
+
+    def list_types(self):
+        return ['text/upstart-job']
+
+    def _handle_part(self, _data, ctype, filename, payload, frequency):
+        if ctype in [CONTENT_START, CONTENT_END]:
+            return
+
+        filename = util.clean_filename(filename)
+        ext = os.path.splitext(filename)[1].lower()
+        if ext != ".conf":
+            filename = filename + ".conf"
+
+        payload = util.dos2unix(payload)
+        util.write_file(os.path.join(self.upstart_dir, filename), payload, 0644)
+
+
+class ShellScriptPartHandler(PartHandler):
+
+    def __init__(self, script_dir):
+        PartHandler.__init__(self, PER_ALWAYS)
+        self.script_dir = script_dir
+
+    def list_types(self):
+        return ['text/x-shellscript']
+
+    def _handle_part(self, _data, ctype, filename, payload, _frequency):
+        if ctype in [CONTENT_START, CONTENT_END]:
+            # maybe delete existing things here
+            return
+
+        filename = util.clean_filename(filename)
+        payload = util.dos2unix(payload)
+        util.write_file(os.path.join(self.script_dir, filename), payload, 0700)
+
+
+class CloudConfigPartHandler(PartHandler):
+    """Buffers 'text/cloud-config' parts and writes them to cloud_fn at end."""
+    def __init__(self, cloud_fn):
+        PartHandler.__init__(self, PER_ALWAYS)
+        self.cloud_buf = []
+        self.cloud_fn = cloud_fn
+
+    def list_types(self):
+        return ['text/cloud-config']
+
+    def _handle_part(self, _data, ctype, filename, payload, _frequency):
+        if ctype == CONTENT_START:
+            self.cloud_buf = []
+            return
+
+        if ctype == CONTENT_END:
+            util.write_file(self.cloud_fn, "\n".join(self.cloud_buf), 0600)
+            self.cloud_buf = []
+            return
+
+        filename = util.clean_filename(filename)
+        entry = "\n".join(["#%s" % (filename), str(payload)])
+        self.cloud_buf.append(entry)
+
+
+def fixup_module(mod):
+    """Fill in any missing part-handler attributes on mod with defaults."""
+    # Defaults: handler_version=1, list_types() -> [], frequency=PER_INSTANCE
+    if not hasattr(mod, "handler_version"):
+        setattr(mod, "handler_version", 1)
+    if not hasattr(mod, 'list_types'):
+        setattr(mod, 'list_types', lambda: [])
+    if not hasattr(mod, 'frequency'):
+        setattr(mod, 'frequency', PER_INSTANCE)
+    return mod
+
+
+def run_part(mod, data, ctype, filename, payload, frequency):
+    # only add the handler if the module should run
+    mod_freq = getattr(mod, "frequency")
+    if not (mod_freq == PER_ALWAYS or
+            (frequency == PER_INSTANCE and mod_freq == PER_INSTANCE)):
+        return
+    try:
+        mod_ver = getattr(mod, 'handler_version')
+        if mod_ver == 1:
+            mod.handle_part(data, ctype, filename, payload)
+        else:
+            mod.handle_part(data, ctype, filename, payload, frequency)
+    except:
+        LOG.exception("Failed calling mod %s (%s, %s, %s) with frequency %s", mod, ctype, filename, mod_ver, frequency)
+
+
+def call_begin(mod, data, frequency):
+    run_part(mod, data, CONTENT_START, None, None, frequency)
+
+
+def call_end(mod, data, frequency):
+    run_part(mod, data, CONTENT_END, None, None, frequency)
+
+
+def walker_handle_handler(pdata, _ctype, _filename, payload):
+    from cloudinit import importer  # not imported at module level in this file
+    curcount = pdata['handlercount']
+    modname = PART_HANDLER_FN_TMPL % (curcount)
+    frequency = pdata['frequency']
+    modfname = os.path.join(pdata['handlerdir'], "%s.py" % (modname))
+    util.write_file(modfname, payload, 0600)  # TODO: Check if path exists??
+    handlers = pdata['handlers']
+    try:
+        mod = fixup_module(importer.import_module(modname))
+        handlers.register(mod)
+        call_begin(mod, pdata['data'], frequency)
+        pdata['handlercount'] = curcount + 1
+    except:
+        LOG.exception("Failed at registered python file %s", modfname)
+
+
+def walker_callback(pdata, ctype, filename, payload):
+    # data here is the part_handlers array and then the data to pass through
+    if ctype in PART_CONTENT_TYPES:
+        walker_handle_handler(pdata, ctype, filename, payload)
+        return
+    handlers = pdata['handlers']
+    if ctype not in handlers:
+        if ctype == "text/x-not-multipart":
+            # Extract the first line or 24 bytes for displaying in the log
+            start = payload.split("\n", 1)[0][:24]
+            if start < payload:
+                details = "starting '%s...'" % start.encode("string-escape")
+            else:
+                details = repr(payload)
+            LOG.warning("Unhandled non-multipart userdata: %s", details)
+        return
+    run_part(handlers[ctype], pdata['data'], ctype, filename, payload, pdata['frequency'])

From f9a37a4e09d4262671b53f4e0c35dc0c20ca1e02 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:04:56 -0700
Subject: [PATCH 027/434] Remove cloud config from here and move to cloud.py

---
 cloudinit/handlers/__init__.py | 60 +++++-----------------------------
 1 file changed, 9 insertions(+), 51 deletions(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index a16bdde6..3b0cdd4e 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -19,65 +19,23 @@
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 #
 
-import yaml
-import cloudinit
-import cloudinit.util as util
-import sys
-import traceback
 import os
 import subprocess
+import sys
 import time
+import traceback
 
-per_instance = cloudinit.per_instance
-per_always = cloudinit.per_always
-per_once = cloudinit.per_once
+import yaml
 
+from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS, PER_ONCE)
 
-class CloudConfig():
-    cfgfile = None
-    cfg = None
+from cloudinit import log as logging
+from cloudinit import util
 
-    def __init__(self, cfgfile, cloud=None, ds_deps=None):
-        if cloud == None:
-            self.cloud = cloudinit.CloudInit(ds_deps)
-            self.cloud.get_data_source()
-        else:
-            self.cloud = cloud
-        self.cfg = self.get_config_obj(cfgfile)
+LOG = logging.getLogger(__name__)
 
-    def get_config_obj(self, cfgfile):
-        try:
-            cfg = util.read_conf(cfgfile)
-        except:
-            # TODO: this 'log' could/should be passed in
-            cloudinit.log.critical("Failed loading of cloud config '%s'. "
-                                   "Continuing with empty config\n" % cfgfile)
-            cloudinit.log.debug(traceback.format_exc() + "\n")
-            cfg = None
-        if cfg is None:
-            cfg = {}
-
-        try:
-            ds_cfg = self.cloud.datasource.get_config_obj()
-        except:
-            ds_cfg = {}
-
-        cfg = util.mergedict(cfg, ds_cfg)
-        return(util.mergedict(cfg, self.cloud.cfg))
-
-    def handle(self, name, args, freq=None):
-        try:
-            mod = __import__("cc_" + name.replace("-", "_"), globals())
-            def_freq = getattr(mod, "frequency", per_instance)
-            handler = getattr(mod, "handle")
-
-            if not freq:
-                freq = def_freq
-
-            self.cloud.sem_and_run("config-" + name, freq, handler,
-                [name, self.cfg, self.cloud, cloudinit.log, args])
-        except:
-            raise
+DEF_HANDLER_VERSION = 1
+DEF_FREQ = PER_INSTANCE
 
 
 # reads a cloudconfig module list, returns

From cbcb8d09779d76739ae6f8ef662233aefb0441e5 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:05:27 -0700
Subject: [PATCH 028/434] Remove the is_ipv4 function from here and move it to
 utils + move exceptions here as well as the other find datasource function.

---
 cloudinit/sources/__init__.py | 42 +++++++++++++++++++++--------------
 1 file changed, 25 insertions(+), 17 deletions(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index e2a9150d..9a9c1316 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -18,13 +18,16 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+from cloudinit import user_data as ud
+from cloudinit import util
+
+import socket
 
 DEP_FILESYSTEM = "FILESYSTEM"
 DEP_NETWORK = "NETWORK"
 
-import cloudinit.UserDataHandler as ud
-import cloudinit.util as util
-import socket
+class DataSourceNotFoundException(Exception):
+    pass
 
 
 class DataSource:
@@ -152,6 +155,25 @@ class DataSource:
             return hostname
 
 
+def find_source(cfg, ds_deps):
+    cfglist = cfg.get('datasource_list') or []
+    dslist = list_sources(cfglist, ds_deps)
+    dsnames = [f.__name__ for f in dslist]
+    
+    LOG.debug("Searching for data source in %s", dsnames)
+    for cls in dslist:
+        ds = cls.__name__
+        try:
+            s = cls(sys_cfg=cfg)
+            if s.get_data():
+                return (s, ds)
+        except Exception as e:
+            LOG.exception("Getting data from %s raised %s", ds, e)
+
+    msg = "Did not find any data source, searched classes: %s" % dsnames
+    raise DataSourceNotFoundException(msg)
+
+
 # return a list of classes that have the same depends as 'depends'
 # iterate through cfg_list, loading "DataSourceCollections" modules
 # and calling their "get_datasource_list".
@@ -198,17 +220,3 @@ def list_from_depends(depends, dslist):
         if depset == set(deps):
             retlist.append(cls)
     return(retlist)
-
-
-def is_ipv4(instr):
-    """ determine if input string is a ipv4 address. return boolean"""
-    toks = instr.split('.')
-    if len(toks) != 4:
-        return False
-
-    try:
-        toks = [x for x in toks if (int(x) < 256 and int(x) > 0)]
-    except:
-        return False
-
-    return (len(toks) == 4)

From 02f5baf28e7bacd13dba4c0989dbf67bd8f5169a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:09:24 -0700
Subject: [PATCH 029/434] Remove the main function from this, seems like that
 should be in a test if needed.

---
 cloudinit/ssh_util.py | 37 -------------------------------------
 1 file changed, 37 deletions(-)

diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index a081fbe8..1483f718 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -188,40 +188,3 @@ def parse_ssh_config(fname="/etc/ssh/sshd_config"):
         ret[key] = val
     fp.close()
     return(ret)
-
-if __name__ == "__main__":
-    def main():
-        import sys
-        # usage: orig_file, new_keys, [key_prefix]
-        #   prints out merged, where 'new_keys' will trump old
-        ##  example
-        ## ### begin auth_keys ###
-        # ssh-rsa AAAAB3NzaC1xxxxxxxxxV3csgm8cJn7UveKHkYjJp8= smoser-work
-        # ssh-rsa AAAAB3NzaC1xxxxxxxxxCmXp5Kt5/82cD/VN3NtHw== smoser@brickies
-        # ### end authorized_keys ###
-        #
-        # ### begin new_keys ###
-        # ssh-rsa nonmatch smoser@newhost
-        # ssh-rsa AAAAB3NzaC1xxxxxxxxxV3csgm8cJn7UveKHkYjJp8= new_comment
-        # ### end new_keys ###
-        #
-        # Then run as:
-        #  program auth_keys new_keys \
-        #      'no-port-forwarding,command=\"echo hi world;\"'
-        def_prefix = None
-        orig_key_file = sys.argv[1]
-        new_key_file = sys.argv[2]
-        if len(sys.argv) > 3:
-            def_prefix = sys.argv[3]
-        fp = open(new_key_file)
-
-        newkeys = []
-        for line in fp.readlines():
-            newkeys.append(AuthKeyEntry(line, def_prefix))
-
-        fp.close()
-        print update_authorized_keys(orig_key_file, newkeys)
-
-    main()
-
-# vi: ts=4 expandtab

From 57da61791c9d4e7b9858f820bfa7347c46fa7700 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:09:44 -0700
Subject: [PATCH 030/434] Remove the main function from this, seems like it
 should also be in a test if needed.

---
 cloudinit/netinfo.py | 4 ----
 1 file changed, 4 deletions(-)

diff --git a/cloudinit/netinfo.py b/cloudinit/netinfo.py
index aac4af04..1f0fa571 100644
--- a/cloudinit/netinfo.py
+++ b/cloudinit/netinfo.py
@@ -110,7 +110,3 @@ def debug_info(pre="ci-info: "):
             (pre, n, r[0], r[1], r[2], r[7], r[3]))
         n = n + 1
     return('\n'.join(lines))
-
-
-if __name__ == '__main__':
-    print debug_info()

From 692065dd762106d42c0578d9874f96e8270644ab Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:42:06 -0700
Subject: [PATCH 031/434] Fixup CloudConfig by using new module functions and
 calling objects.

---
 cloudinit/cloud.py | 67 ++++++++++++++++++++++------------------------
 1 file changed, 32 insertions(+), 35 deletions(-)

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index cfb1c011..a98bfbbd 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -16,6 +16,7 @@ from cloudinit import parts
 from cloudinit import sources
 from cloudinit import util
 from cloudinit import user_data
+from cloudinit import handlers
 
 LOG = logging.getLogger(__name__)
 
@@ -168,7 +169,6 @@ class CloudInit(object):
         else:
             self.ds_deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
         self.paths = CloudPaths(self)
-        self.sems = CloudSemaphores(self.paths)
         self.cfg = self._read_cfg()
 
     def _read_cfg_old(self):
@@ -294,16 +294,14 @@ class CloudInit(object):
         handlers = CloudHandlers(self)
 
         # Add handlers in cdir
-        for fname in glob.glob(os.path.join(cdir, "*.py")):
-            if not os.path.isfile(fname):
-                continue
-            modname = os.path.basename(fname)[0:-3]
+        potential_handlers = parts.find_module_files(cdir)
+        for (fname, modname) in potential_handlers.iteritems():
             try:
                 mod = parts.fixup_module(importer.import_module(modname))
                 types = handlers.register(mod)
                 LOG.debug("Added handler for [%s] from %s", types, fname)
             except:
-                LOG.exception("Failed to register handler in %s", fname)
+                LOG.exception("Failed to register handler from %s", fname)
 
         def_handlers = handlers.register_defaults()
         if def_handlers:
@@ -391,47 +389,46 @@ class CloudHandlers(object):
 
 
 class CloudConfig(object):
-    cfgfile = None
-    cfg = None
 
-    def __init__(self, cfgfile, cloud=None, ds_deps=None):
-        if cloud == None:
-            self.cloud = cloudinit.CloudInit(ds_deps)
-            self.cloud.get_data_source()
-        else:
-            self.cloud = cloud
-        self.cfg = self.get_config_obj(cfgfile)
+    def __init__(self, cfgfile, cloud):
+        self.cloud = cloud
+        self.cfg = self._get_config(cfgfile)
+        self.paths = cloud.paths
+        self.sems = CloudSemaphores(self.paths)
 
-    def get_config_obj(self, cfgfile):
+    def _get_config(self, cfgfile):
+
+        cfg = None
         try:
             cfg = util.read_conf(cfgfile)
         except:
-            # TODO: this 'log' could/should be passed in
-            cloudinit.log.critical("Failed loading of cloud config '%s'. "
-                                   "Continuing with empty config\n" % cfgfile)
-            cloudinit.log.debug(traceback.format_exc() + "\n")
-            cfg = None
-        if cfg is None:
+            LOG.exception(("Failed loading of cloud config '%s'. "
+                          "Continuing with empty config."), cfgfile)
+        if not cfg:
             cfg = {}
 
+        ds_cfg = None
         try:
             ds_cfg = self.cloud.datasource.get_config_obj()
         except:
+            LOG.exception("Failed loading of datasource config.")
+        if not ds_cfg:
             ds_cfg = {}
 
         cfg = util.mergedict(cfg, ds_cfg)
-        return(util.mergedict(cfg, self.cloud.cfg))
+        cloud_cfg = self.cloud.cfg or {}
+        return util.mergedict(cfg, cloud_cfg)
 
-    def handle(self, name, args, freq=None):
-        try:
-            mod = __import__("cc_" + name.replace("-", "_"), globals())
-            def_freq = getattr(mod, "frequency", per_instance)
-            handler = getattr(mod, "handle")
+    def extract(self, name):
+        modname = handlers.form_module_name(name)
+        if not modname:
+            return None
+        return handlers.fixup_module(importer.import_module(modname))
 
-            if not freq:
-                freq = def_freq
-
-            self.cloud.sem_and_run("config-" + name, freq, handler,
-                [name, self.cfg, self.cloud, cloudinit.log, args])
-        except:
-            raise
+    def handle(self, name, mod, args, freq=None):
+        def_freq = mod.frequency 
+        if not freq:
+            freq = def_freq
+        c_name = "config-%s" % (name)
+        real_args = [name, self.cfg, self.cloud, LOG, args]
+        return self.sems.run_functor(c_name, freq, mod.handle, real_args)

From b41de934573d6ed890bc004a1f13f4cd5dcfa99a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:42:31 -0700
Subject: [PATCH 032/434] Move how user part data modules are found to here.

---
 cloudinit/parts.py | 14 ++++++++++++++
 1 file changed, 14 insertions(+)

diff --git a/cloudinit/parts.py b/cloudinit/parts.py
index 9cd24c5a..6af1ab7c 100644
--- a/cloudinit/parts.py
+++ b/cloudinit/parts.py
@@ -137,9 +137,23 @@ def fixup_module(mod):
         setattr(mod, 'list_types', empty_types)
     if not hasattr(mod, frequency):
         setattr(mod, 'frequency', PER_INSTANCE)
+    if not hasattr(mod, 'handle_part'):
+        def empty_handler(data, ctype, filename, payload):
+            pass
+        setattr(mod, 'handle_part', empty_handler)
     return mod
 
 
+def find_module_files(root_dir):
+    entries = dict()
+    for fname in glob.glob(os.path.join(root_dir, "*.py")):
+        if not os.path.isfile(fname):
+            continue
+        modname = os.path.basename(fname)[0:-3]
+        entries[fname] = modname
+    return entries
+
+
 def run_part(mod, data, ctype, filename, payload, frequency):
     # only add the handler if the module should run
     mod_freq = getattr(mod, "frequency")

From 7f809e486870deb3f2dfaa2bf63777631aef86c5 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 18:42:54 -0700
Subject: [PATCH 033/434] Move how handler module names are found to here as
 well as a fixup module function for bad modules.

---
 cloudinit/handlers/__init__.py | 23 +++++++++++++++++++++++
 1 file changed, 23 insertions(+)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index 3b0cdd4e..ae74b683 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -36,6 +36,7 @@ LOG = logging.getLogger(__name__)
 
 DEF_HANDLER_VERSION = 1
 DEF_FREQ = PER_INSTANCE
+HANDLER_TPL = "cc_%s"
 
 
 # reads a cloudconfig module list, returns
@@ -230,3 +231,25 @@ def update_package_sources():
 def install_packages(pkglist):
     update_package_sources()
     apt_get("install", pkglist)
+
+
+def form_module_name(name):
+    canon_name = name.replace("-", "_")
+    if canon_name.endswith(".py"):
+        canon_name = canon_name[0:(len(canon_name) - 3)]
+    canon_name = canon_name.strip()
+    if not canon_name:
+        return None
+    return HANDLER_TPL % (canon_name)
+
+
+def fixup_module(mod):
+    freq = getattr(mod, "frequency", None)
+    if not freq:
+        setattr(mod, 'frequency', PER_INSTANCE)
+    handler = getattr(mod, "handle", None)
+    if not handler:
+        def empty_handle(_name, _cfg, _cloud, _log, _args):
+            pass
+        setattr(mod, 'handle', empty_handle)
+    return mod

From 941887ec38cf6e693dab287cdbaa42352a12e48f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 19:10:58 -0700
Subject: [PATCH 034/434] Remove parsed config cache, and cleanup cmdline
 function.

---
 cloudinit/__init__.py | 62 +++++++++++++++++++------------------------
 1 file changed, 27 insertions(+), 35 deletions(-)

diff --git a/cloudinit/__init__.py b/cloudinit/__init__.py
index 2c291ff5..c38b3b09 100644
--- a/cloudinit/__init__.py
+++ b/cloudinit/__init__.py
@@ -34,47 +34,37 @@ from cloudinit import url_helper as uhelp
 from cloudinit import util
 
 from cloudinit.settings import (VAR_LIB_DIR, CFG_BUILTIN, CLOUD_CONFIG,
-                                 BOOT_FINISHED, CUR_INSTANCE_LINK, PATH_MAP)
+                                 BOOT_FINISHED, CUR_INSTANCE_LINK)
 
 LOG = logging.getLogger(__name__)
 
 INIT_SUBDIRS = [
-    'scripts',
-    os.path.join('scripts', 'per-instance'),
-    os.path.join('scripts', 'per-once'),
-    os.path.join('scripts', 'per-boot'),
-    'seed',
-    'instances',
-    'handlers',
-    'sem',
-    'data'
+    os.path.join(VAR_LIB_DIR, 'scripts'),
+    os.path.join(VAR_LIB_DIR, 'scripts', 'per-instance'),
+    os.path.join(VAR_LIB_DIR, 'scripts', 'per-once'),
+    os.path.join(VAR_LIB_DIR, 'scripts', 'per-boot'),
+    os.path.join(VAR_LIB_DIR, 'seed'),
+    os.path.join(VAR_LIB_DIR, 'instances'),
+    os.path.join(VAR_LIB_DIR, 'handlers'),
+    os.path.join(VAR_LIB_DIR, 'sem'),
+    os.path.join(VAR_LIB_DIR, 'data'),
 ]
 
 
-# TODO: get rid of this global
-parsed_cfgs = {}
-
-
 def initfs():
-
-    # TODO don't do this every time this function is called?
-    dlist = []
-    for subd in INIT_SUBDIRS:
-        dlist.append(os.path.join(VAR_LIB_DIR, subd))
-    util.ensure_dirs(dlist)
-
-    cfg = util.get_base_cfg(CLOUD_CONFIG, get_builtin_cfg(), parsed_cfgs)
+    util.ensure_dirs(INIT_SUBDIRS)
+    cfg = util.get_base_cfg(CLOUD_CONFIG, get_builtin_cfg())
     log_file = util.get_cfg_option_str(cfg, 'def_log_file', None)
     perms = util.get_cfg_option_str(cfg, 'syslog_fix_perms', None)
     if log_file:
         util.ensure_file(log_file)
-    if log_file and perms:
-        (u, g) = perms.split(':', 1)
-        if u == "-1" or u == "None":
-            u = None
-        if g == "-1" or g == "None":
-            g = None
-        util.chownbyname(log_file, u, g)
+        if perms:
+            (u, g) = perms.split(':', 1)
+            if u == "-1" or u == "None":
+                u = None
+            if g == "-1" or g == "None":
+                g = None
+            util.chownbyname(log_file, u, g)
 
 
 def purge_cache(rmcur=True):
@@ -89,7 +79,7 @@ def purge_cache(rmcur=True):
 def get_base_cfg(cfg_path=None):
     if cfg_path is None:
         cfg_path = CLOUD_CONFIG
-    return util.get_base_cfg(cfg_path, get_builtin_cfg(), parsed_cfgs)
+    return util.get_base_cfg(cfg_path, get_builtin_cfg())
 
 
 def get_builtin_cfg():
@@ -97,14 +87,16 @@ def get_builtin_cfg():
 
 
 def list_sources(cfg_list, depends):
-    return (sources.list_sources(cfg_list, depends, ["cloudinit", ""]))
+    return sources.list_sources(cfg_list, depends, ["cloudinit", ""])
 
 
-def get_cmdline_url(names=('cloud-config-url', 'url'),
-                    starts="#cloud-config", cmdline=None):
-
-    if cmdline == None:
+def get_cmdline_url(names=None, starts=None, cmdline=None):
+    if cmdline is None:
         cmdline = util.get_cmdline()
+    if not names:
+        names = ('cloud-config-url', 'url')
+    if not starts:
+        starts = "#cloud-config"
 
     data = util.keyval_str_to_dict(cmdline)
     url = None

From a4203ab8b7c5a9f28083b9c587dd59116a668c3a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 8 Jun 2012 19:11:14 -0700
Subject: [PATCH 035/434] Move to having a parts directory/module + separate
 modules.

---
 cloudinit/cloud.py                        |  37 ++++----
 cloudinit/{parts.py => parts/__init__.py} | 103 +---------------------
 cloudinit/parts/boot_hook.py              |  42 +++++++++
 cloudinit/parts/cloud_config.py           |  36 ++++++++
 cloudinit/parts/shell_script.py           |  27 ++++++
 cloudinit/parts/upstart_job.py            |  30 +++++++
 6 files changed, 158 insertions(+), 117 deletions(-)
 rename cloudinit/{parts.py => parts/__init__.py} (54%)
 create mode 100644 cloudinit/parts/boot_hook.py
 create mode 100644 cloudinit/parts/cloud_config.py
 create mode 100644 cloudinit/parts/shell_script.py
 create mode 100644 cloudinit/parts/upstart_job.py

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index a98bfbbd..f9c0d531 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -2,22 +2,27 @@ from time import time
 
 import cPickle as pickle
 import contextlib
+import copy
 import os
 import sys
 import weakref
 
-
 from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS,
                                 OLD_CLOUD_CONFIG, CLOUD_CONFIG,
-                                CFG_BUILTIN, CUR_INSTANCE_LINK)
+                                CUR_INSTANCE_LINK)
 from cloudinit import (get_builtin_cfg, get_base_cfg)
 from cloudinit import log as logging
-from cloudinit import parts
 from cloudinit import sources
 from cloudinit import util
 from cloudinit import user_data
 from cloudinit import handlers
 
+from cloudinit import parts
+from cloudinit.parts import boot_hook as bh_part
+from cloudinit.parts import cloud_config as cc_part
+from cloudinit.parts import upstart_job as up_part
+from cloudinit.parts import shell_script as ss_part
+
 LOG = logging.getLogger(__name__)
 
 
@@ -128,10 +133,10 @@ class CloudPaths(object):
         return ipath
 
 
-class CloudPartData(object):
-    def __init__(self, datasource, paths):
-        self.datasource = datasource
-        self.paths = paths
+class CloudSimple(object):
+    def __init__(self, init):
+        self.datasource = init.datasource
+        self.paths = init.paths
 
     def get_userdata(self):
         return self.datasource.get_userdata()
@@ -288,7 +293,7 @@ class CloudInit(object):
         sys.path.insert(0, idir)
 
         # Data will be a little proxy that modules can use
-        data = CloudPartData(self.datasource, self.paths)
+        data = CloudSimple(self)
 
         # This keeps track of all the active handlers
         handlers = CloudHandlers(self)
@@ -369,13 +374,13 @@ class CloudHandlers(object):
     def _get_default_handlers(self):
         def_handlers = []
         if self.paths.get_ipath("cloud_config"):
-            def_handlers.append(parts.CloudConfigPartHandler(self.paths.get_ipath("cloud_config")))
+            def_handlers.append(cc_part.CloudConfigPartHandler(self.paths.get_ipath("cloud_config")))
         if self.paths.get_ipath_cur('scripts'):
-            def_handlers.append(parts.ShellScriptPartHandler(self.paths.get_ipath_cur('scripts')))
+            def_handlers.append(ss_part.ShellScriptPartHandler(self.paths.get_ipath_cur('scripts')))
         if self.paths.get_ipath("boothooks"):
-            def_handlers.append(parts.BootHookPartHandler(self.paths.get_ipath("boothooks")))
+            def_handlers.append(bh_part.BootHookPartHandler(self.paths.get_ipath("boothooks")))
         if self.paths.upstart_conf_d:
-            def_handlers.append(parts.UpstartJobPartHandler(self.paths.upstart_conf_d))
+            def_handlers.append(up_part.UpstartJobPartHandler(self.paths.upstart_conf_d))
         return def_handlers
 
     def register_defaults(self):
@@ -391,13 +396,11 @@ class CloudHandlers(object):
 class CloudConfig(object):
 
     def __init__(self, cfgfile, cloud):
-        self.cloud = cloud
+        self.cloud = CloudSimple(cloud)
         self.cfg = self._get_config(cfgfile)
-        self.paths = cloud.paths
-        self.sems = CloudSemaphores(self.paths)
+        self.sems = CloudSemaphores(self.cloud.paths)
 
     def _get_config(self, cfgfile):
-
         cfg = None
         try:
             cfg = util.read_conf(cfgfile)
@@ -430,5 +433,5 @@ class CloudConfig(object):
         if not freq:
             freq = def_freq
         c_name = "config-%s" % (name)
-        real_args = [name, self.cfg, self.cloud, LOG, args]
+        real_args = [name, copy.deepcopy(self.cfg), self.cloud, LOG, copy.deepcopy(args)]
         return self.sems.run_functor(c_name, freq, mod.handle, real_args)
diff --git a/cloudinit/parts.py b/cloudinit/parts/__init__.py
similarity index 54%
rename from cloudinit/parts.py
rename to cloudinit/parts/__init__.py
index 6af1ab7c..20d4bd3b 100644
--- a/cloudinit/parts.py
+++ b/cloudinit/parts/__init__.py
@@ -10,6 +10,7 @@ CONTENT_END = "__end__"
 CONTENT_START = "__begin__"
 PART_CONTENT_TYPES = ["text/part-handler"]
 PART_HANDLER_FN_TMPL = 'part-handler-%03d'
+UNDEF_HANDLER_VERSION = 1
 
 
 class PartHandler(object):
@@ -30,107 +31,9 @@ class PartHandler(object):
         raise NotImplementedError()
 
 
-class BootHookPartHandler(PartHandler):
-    def __init__(self, boothook_dir, instance_id):
-        PartHandler.__init__(self, PER_ALWAYS)
-        self.boothook_dir = boothook_dir
-        self.instance_id = instance_id
-
-    def list_types(self):
-        return ['text/cloud-boothook']
-    
-    def _handle_part(self, _data, ctype, filename, payload, _frequency):
-        if ctype in [CONTENT_START, CONTENT_END]:
-            return
-
-        filename = util.clean_filename(filename)
-        payload = util.dos2unix(payload)
-        prefix = "#cloud-boothook"
-        start = 0
-        if payload.startswith(prefix):
-            start = len(prefix) + 1
-
-        filepath = os.path.join(self.boothook_dir, filename)
-        util.write_file(filepath, payload[start:], 0700)
-        try:
-            env = os.environ.copy()
-            env['INSTANCE_ID'] = str(self.instance_id)
-            util.subp([filepath], env=env)
-        except util.ProcessExecutionError as e:
-            LOG.error("Boothooks script %s returned %s", filepath, e.exit_code)
-        except Exception as e:
-            LOG.error("Boothooks unknown exception %s when running %s", e, filepath)
-
-
-class UpstartJobPartHandler(PartHandler):
-    def __init__(self, upstart_dir):
-        PartHandler.__init__(self, PER_INSTANCE)
-        self.upstart_dir = upstart_dir
-
-    def list_types(self):
-        return ['text/upstart-job']
-
-    def _handle_part(self, _data, ctype, filename, payload, frequency):
-        if ctype in [CONTENT_START, CONTENT_END]:
-            return
-
-        filename = utils.clean_filename(filename)
-        (name, ext) = os.path.splitext(filename)
-        ext = ext.lower()
-        if ext != ".conf":
-            filename = filename + ".conf"
-
-        payload = util.dos2unix(payload)
-        util.write_file(os.path.join(self.upstart_dir, filename), payload, 0644)
-
-
-class ShellScriptPartHandler(PartHandler):
-
-    def __init__(self, script_dir):
-        PartHandler.__init__(self, PER_ALWAYS)
-        self.script_dir = script_dir
-
-    def list_types(self):
-        return ['text/x-shellscript']
-
-    def _handle_part(self, _data, ctype, filename, payload, _frequency):
-        if ctype in [CONTENT_START, CONTENT_END]:
-            # maybe delete existing things here
-            return
-
-        filename = util.clean_filename(filename)
-        payload = util.dos2unix(payload)
-        util.write_file(os.path.join(self.script_dir, filename), payload, 0700)
-
-
-class CloudConfigPartHandler(PartHandler):
-    def __init__(self, cloud_fn):
-        PartHandler.__init__(self, PER_ALWAYS)
-        self.cloud_buf = []
-        self.cloud_fn = cloud_fn
-
-    def list_types(self):
-        return ['text/cloud-config']
-
-    def _handle_part(self, _data, ctype, filename, payload, _frequency):
-        if ctype == CONTENT_START:
-            self.cloud_buf = []
-            return
-
-        if ctype == CONTENT_END:
-            payload = "\n".join(self.cloud_buf)
-            util.write_file(self.cloud_fn, payload, 0600)
-            self.cloud_buf = []
-            return
-
-        filename = util.clean_filename(filename)
-        entry = "\n".join(["#%s" % (filename), str(payload)])
-        self.config_buf.append(entry)
-
-
 def fixup_module(mod):
     if not hasattr(mod, "handler_version"):
-        setattr(mod, "handler_version", 1)
+        setattr(mod, "handler_version", UNDEF_HANDLER_VERSION)
     if not hasattr(mod, 'list_types'):
         def empty_types():
             return []
@@ -211,4 +114,4 @@ def walker_callback(pdata, ctype, filename, payload):
                 details = repr(payload)
             LOG.warning("Unhandled non-multipart userdata: %s", details)
         return
-    run_part(handlers[ctype], pdata['data'], ctype, filename, payload, pdata['frequency'])
+    run_part(handlers[ctype], pdata['data'], ctype, filename, payload, pdata['frequency'])
\ No newline at end of file
diff --git a/cloudinit/parts/boot_hook.py b/cloudinit/parts/boot_hook.py
new file mode 100644
index 00000000..881ffc58
--- /dev/null
+++ b/cloudinit/parts/boot_hook.py
@@ -0,0 +1,42 @@
+import os
+
+from cloudinit import util
+from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
+from cloudinit import log as logging
+from cloudinit import parts
+
+LOG = logging.getLogger(__name__)
+
+
+
+class BootHookPartHandler(parts.PartHandler):
+    def __init__(self, boothook_dir, instance_id):
+        parts.PartHandler.__init__(self, PER_ALWAYS)
+        self.boothook_dir = boothook_dir
+        self.instance_id = instance_id
+
+    def list_types(self):
+        return ['text/cloud-boothook']
+    
+    def _handle_part(self, _data, ctype, filename, payload, _frequency):
+        if ctype in [CONTENT_START, CONTENT_END]:
+            return
+
+        filename = util.clean_filename(filename)
+        payload = util.dos2unix(payload)
+        prefix = "#cloud-boothook"
+        start = 0
+        if payload.startswith(prefix):
+            start = len(prefix) + 1
+
+        filepath = os.path.join(self.boothook_dir, filename)
+        util.write_file(filepath, payload[start:], 0700)
+        try:
+            env = os.environ.copy()
+            env['INSTANCE_ID'] = str(self.instance_id)
+            util.subp([filepath], env=env)
+        except util.ProcessExecutionError as e:
+            LOG.error("Boothooks script %s returned %s", filepath, e.exit_code)
+        except Exception as e:
+            LOG.error("Boothooks unknown exception %s when running %s", e, filepath)
+
diff --git a/cloudinit/parts/cloud_config.py b/cloudinit/parts/cloud_config.py
new file mode 100644
index 00000000..dab0e5f5
--- /dev/null
+++ b/cloudinit/parts/cloud_config.py
@@ -0,0 +1,36 @@
+import os
+
+from cloudinit import util
+from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
+from cloudinit import log as logging
+from cloudinit import parts
+
+LOG = logging.getLogger(__name__)
+
+
+
+class CloudConfigPartHandler(parts.PartHandler):
+    def __init__(self, cloud_fn):
+        parts.PartHandler.__init__(self, PER_ALWAYS)
+        self.cloud_buf = []
+        self.cloud_fn = cloud_fn
+
+    def list_types(self):
+        return ['text/cloud-config']
+
+    def _handle_part(self, _data, ctype, filename, payload, _frequency):
+        if ctype == CONTENT_START:
+            self.cloud_buf = []
+            return
+
+        if ctype == CONTENT_END:
+            payload = "\n".join(self.cloud_buf)
+            util.write_file(self.cloud_fn, payload, 0600)
+            self.cloud_buf = []
+            return
+
+        filename = util.clean_filename(filename)
+        entry = "\n".join(["#%s" % (filename), str(payload)])
+        self.config_buf.append(entry)
+
+
diff --git a/cloudinit/parts/shell_script.py b/cloudinit/parts/shell_script.py
new file mode 100644
index 00000000..a248f198
--- /dev/null
+++ b/cloudinit/parts/shell_script.py
@@ -0,0 +1,27 @@
+import os
+
+from cloudinit import util
+from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
+from cloudinit import log as logging
+from cloudinit import parts
+
+LOG = logging.getLogger(__name__)
+
+
+class ShellScriptPartHandler(parts.PartHandler):
+
+    def __init__(self, script_dir):
+        parts.PartHandler.__init__(self, PER_ALWAYS)
+        self.script_dir = script_dir
+
+    def list_types(self):
+        return ['text/x-shellscript']
+
+    def _handle_part(self, _data, ctype, filename, payload, _frequency):
+        if ctype in [CONTENT_START, CONTENT_END]:
+            # maybe delete existing things here
+            return
+
+        filename = util.clean_filename(filename)
+        payload = util.dos2unix(payload)
+        util.write_file(os.path.join(self.script_dir, filename), payload, 0700)
diff --git a/cloudinit/parts/upstart_job.py b/cloudinit/parts/upstart_job.py
new file mode 100644
index 00000000..7b290d26
--- /dev/null
+++ b/cloudinit/parts/upstart_job.py
@@ -0,0 +1,30 @@
+import os
+
+from cloudinit import util
+from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
+from cloudinit import log as logging
+from cloudinit import parts
+
+LOG = logging.getLogger(__name__)
+
+
+class UpstartJobPartHandler(parts.PartHandler):
+    def __init__(self, upstart_dir):
+        parts.PartHandler.__init__(self, PER_INSTANCE)
+        self.upstart_dir = upstart_dir
+
+    def list_types(self):
+        return ['text/upstart-job']
+
+    def _handle_part(self, _data, ctype, filename, payload, frequency):
+        if ctype in [CONTENT_START, CONTENT_END]:
+            return
+
+        filename = utils.clean_filename(filename)
+        (name, ext) = os.path.splitext(filename)
+        ext = ext.lower()
+        if ext != ".conf":
+            filename = filename + ".conf"
+
+        payload = util.dos2unix(payload)
+        util.write_file(os.path.join(self.upstart_dir, filename), payload, 0644)

From 72093f7260d3f3f60a81db23a095ced18ae4c0db Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:30:43 -0700
Subject: [PATCH 036/434] Not needed.

---
 checks.sh | 53 -----------------------------------------------------
 1 file changed, 53 deletions(-)
 delete mode 100755 checks.sh

diff --git a/checks.sh b/checks.sh
deleted file mode 100755
index f54cad36..00000000
--- a/checks.sh
+++ /dev/null
@@ -1,53 +0,0 @@
-#!/bin/bash
-
-set -u
-
-function find_src {
-  files=`find bin cloudinit -type f | grep "py\$"`
-  echo $files
-}
-
-function run_pep8 {
-  echo "Running pep8 ..."
-  files=$(find_src)
-  ignores="E202,E501"
-  output_filename="pep8.log"
-  opts="--ignore=$ignores --repeat"
-  pep8 ${opts} ${files} 2>&1 > $output_filename
-  if [ "$?" -ne "0" ]; then
-    echo "Some badness was found!"
-  fi
-  echo "Check '$output_filename' for a full report."
-}
-
-function run_pylint {
-  echo "Running pylint ..."
-  opts="--rcfile=pylintrc --output-format=parseable"
-  files=$(find_src)
-  output_filename="pylint.log"
-  pylint ${opts} ${files} 2>&1 > $output_filename
-  if [ "$?" -eq "1" ]; then
-    # pylint --long-help
-    # * 0 if everything went fine
-    # * 1 if a fatal message was issued
-    # * 2 if an error message was issued
-    # * 4 if a warning message was issued
-    # * 8 if a refactor message was issued
-    # * 16 if a convention message was issued
-    # * 32 on usage error
-    echo "A fatal pylint error occurred!"
-  else
-    if [ "$?" -eq "0" ]; then
-      echo "Your code is perfect you code master!"
-    else
-      echo "You are not yet a code master."
-      grep -i "Your code" $output_filename
-    fi
-  fi
-  echo "Check '$output_filename' for a full report."
-}
-
-
-run_pep8
-run_pylint
-

From 004e0e85e02bcfe5f388091cd5ca37eb38b3943d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:30:57 -0700
Subject: [PATCH 037/434] Start adding place where distro specifics can go.

---
 cloudinit/distros/__init__.py | 0
 cloudinit/distros/ubuntu.py   | 0
 2 files changed, 0 insertions(+), 0 deletions(-)
 create mode 100644 cloudinit/distros/__init__.py
 create mode 100644 cloudinit/distros/ubuntu.py

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
new file mode 100644
index 00000000..e69de29b

From b239b5861bec14da2f35c34b68f68adb8863c17e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:31:19 -0700
Subject: [PATCH 038/434] Rename these to user_data module + submodules.

---
 cloudinit/parts/__init__.py                   | 117 ----------
 cloudinit/parts/boot_hook.py                  |  42 ----
 cloudinit/parts/cloud_config.py               |  36 ---
 cloudinit/parts/shell_script.py               |  27 ---
 cloudinit/parts/upstart_job.py                |  30 ---
 cloudinit/user_data/__init__.py               | 210 ++++++++++++++++++
 cloudinit/user_data/boot_hook.py              |  65 ++++++
 cloudinit/user_data/cloud_config.py           |  59 +++++
 .../{user_data.py => user_data/processor.py}  |  88 +-------
 cloudinit/user_data/shell_script.py           |  53 +++++
 cloudinit/user_data/upstart_job.py            |  56 +++++
 11 files changed, 454 insertions(+), 329 deletions(-)
 delete mode 100644 cloudinit/parts/__init__.py
 delete mode 100644 cloudinit/parts/boot_hook.py
 delete mode 100644 cloudinit/parts/cloud_config.py
 delete mode 100644 cloudinit/parts/shell_script.py
 delete mode 100644 cloudinit/parts/upstart_job.py
 create mode 100644 cloudinit/user_data/__init__.py
 create mode 100644 cloudinit/user_data/boot_hook.py
 create mode 100644 cloudinit/user_data/cloud_config.py
 rename cloudinit/{user_data.py => user_data/processor.py} (73%)
 create mode 100644 cloudinit/user_data/shell_script.py
 create mode 100644 cloudinit/user_data/upstart_job.py

diff --git a/cloudinit/parts/__init__.py b/cloudinit/parts/__init__.py
deleted file mode 100644
index 20d4bd3b..00000000
--- a/cloudinit/parts/__init__.py
+++ /dev/null
@@ -1,117 +0,0 @@
-import os
-
-from cloudinit import util
-from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
-from cloudinit import log as logging
-
-LOG = logging.getLogger(__name__)
-
-CONTENT_END = "__end__"
-CONTENT_START = "__begin__"
-PART_CONTENT_TYPES = ["text/part-handler"]
-PART_HANDLER_FN_TMPL = 'part-handler-%03d'
-UNDEF_HANDLER_VERSION = 1
-
-
-class PartHandler(object):
-    def __init__(self, frequency, version=2):
-        self.handler_version = version
-        self.frequency = frequency
-
-    def __repr__(self):
-        return "%s: [%s]" % (self.__class__.__name__, self.list_types())
-
-    def list_types(self):
-        raise NotImplementedError()
-
-    def handle_part(self, data, ctype, filename, payload, frequency):
-        return self._handle_part(data, ctype, filename, payload, frequency)
-
-    def _handle_part(self, data, ctype, filename, payload, frequency):
-        raise NotImplementedError()
-
-
-def fixup_module(mod):
-    if not hasattr(mod, "handler_version"):
-        setattr(mod, "handler_version", UNDEF_HANDLER_VERSION)
-    if not hasattr(mod, 'list_types'):
-        def empty_types():
-            return []
-        setattr(mod, 'list_types', empty_types)
-    if not hasattr(mod, frequency):
-        setattr(mod, 'frequency', PER_INSTANCE)
-    if not hasattr(mod, 'handle_part'):
-        def empty_handler(data, ctype, filename, payload):
-            pass
-        setattr(mod, 'handle_part', empty_handler)
-    return mod
-
-
-def find_module_files(root_dir):
-    entries = dict()
-    for fname in glob.glob(os.path.join(root_dir, "*.py")):
-        if not os.path.isfile(fname):
-            continue
-        modname = os.path.basename(fname)[0:-3]
-        entries[fname] = modname
-    return entries
-
-
-def run_part(mod, data, ctype, filename, payload, frequency):
-    # only add the handler if the module should run
-    mod_freq = getattr(mod, "frequency")
-    if not (mod_freq == PER_ALWAYS or
-            (frequency == PER_INSTANCE and mod_freq == PER_INSTANCE)):
-        return
-    try:
-        mod_ver = getattr(mod, 'handler_version')
-        if mod_ver == 1:
-            mod.handle_part(data, ctype, filename, payload)
-        else:
-            mod.handle_part(data, ctype, filename, payload, frequency)
-    except:
-        LOG.exception("Failed calling mod %s (%s, %s, %s) with frequency %s", mod, ctype, filename, mod_ver, frequency)
-
-
-def call_begin(mod, data, frequency):
-    run_part(mod, data, CONTENT_START, None, None, frequency)
-
-
-def call_end(mod, data, frequency):
-    run_part(mod, data, CONTENT_END, None, None, frequency)
-
-
-def walker_handle_handler(pdata, _ctype, _filename, payload):
-    curcount = pdata['handlercount']
-    modname = PART_HANDLER_FN_TMPL % (curcount)
-    frequency = pdata['frequency']
-    modfname = os.path.join(pdata['handlerdir'], "%s.py" % (modname))
-    # TODO: Check if path exists??
-    util.write_file(modfname, payload, 0600)
-    handlers = pdata['handlers']
-    try:
-        mod = fixup_module(importer.import_module(modname))
-        handlers.register(mod)
-        call_begin(mod, pdata['data'], frequency)
-        pdata['handlercount'] = curcount + 1
-    except:
-        LOG.exception("Failed at registered python file %s", modfname)
-
-
-def walker_callback(pdata, ctype, filename, payload):
-    # data here is the part_handlers array and then the data to pass through
-    if ctype in PART_CONTENT_TYPES:
-        walker_handle_handler(pdata, ctype, filename, payload)
-        return
-    handlers = pdata['handlers']
-    if ctype not in handlers:
-        if ctype == "text/x-not-multipart":
-            # Extract the first line or 24 bytes for displaying in the log
-            start = payload.split("\n", 1)[0][:24]
-            if start < payload:
-                details = "starting '%s...'" % start.encode("string-escape")
-            else:
-                details = repr(payload)
-            LOG.warning("Unhandled non-multipart userdata: %s", details)
-        return
-    run_part(handlers[ctype], pdata['data'], ctype, filename, payload, pdata['frequency'])
\ No newline at end of file
diff --git a/cloudinit/parts/boot_hook.py b/cloudinit/parts/boot_hook.py
deleted file mode 100644
index 881ffc58..00000000
--- a/cloudinit/parts/boot_hook.py
+++ /dev/null
@@ -1,42 +0,0 @@
-import os
-
-from cloudinit import util
-from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
-from cloudinit import log as logging
-from cloudinit import parts
-
-LOG = logging.getLogger(__name__)
-
-
-
-class BootHookPartHandler(parts.PartHandler):
-    def __init__(self, boothook_dir, instance_id):
-        parts.PartHandler.__init__(self, PER_ALWAYS)
-        self.boothook_dir = boothook_dir
-        self.instance_id = instance_id
-
-    def list_types(self):
-        return ['text/cloud-boothook']
-    
-    def _handle_part(self, _data, ctype, filename, payload, _frequency):
-        if ctype in [CONTENT_START, CONTENT_END]:
-            return
-
-        filename = util.clean_filename(filename)
-        payload = util.dos2unix(payload)
-        prefix = "#cloud-boothook"
-        start = 0
-        if payload.startswith(prefix):
-            start = len(prefix) + 1
-
-        filepath = os.path.join(self.boothook_dir, filename)
-        util.write_file(filepath, payload[start:], 0700)
-        try:
-            env = os.environ.copy()
-            env['INSTANCE_ID'] = str(self.instance_id)
-            util.subp([filepath], env=env)
-        except util.ProcessExecutionError as e:
-            LOG.error("Boothooks script %s returned %s", filepath, e.exit_code)
-        except Exception as e:
-            LOG.error("Boothooks unknown exception %s when running %s", e, filepath)
-
diff --git a/cloudinit/parts/cloud_config.py b/cloudinit/parts/cloud_config.py
deleted file mode 100644
index dab0e5f5..00000000
--- a/cloudinit/parts/cloud_config.py
+++ /dev/null
@@ -1,36 +0,0 @@
-import os
-
-from cloudinit import util
-from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
-from cloudinit import log as logging
-from cloudinit import parts
-
-LOG = logging.getLogger(__name__)
-
-
-
-class CloudConfigPartHandler(parts.PartHandler):
-    def __init__(self, cloud_fn):
-        parts.PartHandler.__init__(self, PER_ALWAYS)
-        self.cloud_buf = []
-        self.cloud_fn = cloud_fn
-
-    def list_types(self):
-        return ['text/cloud-config']
-
-    def _handle_part(self, _data, ctype, filename, payload, _frequency):
-        if ctype == CONTENT_START:
-            self.cloud_buf = []
-            return
-
-        if ctype == CONTENT_END:
-            payload = "\n".join(self.cloud_buf)
-            util.write_file(self.cloud_fn, payload, 0600)
-            self.cloud_buf = []
-            return
-
-        filename = util.clean_filename(filename)
-        entry = "\n".join(["#%s" % (filename), str(payload)])
-        self.config_buf.append(entry)
-
-
diff --git a/cloudinit/parts/shell_script.py b/cloudinit/parts/shell_script.py
deleted file mode 100644
index a248f198..00000000
--- a/cloudinit/parts/shell_script.py
+++ /dev/null
@@ -1,27 +0,0 @@
-import os
-
-from cloudinit import util
-from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
-from cloudinit import log as logging
-from cloudinit import parts
-
-LOG = logging.getLogger(__name__)
-
-
-class ShellScriptPartHandler(parts.PartHandler):
-
-    def __init__(self, script_dir):
-        parts.PartHandler.__init__(self, PER_ALWAYS)
-        self.script_dir = script_dir
-
-    def list_types(self):
-        return ['text/x-shellscript']
-
-    def _handle_part(self, _data, ctype, filename, payload, _frequency):
-        if ctype in [CONTENT_START, CONTENT_END]:
-            # maybe delete existing things here
-            return
-
-        filename = util.clean_filename(filename)
-        payload = util.dos2unix(payload)
-        util.write_file(os.path.join(self.script_dir, filename), payload, 0700)
diff --git a/cloudinit/parts/upstart_job.py b/cloudinit/parts/upstart_job.py
deleted file mode 100644
index 7b290d26..00000000
--- a/cloudinit/parts/upstart_job.py
+++ /dev/null
@@ -1,30 +0,0 @@
-import os
-
-from cloudinit import util
-from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
-from cloudinit import log as logging
-from cloudinit import parts
-
-LOG = logging.getLogger(__name__)
-
-
-class UpstartJobPartHandler(parts.PartHandler):
-    def __init__(self, upstart_dir):
-        parts.PartHandler.__init__(self, PER_INSTANCE)
-        self.upstart_dir = upstart_dir
-
-    def list_types(self):
-        return ['text/upstart-job']
-
-    def _handle_part(self, _data, ctype, filename, payload, frequency):
-        if ctype in [CONTENT_START, CONTENT_END]:
-            return
-
-        filename = utils.clean_filename(filename)
-        (name, ext) = os.path.splitext(filename)
-        ext = ext.lower()
-        if ext != ".conf":
-            filename = filename + ".conf"
-
-        payload = util.dos2unix(payload)
-        util.write_file(os.path.join(self.upstart_dir, filename), payload, 0644)
diff --git a/cloudinit/user_data/__init__.py b/cloudinit/user_data/__init__.py
new file mode 100644
index 00000000..6264a6cc
--- /dev/null
+++ b/cloudinit/user_data/__init__.py
@@ -0,0 +1,210 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+
+import os
+import glob
+
+import email
+
+from email.mime.base import MIMEBase
+
+from cloudinit import log as logging
+from cloudinit import util
+
+from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
+
+LOG = logging.getLogger(__name__)
+
+# Special content types that signal the start and end of processing
+CONTENT_END = "__end__"
+CONTENT_START = "__begin__"
+CONTENT_SIGNALS = [CONTENT_START, CONTENT_END]
+
+# Used when a part-handler type is encountered
+# to allow for registration of new types.
+PART_CONTENT_TYPES = ["text/part-handler"]
+PART_HANDLER_FN_TMPL = 'part-handler-%03d'
+
+# For parts without filenames
+PART_FN_TPL = 'part-%03d'
+
+# Used as the content type when a message is not multipart
+# and it doesn't contain its own content-type
+NOT_MULTIPART_TYPE = "text/x-not-multipart"
+
+# Different file beginnings to there content type
+INCLUSION_TYPES_MAP = {
+    '#include': 'text/x-include-url',
+    '#include-once': 'text/x-include-once-url',
+    '#!': 'text/x-shellscript',
+    '#cloud-config': 'text/cloud-config',
+    '#upstart-job': 'text/upstart-job',
+    '#part-handler': 'text/part-handler',
+    '#cloud-boothook': 'text/cloud-boothook',
+    '#cloud-config-archive': 'text/cloud-config-archive',
+}
+
+# Sorted longest first
+INCLUSION_SRCH = sorted(INCLUSION_TYPES_MAP.keys(), key=(lambda e: 0 - len(e)))
+
+
+class PartHandler(object):
+    def __init__(self, frequency, version=2):
+        self.handler_version = version
+        self.frequency = frequency
+
+    def __repr__(self):
+        return "%s: [%s]" % (self.__class__.__name__, self.list_types())
+
+    def list_types(self):
+        raise NotImplementedError()
+
+    def handle_part(self, data, ctype, filename, payload, frequency):
+        return self._handle_part(data, ctype, filename, payload, frequency)
+
+    def _handle_part(self, data, ctype, filename, payload, frequency):
+        raise NotImplementedError()
+
+
+def fixup_module(mod):
+    if not hasattr(mod, "handler_version"):
+        setattr(mod, "handler_version", 1)
+    if not hasattr(mod, 'list_types'):
+        def empty_types():
+            return []
+        setattr(mod, 'list_types', empty_types)
+    if not hasattr(mod, frequency):
+        setattr(mod, 'frequency', PER_INSTANCE)
+    if not hasattr(mod, 'handle_part'):
+        def empty_handler(data, ctype, filename, payload):
+            pass
+        setattr(mod, 'handle_part', empty_handler)
+    return mod
+
+
+def run_part(mod, data, ctype, filename, payload, frequency):
+    mod_freq = mod.frequency
+    if not (mod_freq == PER_ALWAYS or
+            (frequency == PER_INSTANCE and mod_freq == PER_INSTANCE)):
+        return
+    mod_ver = mod.handler_version
+    try:
+        if mod_ver == 1:
+            mod.handle_part(data, ctype, filename, payload)
+        else:
+            mod.handle_part(data, ctype, filename, payload, frequency)
+    except:
+        LOG.exception("Failed calling mod %s (%s, %s, %s) with frequency %s", mod, ctype, filename, mod_ver, frequency)
+
+
+def call_begin(mod, data, frequency):
+    run_part(mod, data, CONTENT_START, None, None, frequency)
+
+
+def call_end(mod, data, frequency):
+    run_part(mod, data, CONTENT_END, None, None, frequency)
+
+
+def walker_handle_handler(pdata, _ctype, _filename, payload):
+    curcount = pdata['handlercount']
+    modname = PART_HANDLER_FN_TMPL % (curcount)
+    frequency = pdata['frequency']
+    modfname = os.path.join(pdata['handlerdir'], "%s.py" % (modname))
+    # TODO: Check if path exists??
+    util.write_file(modfname, payload, 0600)
+    handlers = pdata['handlers']
+    try:
+        mod = fixup_module(importer.import_module(modname))
+        handlers.register(mod)
+        call_begin(mod, pdata['data'], frequency)
+        pdata['handlercount'] = curcount + 1
+    except:
+        LOG.exception("Failed at registered python file: %s", modfname)
+
+
+def walker_callback(pdata, ctype, filename, payload):
+    if ctype in PART_CONTENT_TYPES:
+        walker_handle_handler(pdata, ctype, filename, payload)
+        return
+    handlers = pdata['handlers']
+    if ctype not in handlers:
+        if ctype == NOT_MULTIPART_TYPE:
+            # Extract the first line or 24 bytes for displaying in the log
+            start = payload.split("\n", 1)[0][:24]
+            if start < payload:
+                details = "starting '%s...'" % start.encode("string-escape")
+            else:
+                details = repr(payload)
+            LOG.warning("Unhandled non-multipart userdata: %s", details)
+        return
+    run_part(handlers[ctype], pdata['data'], ctype, filename, payload, pdata['frequency'])
+
+
+# Callback is a function that will be called with 
+# (data, content_type, filename, payload)
+def walk(msg, callback, data):
+    partnum = 0
+    for part in msg.walk():
+        # multipart/* are just containers
+        if part.get_content_maintype() == 'multipart':
+            continue
+
+        ctype = part.get_content_type()
+        if ctype is None:
+            ctype = OCTET_TYPE
+
+        filename = part.get_filename()
+        if not filename:
+            filename = PART_FN_TPL % (partnum)
+
+        callback(data, ctype, filename, part.get_payload(decode=True))
+        partnum = partnum + 1
+
+
+# Coverts a raw string into a mime message
+def convert_string(self, raw_data, headers=None):
+    if not raw_data:
+        raw_data = ''
+    if not headers:
+        headers = {}
+    data = util.decomp_str(raw_data)
+    if "mime-version:" in data[0:4096].lower():
+        msg = email.message_from_string(data)
+        for (key, val) in headers.items():
+            if key in msg:
+                msg.replace_header(key, val)
+            else:
+                msg[key] = val
+    else:
+        mtype = headers.get("Content-Type", NOT_MULTIPART_TYPE)
+        maintype, subtype = mtype.split("/", 1)
+        msg = MIMEBase(maintype, subtype, *headers)
+        msg.set_payload(data)
+    return msg
+
+
+def type_from_starts_with(payload, default=None):
+    for text in INCLUSION_SRCH:
+        if payload.startswith(text):
+            return INCLUSION_TYPES_MAP[text]
+    return default
\ No newline at end of file
diff --git a/cloudinit/user_data/boot_hook.py b/cloudinit/user_data/boot_hook.py
new file mode 100644
index 00000000..4ce398ac
--- /dev/null
+++ b/cloudinit/user_data/boot_hook.py
@@ -0,0 +1,65 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+import os
+
+from cloudinit import log as logging
+from cloudinit import user_data as ud
+from cloudinit import util
+
+from cloudinit.settings import (PER_ALWAYS)
+
+LOG = logging.getLogger(__name__)
+
+
+class BootHookPartHandler(ud.PartHandler):
+    def __init__(self, boothook_dir, instance_id):
+        ud.PartHandler.__init__(self, PER_ALWAYS)
+        self.boothook_dir = boothook_dir
+        self.instance_id = instance_id
+
+    def list_types(self):
+        return [
+            ud.type_from_starts_with("#cloud-boothook"),
+        ]
+
+    def _handle_part(self, _data, ctype, filename, payload, _frequency):
+        if ctype in ud.CONTENT_SIGNALS:
+            return
+
+        filename = util.clean_filename(filename)
+        payload = util.dos2unix(payload)
+        prefix = "#cloud-boothook"
+        start = 0
+        if payload.startswith(prefix):
+            start = len(prefix) + 1
+
+        filepath = os.path.join(self.boothook_dir, filename)
+        util.write_file(filepath, payload[start:], 0700)
+        try:
+            env = os.environ.copy()
+            env['INSTANCE_ID'] = str(self.instance_id)
+            util.subp([filepath], env=env)
+        except util.ProcessExecutionError as e:
+            LOG.error("Boothooks script %s returned %s", filepath, e.exit_code)
+        except Exception as e:
+            LOG.error("Boothooks unknown exception %s when running %s", e, filepath)
diff --git a/cloudinit/user_data/cloud_config.py b/cloudinit/user_data/cloud_config.py
new file mode 100644
index 00000000..1c43f3a1
--- /dev/null
+++ b/cloudinit/user_data/cloud_config.py
@@ -0,0 +1,59 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+
+import os
+
+from cloudinit import log as logging
+from cloudinit import user_data as ud
+from cloudinit import util
+
+from cloudinit.settings import (PER_ALWAYS)
+
+LOG = logging.getLogger(__name__)
+
+
+class CloudConfigPartHandler(ud.PartHandler):
+    def __init__(self, cloud_fn):
+        ud.PartHandler.__init__(self, PER_ALWAYS)
+        self.cloud_buf = []
+        self.cloud_fn = cloud_fn
+
+    def list_types(self):
+        return [
+            ud.type_from_starts_with("#cloud-config"),
+        ]
+
+    def _handle_part(self, _data, ctype, filename, payload, _frequency):
+        if ctype == ud.CONTENT_START:
+            self.cloud_buf = []
+            return
+
+        if ctype == ud.CONTENT_END:
+            payload = "\n".join(self.cloud_buf)
+            util.write_file(self.cloud_fn, payload, 0600)
+            self.cloud_buf = []
+            return
+
+        filename = util.clean_filename(filename)
+        entry = "\n".join(["#%s" % (filename), str(payload)])
+        self.config_buf.append(entry)
diff --git a/cloudinit/user_data.py b/cloudinit/user_data/processor.py
similarity index 73%
rename from cloudinit/user_data.py
rename to cloudinit/user_data/processor.py
index f35e5d38..d4de9470 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data/processor.py
@@ -1,10 +1,12 @@
 # vi: ts=4 expandtab
 #
-#    Copyright (C) 2009-2010 Canonical Ltd.
+#    Copyright (C) 2012 Canonical Ltd.
 #    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Hafliger <juerg.haefliger@hp.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -22,7 +24,6 @@ import hashlib
 import os
 import urllib
 
-import email
 from email.mime.multipart import MIMEMultipart
 from email.mime.text import MIMEText
 from email.mime.base import MIMEBase
@@ -30,33 +31,17 @@ from email.mime.base import MIMEBase
 import yaml
 
 from cloudinit import url_helper
+from cloudinit import user_data as ud
 from cloudinit import util
 
-
-# Different file beginnings to there content type
-INCLUSION_TYPES_MAP = {
-    '#include': 'text/x-include-url',
-    '#include-once': 'text/x-include-once-url',
-    '#!': 'text/x-shellscript',
-    '#cloud-config': 'text/cloud-config',
-    '#upstart-job': 'text/upstart-job',
-    '#part-handler': 'text/part-handler',
-    '#cloud-boothook': 'text/cloud-boothook',
-    '#cloud-config-archive': 'text/cloud-config-archive',
-}
-
 # Various special content types
 TYPE_NEEDED = ["text/plain", "text/x-not-multipart"]
 INCLUDE_TYPES = ['text/x-include-url', 'text/x-include-once-url']
 ARCHIVE_TYPES = ["text/cloud-config-archive"]
 UNDEF_TYPE = "text/plain"
 ARCHIVE_UNDEF_TYPE = "text/cloud-config"
-NOT_MULTIPART_TYPE = "text/x-not-multipart"
 OCTET_TYPE = 'application/octet-stream'
 
-# Sorted longest first
-INCLUSION_SRCH = sorted(INCLUSION_TYPES_MAP.keys(), key=(lambda e: 0 - len(e)))
-
 # Msg header used to track attachments
 ATTACHMENT_FIELD = 'Number-Attachments'
 
@@ -64,16 +49,13 @@ ATTACHMENT_FIELD = 'Number-Attachments'
 # When we want to make sure a entry isn't included more than once across sessions.
 INCLUDE_ONCE_HASHER = 'md5'
 
-# For those pieces without filenames
-PART_FN_TPL = 'part-%03d'
-
 
 class UserDataProcessor(object):
     def __init__(self, paths):
         self.paths = paths
 
     def process(self, blob):
-        base_msg = convert_string(blob)
+        base_msg = ud.convert_string(blob)
         process_msg = MIMEMultipart()
         self._process_msg(base_msg, process_msg)
         return process_msg
@@ -92,7 +74,7 @@ class UserDataProcessor(object):
                 ctype_orig = UNDEF_TYPE
     
             if ctype_orig in TYPE_NEEDED:
-                ctype = type_from_starts_with(payload)
+                ctype = ud.type_from_starts_with(payload)
     
             if ctype is None:
                 ctype = ctype_orig
@@ -146,7 +128,7 @@ class UserDataProcessor(object):
                 if not url_helper.ok_http_code(st):
                     content = ''
 
-            new_msg = convert_string(content)
+            new_msg = ud.convert_string(content)
             self._process_msg(new_msg, append_msg)
 
     def _explode_archive(self, archive, append_msg):
@@ -173,7 +155,7 @@ class UserDataProcessor(object):
             content = ent.get('content', '')
             mtype = ent.get('type')
             if not mtype:
-                mtype = type_from_starts_with(content, ARCHIVE_UNDEF_TYPE)
+                mtype = ud.type_from_starts_with(content, ARCHIVE_UNDEF_TYPE)
 
             maintype, subtype = mtype.split('/', 1)
             if maintype == "text":
@@ -217,55 +199,7 @@ class UserDataProcessor(object):
         """
         cur = self._multi_part_count(outer_msg)
         if not part.get_filename():
-            part.add_header('Content-Disposition', 'attachment', filename=PART_FN_TPL % (cur + 1))
+            fn = ud.PART_FN_TPL % (cur + 1)
+            part.add_header('Content-Disposition', 'attachment', filename=fn)
         outer_msg.attach(part)
         self._multi_part_count(outer_msg, cur + 1)
-
-
-# Callback is a function that will be called with 
-# (data, content_type, filename, payload)
-def walk(ud_msg, callback, data):
-    partnum = 0
-    for part in ud_msg.walk():
-        # multipart/* are just containers
-        if part.get_content_maintype() == 'multipart':
-            continue
-
-        ctype = part.get_content_type()
-        if ctype is None:
-            ctype = OCTET_TYPE
-
-        filename = part.get_filename()
-        if not filename:
-            filename = PART_FN_TPL % partnum
-
-        callback(data, ctype, filename, part.get_payload(decode=True))
-        partnum = partnum + 1
-
-
-def convert_string(self, raw_data, headers=None):
-    if not data:
-        data = ''
-    if not headers:
-        headers = {}
-    data = util.decomp_str(raw_data)
-    if "mime-version:" in data[0:4096].lower():
-        msg = email.message_from_string(data)
-        for (key, val) in headers.items():
-            if key in msg:
-                msg.replace_header(key, val)
-            else:
-                msg[key] = val
-    else:
-        mtype = headers.get("Content-Type", NOT_MULTIPART_TYPE)
-        maintype, subtype = mtype.split("/", 1)
-        msg = MIMEBase(maintype, subtype, *headers)
-        msg.set_payload(data)
-    return msg
-
-
-def type_from_starts_with(payload, default=None):
-    for text in INCLUSION_SRCH:
-        if payload.startswith(text):
-            return INCLUSION_TYPES_MAP[text]
-    return default
diff --git a/cloudinit/user_data/shell_script.py b/cloudinit/user_data/shell_script.py
new file mode 100644
index 00000000..d666b9c4
--- /dev/null
+++ b/cloudinit/user_data/shell_script.py
@@ -0,0 +1,53 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+
+import os
+
+from cloudinit import log as logging
+from cloudinit import user_data as ud
+from cloudinit import util
+
+from cloudinit.settings import (PER_ALWAYS)
+
+LOG = logging.getLogger(__name__)
+
+
+class ShellScriptPartHandler(ud.PartHandler):
+    """Write parts whose type maps from '#!' into script_dir (mode 0700)."""
+    def __init__(self, script_dir):
+        ud.PartHandler.__init__(self, PER_ALWAYS)
+        self.script_dir = script_dir
+
+    def list_types(self):
+        return [
+            ud.type_from_starts_with("#!"),
+        ]
+
+    def _handle_part(self, _data, ctype, filename, payload, _frequency):
+        if ctype in ud.CONTENT_SIGNALS:
+            # maybe delete existing things here
+            return
+
+        filename = util.clean_filename(filename)
+        payload = util.dos2unix(payload)
+        util.write_file(os.path.join(self.script_dir, filename), payload, 0700)
diff --git a/cloudinit/user_data/upstart_job.py b/cloudinit/user_data/upstart_job.py
new file mode 100644
index 00000000..d15e66c4
--- /dev/null
+++ b/cloudinit/user_data/upstart_job.py
@@ -0,0 +1,56 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+
+import os
+
+from cloudinit import log as logging
+from cloudinit import user_data as ud
+from cloudinit import util
+
+from cloudinit.settings import (PER_INSTANCE)
+
+LOG = logging.getLogger(__name__)
+
+
+class UpstartJobPartHandler(ud.PartHandler):
+    def __init__(self, upstart_dir):
+        ud.PartHandler.__init__(self, PER_INSTANCE)
+        self.upstart_dir = upstart_dir
+
+    def list_types(self):
+        return [
+            ud.type_from_starts_with("#upstart-job"),
+        ]
+
+    def _handle_part(self, _data, ctype, filename, payload, frequency):
+        if ctype in ud.CONTENT_SIGNALS:
+            return
+
+        filename = util.clean_filename(filename)
+        (_name, ext) = os.path.splitext(filename)
+        ext = ext.lower()
+        if ext != ".conf":  # append '.conf' unless present (any case)
+            filename = filename + ".conf"
+
+        payload = util.dos2unix(payload)
+        util.write_file(os.path.join(self.upstart_dir, filename), payload, 0644)

From 943a2d09189558661c6a0fd0c433e37353124652 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:31:56 -0700
Subject: [PATCH 039/434] Move most of this functionality to either cloud-init
 object or utils.

---
 cloudinit/__init__.py | 93 +++----------------------------------------
 1 file changed, 6 insertions(+), 87 deletions(-)

diff --git a/cloudinit/__init__.py b/cloudinit/__init__.py
index c38b3b09..ab0603e0 100644
--- a/cloudinit/__init__.py
+++ b/cloudinit/__init__.py
@@ -1,11 +1,12 @@
 # vi: ts=4 expandtab
 #
-#    Common code for the EC2 initialisation scripts in Ubuntu
-#    Copyright (C) 2008-2009 Canonical Ltd
+#    Copyright (C) 2012 Canonical Ltd.
 #    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
-#    Author: Soren Hansen <soren@canonical.com>
+#    Author: Scott Moser <scott.moser@canonical.com>
 #    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -18,99 +19,17 @@
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-#
 
-import os
-
-import sys
-import errno
-import subprocess
-import yaml
-import glob
-
-from cloudinit import log as logging
-from cloudinit import sources
-from cloudinit import url_helper as uhelp
 from cloudinit import util
 
-from cloudinit.settings import (VAR_LIB_DIR, CFG_BUILTIN, CLOUD_CONFIG,
-                                 BOOT_FINISHED, CUR_INSTANCE_LINK)
-
-LOG = logging.getLogger(__name__)
-
-INIT_SUBDIRS = [
-    os.path.join(VAR_LIB_DIR, 'scripts'),
-    os.path.join(VAR_LIB_DIR, 'scripts', 'per-instance'),
-    os.path.join(VAR_LIB_DIR, 'scripts', 'per-once'),
-    os.path.join(VAR_LIB_DIR, 'scripts', 'per-boot'),
-    os.path.join(VAR_LIB_DIR, 'seed'),
-    os.path.join(VAR_LIB_DIR, 'instances'),
-    os.path.join(VAR_LIB_DIR, 'handlers'),
-    os.path.join(VAR_LIB_DIR, 'sem'),
-    os.path.join(VAR_LIB_DIR, 'data'),
-]
-
-
-def initfs():
-    util.ensure_dirs(INIT_SUBDIRS)
-    cfg = util.get_base_cfg(CLOUD_CONFIG, get_builtin_cfg())
-    log_file = util.get_cfg_option_str(cfg, 'def_log_file', None)
-    perms = util.get_cfg_option_str(cfg, 'syslog_fix_perms', None)
-    if log_file:
-        util.ensure_file(log_file)
-        if perms:
-            (u, g) = perms.split(':', 1)
-            if u == "-1" or u == "None":
-                u = None
-            if g == "-1" or g == "None":
-                g = None
-            util.chownbyname(log_file, u, g)
-
-
-def purge_cache(rmcur=True):
-    rmlist = [BOOT_FINISHED]
-    if rmcur:
-        rmlist.append(CUR_INSTANCE_LINK)
-    for f in rmlist:
-        util.unlink(f)
-    return True
+from cloudinit.settings import (CFG_BUILTIN, CLOUD_CONFIG)
 
 
 def get_base_cfg(cfg_path=None):
-    if cfg_path is None:
+    if not cfg_path:
         cfg_path = CLOUD_CONFIG
     return util.get_base_cfg(cfg_path, get_builtin_cfg())
 
 
 def get_builtin_cfg():
     return dict(CFG_BUILTIN)
-
-
-def list_sources(cfg_list, depends):
-    return sources.list_sources(cfg_list, depends, ["cloudinit", ""])
-
-
-def get_cmdline_url(names=None, starts=None, cmdline=None):
-    if cmdline is None:
-        cmdline = util.get_cmdline()
-    if not names:
-        names = ('cloud-config-url', 'url')
-    if not starts:
-        starts = "#cloud-config"
-
-    data = util.keyval_str_to_dict(cmdline)
-    url = None
-    key = None
-    for key in names:
-        if key in data:
-            url = data[key]
-            break
-
-    if url is None:
-        return (None, None, None)
-
-    contents = uhelp.readurl(url)
-    if contents.startswith(starts):
-        return (key, url, contents)
-
-    return (key, url, None)

From 9c59c098855475c309cec0ae457693c24bf20f32 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:32:50 -0700
Subject: [PATCH 040/434] More init fs here, cleanup after user_data file moves
 + other cleanups.

---
 cloudinit/cloud.py | 199 ++++++++++++++++++++++++++++++++-------------
 1 file changed, 144 insertions(+), 55 deletions(-)

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index f9c0d531..80d4f1ce 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -1,34 +1,57 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
 from time import time
 
 import cPickle as pickle
+
 import contextlib
 import copy
 import os
 import sys
 import weakref
 
-from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS,
-                                OLD_CLOUD_CONFIG, CLOUD_CONFIG,
-                                CUR_INSTANCE_LINK)
+from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS)
+from cloudinit.settings import (OLD_CLOUD_CONFIG, CLOUD_CONFIG)
+
 from cloudinit import (get_builtin_cfg, get_base_cfg)
 from cloudinit import log as logging
 from cloudinit import sources
 from cloudinit import util
-from cloudinit import user_data
 from cloudinit import handlers
 
-from cloudinit import parts
-from cloudinit.parts import boot_hook as bh_part
-from cloudinit.parts import cloud_config as cc_part
-from cloudinit.parts import upstart_job as up_part
-from cloudinit.parts import shell_script as ss_part
+from cloudinit import user_data as ud
+from cloudinit.user_data import boot_hook as bh_part
+from cloudinit.user_data import cloud_config as cc_part
+from cloudinit.user_data import processor as ud_proc
+from cloudinit.user_data import shell_script as ss_part
+from cloudinit.user_data import upstart_job as up_part
 
 LOG = logging.getLogger(__name__)
 
 
 class CloudSemaphores(object):
-    def __init__(self, paths):
-        self.paths = paths
+    def __init__(self, sem_path):
+        self.sem_path = sem_path
 
     # acquire lock on 'name' for given 'freq' and run function 'func'
     # if 'clear_on_fail' is True and 'func' throws an exception
@@ -71,7 +94,7 @@ class CloudSemaphores(object):
         # here, but this should be ok due to the nature of when
         # and where cloud-init runs... (file writing is not a lock..)
         sem_file = self._getpath(name, freq)
-        contents = "%s\n" % str(time())
+        contents = "%s: %s\n" % (os.getpid(), time())
         try:
             util.write_file(sem_file, contents)
         except (IOError, OSError):
@@ -87,28 +110,37 @@ class CloudSemaphores(object):
         return False
 
     def _get_path(self, name, freq):
-        sem_path = self.init.get_ipath("sem")
+        sem_path = self.sem_path
         if freq == PER_INSTANCE:
             return os.path.join(sem_path, name)
         return os.path.join(sem_path, "%s.%s" % (name, freq))
 
 
 class CloudPaths(object):
-    def __init__(self, init):
-        self.config = CLOUD_CONFIG
-        self.old_config = OLD_CLOUD_CONFIG
-        self.var_dir = VAR_LIB_DIR
-        self.instance_link = CUR_INSTANCE_LINK
-        self.init = weakref.proxy(init)
-        self.upstart_conf_d = "/etc/init"
-
-    def _get_path_key(self, name):
-        return PATH_MAP.get(name)
+    def __init__(self, sys_info):
+        self.cloud_dir = sys_info['cloud_dir']
+        self.instance_link = os.path.join(self.cloud_dir, 'instance')
+        self.boot_finished = os.path.join(self.instance_link, "boot-finished")
+        self.upstart_conf_d = sys_info.get('upstart_dir')
+        self.template_dir = sys_info['templates_dir']
+        self.seed_dir = os.path.join(self.cloud_dir, 'seed')
+        self.datasource = None
+        self.lookups = {
+           "handlers": "handlers",
+           "scripts": "scripts",
+           "sem": "sem",
+           "boothooks": "boothooks",
+           "userdata_raw": "user-data.txt",
+           "userdata": "user-data.txt.i",
+           "obj_pkl": "obj.pkl",
+           "cloud_config": "cloud-config.txt",
+           "data": "data",
+        }
 
     # get_ipath_cur: get the current instance path for an item
     def get_ipath_cur(self, name=None):
-        add_on = self._get_path_key(name)
-        ipath = os.path.join(self.var_dir, 'instance')
+        ipath = os.path.join(self.cloud_dir, 'instance')
+        add_on = self.lookups.get(name)
         if add_on:
             ipath = os.path.join(ipath, add_on)
         return ipath
@@ -117,7 +149,7 @@ class CloudPaths(object):
     # for a name in dirmap
     def get_cpath(self, name=None):
-        cpath = self.var_dir
-        add_on = self._get_path_key(name)
+        cpath = self.cloud_dir
+        add_on = self.lookups.get(name)
         if add_on:
             cpath = os.path.join(cpath, add_on)
         return cpath
@@ -125,18 +157,21 @@ class CloudPaths(object):
     # get_ipath : get the instance path for a name in pathmap
     # (/var/lib/cloud/instances/<instance>/<name>)
     def get_ipath(self, name=None):
-        iid = self.init.datasource.get_instance_id()
-        ipath = os.path.join(self.var_dir, 'instances', iid)
-        add_on = self._get_path_key(name)
+        if not self.datasource:
+            raise RuntimeError("Unable to get instance path, datasource not available/set.")
+        iid = self.datasource.get_instance_id()
+        ipath = os.path.join(self.cloud_dir, 'instances', iid)
+        add_on = self.lookups.get(name)
         if add_on:
             ipath = os.path.join(ipath, add_on)
         return ipath
 
 
 class CloudSimple(object):
-    def __init__(self, init):
-        self.datasource = init.datasource
-        self.paths = init.paths
+    def __init__(self, ci):
+        self.datasource = ci.datasource
+        self.paths = ci.paths
+        self.cfg = copy.deepcopy(ci.cfg)
 
     def get_userdata(self):
         return self.datasource.get_userdata()
@@ -173,8 +208,8 @@ class CloudInit(object):
             self.ds_deps = ds_deps
         else:
             self.ds_deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
-        self.paths = CloudPaths(self)
         self.cfg = self._read_cfg()
+        self.paths = CloudPaths(self.cfg['system_info'])
 
     def _read_cfg_old(self):
         # support reading the old ConfigObj format file and merging
@@ -185,56 +220,110 @@ class CloudInit(object):
             ConfigObj = None
         if not ConfigObj:
             return {}
-        old_cfg = ConfigObj(self.paths.old_config_fn)
+        old_cfg = ConfigObj(OLD_CLOUD_CONFIG)
         return dict(old_cfg)
 
-    def read_cfg(self):
-        if not self.cfg:
-            self.cfg = self._read_cfg()
-        return self.cfg
+    def _initial_subdirs(self):
+        c_dir = self.paths.cloud_dir
+        initial_dirs = [
+            os.path.join(c_dir, 'scripts'),
+            os.path.join(c_dir, 'scripts', 'per-instance'),
+            os.path.join(c_dir, 'scripts', 'per-once'),
+            os.path.join(c_dir, 'scripts', 'per-boot'),
+            os.path.join(c_dir, 'seed'),
+            os.path.join(c_dir, 'instances'),
+            os.path.join(c_dir, 'handlers'),
+            os.path.join(c_dir, 'sem'),
+            os.path.join(c_dir, 'data'),
+        ]
+        return initial_dirs
+
+    def purge_cache(self, rmcur=True):
+        rmlist = []
+        rmlist.append(self.paths.boot_finished)
+        if rmcur:
+            rmlist.append(self.paths.instance_link)
+        for f in rmlist:
+            util.unlink(f)
+        return len(rmlist)
+
+    def init_fs(self):
+        util.ensure_dirs(self._initial_subdirs())
+        log_file = util.get_cfg_option_str(self.cfg, 'def_log_file', None)
+        perms = util.get_cfg_option_str(self.cfg, 'syslog_fix_perms', None)
+        if log_file:
+            util.ensure_file(log_file)
+            if perms:
+                (u, g) = perms.split(':', 1)
+                if u == "-1" or u == "None":
+                    u = None
+                if g == "-1" or g == "None":
+                    g = None
+                util.chownbyname(log_file, u, g)
 
     def _read_cfg(self):
         starting_config = get_builtin_cfg()
         try:
-            conf = get_base_cfg(self.paths.config, starting_config)
+            conf = get_base_cfg(CLOUD_CONFIG)
         except Exception:
             conf = starting_config
         old_conf = self._read_cfg_old()
         conf = util.mergedict(conf, old_conf)
         return conf
     
-    def restore_from_cache(self):
+    def _restore_from_cache(self):
         pickled_fn = self.paths.get_ipath_cur('obj_pkl')
         try:
             # we try to restore from a current link and static path
             # by using the instance link, if purge_cache was called
             # the file wont exist
-            self.datasource = pickle.loads(util.load_file(pickled_fn))
-            return True
+            return pickle.loads(util.load_file(pickled_fn))
         except Exception as e:
             LOG.debug("Failed loading pickled datasource from %s due to %s", pickled_fn, e)
             return False
-    
+
     def write_to_cache(self):
         pickled_fn = self.paths.get_ipath_cur("obj_pkl")
         try:
             contents = pickle.dumps(self.datasource)
             util.write_file(pickled_fn, contents, mode=0400)
         except Exception as e:
-            LOG.debug("Failed pickling datasource to %s due to %s", pickled_fn, e)
+            LOG.debug("Failed pickling datasource to %s due to: %s", pickled_fn, e)
             return False
-    
+
+    def _get_processor(self):
+        return ud_proc.UserDataProcessor(self.paths)
+
+    def _get_datasources(self):
+        # Any config provided???
+        pkg_list = self.cfg.get('datasource_pkg_list') or []
+        # Add the defaults at the end
+        for n in [util.obj_name(sources), '']:
+            if n not in pkg_list:
+                pkg_list.append(n)
+        cfg_list = self.cfg.get('datasource_list') or []
+        return (cfg_list, pkg_list)
+
     def get_data_source(self):
         if self.datasource:
             return True
-        if self.restore_from_cache():
-            LOG.debug("Restored from cache datasource: %s" % self.datasource)
-            return True
-        (ds, dsname) = sources.find_source(self.cfg, self.ds_deps)
-        LOG.debug("Loaded datasource %s:%s", dsname, ds)
+        ds = self._restore_from_cache()
+        if ds:
+            LOG.debug("Restored from cache datasource: %s" % ds)
+        else:
+            (cfg_list, pkg_list) = self._get_datasources()
+            ud_proc = self._get_processor()
+            (ds, dsname) = sources.find_source(self.cfg,
+                                               self.ds_deps,
+                                               cfg_list=cfg_list,
+                                               pkg_list=pkg_list,
+                                               ud_proc=ud_proc)
+            LOG.debug("Loaded datasource %s - %s", dsname, ds)
         self.datasource = ds
+        # This allows the paths obj to have an ipath function that works
+        self.paths.datasource = ds
         return True
-    
+
     def set_cur_instance(self):
         # Ensure we are hooked into the right symlink for the current instance
         idir = self.paths.get_ipath()
@@ -299,7 +388,7 @@ class CloudInit(object):
         handlers = CloudHandlers(self)
 
         # Add handlers in cdir
-        potential_handlers = parts.find_module_files(cdir)
+        potential_handlers = utils.find_modules(cdir)
         for (fname, modname) in potential_handlers.iteritems():
             try:
                 mod = parts.fixup_module(importer.import_module(modname))
@@ -329,7 +418,7 @@ class CloudInit(object):
             'frequency': frequency,
             'handlercount': 0,
         }
-        user_data.walk(data.get_userdata(), parts.walker_callback, data=part_data)
+        ud.walk(data.get_userdata(), parts.walker_callback, data=part_data)
 
         # Give callbacks opportunity to finalize
         called = []
@@ -394,11 +483,11 @@ class CloudHandlers(object):
 
 
 class CloudConfig(object):
-
     def __init__(self, cfgfile, cloud):
-        self.cloud = CloudSimple(cloud)
+        self.cloud = cloud
         self.cfg = self._get_config(cfgfile)
-        self.sems = CloudSemaphores(self.cloud.paths)
+        self.paths = cloud.paths
+        self.sems = CloudSemaphores(self.paths.get_ipath("sem"))
 
     def _get_config(self, cfgfile):
         cfg = None
@@ -433,5 +522,5 @@ class CloudConfig(object):
         if not freq:
             freq = def_freq
         c_name = "config-%s" % (name)
-        real_args = [name, copy.deepcopy(self.cfg), self.cloud, LOG, copy.deepcopy(args)]
+        real_args = [name, copy.deepcopy(self.cfg), CloudSimple(self.cloud), LOG, copy.deepcopy(args)]
         return self.sems.run_functor(c_name, freq, mod.handle, real_args)

From e72987eba1e2f1cc9f40adff32f6817aa70e4986 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:33:20 -0700
Subject: [PATCH 041/434] Add copyright + index hash directly instead of get.

---
 cloudinit/importer.py | 24 ++++++++++++++++++++++--
 1 file changed, 22 insertions(+), 2 deletions(-)

diff --git a/cloudinit/importer.py b/cloudinit/importer.py
index deea0956..0344d0de 100644
--- a/cloudinit/importer.py
+++ b/cloudinit/importer.py
@@ -1,4 +1,24 @@
-# vim: tabstop=4 shiftwidth=4 softtabstop=4
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
 import sys
 
@@ -6,6 +26,6 @@ import sys
 def import_module(module_name):
     try:
         __import__(module_name)
-        return sys.modules.get(module_name, None)
+        return sys.modules[module_name]
     except ImportError as err:
         raise RuntimeError('Could not load module %s: %s' % (module_name, err))

From 5914f9556dc5c40a83b615d8c52141aefe89f0ec Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:33:44 -0700
Subject: [PATCH 042/434] Add copyright.

---
 cloudinit/log.py | 23 ++++++++++++++++++++++-
 1 file changed, 22 insertions(+), 1 deletion(-)

diff --git a/cloudinit/log.py b/cloudinit/log.py
index 2dda405d..341b329b 100644
--- a/cloudinit/log.py
+++ b/cloudinit/log.py
@@ -1,4 +1,25 @@
-# vim: tabstop=4 shiftwidth=4 softtabstop=4
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
 
 import logging
 import logging.handlers

From 1b524376ee60c28619b210960f1b6ed3f3989245 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:34:06 -0700
Subject: [PATCH 043/434] Add copyright.

---
 cloudinit/mounting.py | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)

diff --git a/cloudinit/mounting.py b/cloudinit/mounting.py
index b72f729a..b78cb5bd 100644
--- a/cloudinit/mounting.py
+++ b/cloudinit/mounting.py
@@ -1,3 +1,25 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
 import contextlib
 
 from cloudinit import util

From 28af2a6a9acb478b47fe632a16c922fa42f79775 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:34:52 -0700
Subject: [PATCH 044/434] Remove pathmap and make this a part of the CloudPath
 object, add copyright and format built in config

---
 cloudinit/settings.py | 63 +++++++++++++++++++++++++------------------
 1 file changed, 37 insertions(+), 26 deletions(-)

diff --git a/cloudinit/settings.py b/cloudinit/settings.py
index 830d970d..f58c4b52 100644
--- a/cloudinit/settings.py
+++ b/cloudinit/settings.py
@@ -1,40 +1,51 @@
-import os
-
-VAR_LIB_DIR = '/var/lib/cloud'
-CUR_INSTANCE_LINK = os.path.join(VAR_LIB_DIR, "instance")
-BOOT_FINISHED = os.path.join(CUR_INSTANCE_LINK, "boot-finished")
-SEED_DIR = os.path.join(VAR_LIB_DIR, "seed")
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
 CFG_ENV_NAME = "CLOUD_CFG"
 CLOUD_CONFIG = '/etc/cloud/cloud.cfg'
 OLD_CLOUD_CONFIG = '/etc/ec2-init/ec2-config.cfg'
 
 CFG_BUILTIN = {
-    'datasource_list': ['NoCloud',
-                        'ConfigDrive',
-                        'OVF',
-                        'MAAS',
-                        'Ec2',
-                        'CloudStack'],
+    'datasource_list': [
+        'NoCloud',
+        'ConfigDrive',
+        'OVF',
+        'MAAS',
+        'Ec2',
+        'CloudStack'
+    ],
     'def_log_file': '/var/log/cloud-init.log',
     'log_cfgs': [],
-    'syslog_fix_perms': 'syslog:adm'
-}
-
-PATH_MAP = {
-   "handlers": "handlers",
-   "scripts": "scripts",
-   "sem": "sem",
-   "boothooks": "boothooks",
-   "userdata_raw": "user-data.txt",
-   "userdata": "user-data.txt.i",
-   "obj_pkl": "obj.pkl",
-   "cloud_config": "cloud-config.txt",
-   "data": "data",
+    'syslog_fix_perms': 'syslog:adm',
+    'system_info': {
+        'paths': {
+            'cloud_dir': '/var/lib/cloud',
+            'templates_dir': '/etc/cloud/templates/',
+        }, 
+        'distro': 'ubuntu',
+    },
 }
 
 PER_INSTANCE = "once-per-instance"
 PER_ALWAYS = "always"
 PER_ONCE = "once"
 
-TEMPLATE_DIR = '/etc/cloud/templates/'

From ff2f2f58420b843c052d45d8332b3b7638a13eca Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:35:39 -0700
Subject: [PATCH 045/434] Cleanup this and add refactoring around large
 constructors (add a parse method). Handle error cases better...

---
 cloudinit/ssh_util.py | 265 ++++++++++++++++++++++++------------------
 1 file changed, 149 insertions(+), 116 deletions(-)

diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index 1483f718..93fd55dd 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -20,42 +20,70 @@
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
 import os
-import os.path
-import cloudinit.util as util
+import pwd
+
+from cloudinit import log as logging
+from cloudinit import util
+
+LOG = logging.getLogger(__name__)
 
 
-class AuthKeyEntry():
-    # lines are options, keytype, base64-encoded key, comment
-    # man page says the following which I did not understand:
-    #   The options field is optional; its presence is determined by whether
-    #   the line starts with a number or not (the options field never starts
-    #   with a number)
-    options = None
-    keytype = None
-    base64 = None
-    comment = None
-    is_comment = False
-    line_in = ""
+class AuthKeyEntry(object):
+    """
+    AUTHORIZED_KEYS FILE FORMAT
+     AuthorizedKeysFile specifies the file containing public keys for public
+     key authentication; if none is specified, the default is
+     ~/.ssh/authorized_keys.  Each line of the file contains one key (empty
+     (because of the size of the public key encoding) up to a limit of 8 kilo-
+     bytes, which permits DSA keys up to 8 kilobits and RSA keys up to 16
+     kilobits.  You don't want to type them in; instead, copy the
+     identity.pub, id_dsa.pub, or the id_rsa.pub file and edit it.
+
+     sshd enforces a minimum RSA key modulus size for protocol 1 and protocol
+     2 keys of 768 bits.
+
+     The options (if present) consist of comma-separated option specifica-
+     tions.  No spaces are permitted, except within double quotes.  The fol-
+     lowing option specifications are supported (note that option keywords are
+     case-insensitive):
+    """
 
     def __init__(self, line, def_opt=None):
-        line = line.rstrip("\n\r")
-        self.line_in = line
-        if line.startswith("#") or line.strip() == "":
-            self.is_comment = True
+        self.line = str(line)
+        (self.value, self.components) = self._parse(self.line, def_opt)
+
+    def _form_components(self, toks):
+        components = {}
+        if len(toks) == 1:
+            components['base64'] = toks[0]
+        elif len(toks) == 2:
+            components['base64'] = toks[0]
+            components['comment'] = toks[1]
+        elif len(toks) == 3:
+            components['keytype'] = toks[0]
+            components['base64'] = toks[1]
+            components['comment'] = toks[2]
+        return components
+
+    def get(self, piece):
+        return self.components.get(piece)
+
+    def _parse(self, in_line, def_opt):
+        line = in_line.rstrip("\r\n")
+        if line.startswith("#") or line.strip() == '':
+            return (False, {})
         else:
             ent = line.strip()
             toks = ent.split(None, 3)
-            if len(toks) == 1:
-                self.base64 = toks[0]
-            elif len(toks) == 2:
-                (self.base64, self.comment) = toks
-            elif len(toks) == 3:
-                (self.keytype, self.base64, self.comment) = toks
-            elif len(toks) == 4:
-                i = 0
-                ent = line.strip()
-                quoted = False
+            tmp_components = {}
+            if def_opt:
+                tmp_components['options'] = def_opt
+            if len(toks) < 4:
+                tmp_components.update(self._form_components(toks))
+            else:
                 # taken from auth_rsa_key_allowed in auth-rsa.c
+                i = 0
+                quoted = False
                 try:
                     while (i < len(ent) and
                            ((quoted) or (ent[i] not in (" ", "\t")))):
@@ -67,124 +95,129 @@ class AuthKeyEntry():
                             quoted = not quoted
                         i = i + 1
                 except IndexError:
-                    self.is_comment = True
-                    return
-
+                    return (False, {})
                 try:
-                    self.options = ent[0:i]
-                    (self.keytype, self.base64, self.comment) = \
-                        ent[i + 1:].split(None, 3)
-                except ValueError:
-                    # we did not understand this line
-                    self.is_comment = True
+                    options = ent[0:i]
+                    toks = ent[i + 1:].split(None, 3)
+                    if options:
+                        tmp_components['options'] = options
+                    tmp_components.update(self._form_components(toks))
+                except (IndexError, ValueError):
+                    return (False, {})
+            # We got some useful value!
+            return (True, tmp_components)
 
-        if self.options == None and def_opt:
-            self.options = def_opt
-
-        return
-
-    def debug(self):
-        print("line_in=%s\ncomment: %s\noptions=%s\nkeytype=%s\nbase64=%s\n"
-              "comment=%s\n" % (self.line_in, self.is_comment, self.options,
-                                self.keytype, self.base64, self.comment)),
-
-    def __repr__(self):
-        if self.is_comment:
-            return(self.line_in)
+    def __str__(self):
+        if not self.value:
+            return self.line
         else:
             toks = []
-            for e in (self.options, self.keytype, self.base64, self.comment):
-                if e:
-                    toks.append(e)
-
-            return(' '.join(toks))
+            if 'options' in self.components:
+                toks.append(self.components['options'])
+            if 'keytype' in self.components:
+                toks.append(self.components['keytype'])
+            if 'base64' in self.components:
+                toks.append(self.components['base64'])
+            if 'comment' in self.components:
+                toks.append(self.components['comment'])
+            if not toks:
+                return ''
+            return ' '.join(toks)
 
 
 def update_authorized_keys(fname, keys):
-    # keys is a list of AuthKeyEntries
-    # key_prefix is the prefix (options) to prepend
+    lines = []
     try:
-        fp = open(fname, "r")
-        lines = fp.readlines()  # lines have carriage return
-        fp.close()
-    except IOError:
+        if os.path.isfile(fname):
+            lines = util.load_file(fname).splitlines()
+    except (IOError, OSError):
+        LOG.exception("Error reading lines from %s", fname)
         lines = []
 
-    ka_stats = {}  # keys_added status
-    for k in keys:
-        ka_stats[k] = False
-
-    to_add = []
-    for key in keys:
-        to_add.append(key)
-
+    to_add = list(keys)
     for i in range(0, len(lines)):
         ent = AuthKeyEntry(lines[i])
+        if not ent.value:
+            continue
+        # Replace those with the same base64
         for k in keys:
-            if k.base64 == ent.base64 and not k.is_comment:
+            if not k.value:
+                continue
+            if k.get('base64') == ent.get('base64'):
+                # Replace it with our better one
                 ent = k
-                try:
-                    to_add.remove(k)
-                except ValueError:
-                    pass
+                # Don't add it later
+                to_add.remove(k)
         lines[i] = str(ent)
 
-    # now append any entries we did not match above
+    # Now append any entries we did not match above
     for key in to_add:
         lines.append(str(key))
 
-    if len(lines) == 0:
-        return("")
-    else:
-        return('\n'.join(lines) + "\n")
+    # Ensure it ends with a newline
+    lines.append('')
+    return '\n'.join(lines)
 
 
-def setup_user_keys(keys, user, key_prefix, log=None):
-    import pwd
-    saved_umask = os.umask(077)
-
+def setup_user_keys(keys, user, key_prefix, sshd_config_fn="/etc/ssh/sshd_config"):
     pwent = pwd.getpwnam(user)
 
-    ssh_dir = '%s/.ssh' % pwent.pw_dir
+    ssh_dir = os.path.join(pwent.pw_dir, '.ssh')
     if not os.path.exists(ssh_dir):
-        os.mkdir(ssh_dir)
-        os.chown(ssh_dir, pwent.pw_uid, pwent.pw_gid)
-
-    try:
-        ssh_cfg = parse_ssh_config()
-        akeys = ssh_cfg.get("AuthorizedKeysFile", "%h/.ssh/authorized_keys")
-        akeys = akeys.replace("%h", pwent.pw_dir)
-        akeys = akeys.replace("%u", user)
-        if not akeys.startswith('/'):
-            akeys = os.path.join(pwent.pw_dir, akeys)
-        authorized_keys = akeys
-    except Exception:
-        authorized_keys = '%s/.ssh/authorized_keys' % pwent.pw_dir
-        if log:
-            util.logexc(log)
+        util.ensure_dir(ssh_dir, mode=0700)
+        util.chownbyid(ssh_dir, pwent.pw_uid, pwent.pw_gid)
 
     key_entries = []
     for k in keys:
-        ke = AuthKeyEntry(k, def_opt=key_prefix)
-        key_entries.append(ke)
+        key_entries.append(AuthKeyEntry(k, def_opt=key_prefix))
 
-    content = update_authorized_keys(authorized_keys, key_entries)
-    util.write_file(authorized_keys, content, 0600)
+    with util.SeLinuxGuard(ssh_dir, recursive=True):
+        try:
+            """
+             AuthorizedKeysFile may contain tokens
+             of the form %T which are substituted during connection set-up.
+             The following tokens are defined: %% is replaced by a literal
+             '%', %h is replaced by the home directory of the user being
+             authenticated and %u is replaced by the username of that user.
+            """
+            ssh_cfg = parse_ssh_config(sshd_config_fn)
+            akeys = ssh_cfg.get("authorizedkeysfile", '')
+            akeys = akeys.strip()
+            if not akeys:
+                akeys = "%h/.ssh/authorized_keys"
+            akeys = akeys.replace("%h", pwent.pw_dir)
+            akeys = akeys.replace("%u", user)
+            akeys = akeys.replace("%%", '%')
+            if not akeys.startswith('/'):
+                akeys = os.path.join(pwent.pw_dir, akeys)
+            authorized_keys = akeys
+        except (IOError, OSError):
+            authorized_keys = os.path.join(ssh_dir, 'authorized_keys')
+            LOG.exception(("Failed extracting 'AuthorizedKeysFile' in ssh config"
+                            " from %s, using 'AuthorizedKeysFile' file %s instead."),
+                           sshd_config_fn, authorized_keys)
 
-    os.chown(authorized_keys, pwent.pw_uid, pwent.pw_gid)
-    util.restorecon_if_possible(ssh_dir, recursive=True)
-
-    os.umask(saved_umask)
+        content = update_authorized_keys(authorized_keys, key_entries)
+        util.ensure_dir(os.path.dirname(authorized_keys), mode=0700)
+        util.write_file(authorized_keys, content, mode=0600)
+        util.chownbyid(authorized_keys, pwent.pw_uid, pwent.pw_gid)
 
 
-def parse_ssh_config(fname="/etc/ssh/sshd_config"):
+def parse_ssh_config(fname):
+    """
+    The file contains keyword-argument pairs, one per line.
+    Lines starting with '#' and empty lines are interpreted as comments.
+    Note: keywords are case-insensitive and arguments are case-sensitive
+    """
     ret = {}
-    fp = open(fname)
-    for l in fp.readlines():
-        l = l.strip()
-        if not l or l.startswith("#"):
+    if not os.path.isfile(fname):
+        return ret
+    for line in util.load_file(fname).splitlines():
+        line = line.strip()
+        if not line or line.startswith("#"):
             continue
-        key, val = l.split(None, 1)
-        ret[key] = val
-    fp.close()
-    return(ret)
+        (key, val) = line.split(None, 1)
+        key = key.strip().lower()
+        if key:
+            ret[key] = val
+    return ret

From 7d9cf3b2ff62b86b7f360f9c68ab366381cc8897 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:36:18 -0700
Subject: [PATCH 046/434] Remove unused imports and reduce lines needed + add
 copyright.

---
 cloudinit/templater.py | 32 +++++++++++++++++++++++---------
 1 file changed, 23 insertions(+), 9 deletions(-)

diff --git a/cloudinit/templater.py b/cloudinit/templater.py
index 5a3563a2..04cc5a6f 100644
--- a/cloudinit/templater.py
+++ b/cloudinit/templater.py
@@ -1,18 +1,32 @@
-import os
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
 from Cheetah.Template import Template
 
-from cloudinit import settings
 from cloudinit import util
 
 
-def render_to_file(template, outfile, searchList):
-    fn = template
-    (base, ext) = os.path.splitext(fn)
-    if ext != ".tmpl":
-        fn = "%s.tmpl" % (fn)
-    fn = os.path.join(settings.TEMPLATE_DIR, fn)
-    contents = Template(file=fn, searchList=[searchList]).respond()
+def render_to_file(template_fn, outfile, searchList):
+    contents = Template(file=template_fn, searchList=[searchList]).respond()
     util.write_file(outfile, contents)
 
 

From 36d36a756abd8c952ab4b3a163efcfc6c53276ff Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:37:10 -0700
Subject: [PATCH 047/434] Move cmdline functions here. Cleanup exception
 trapping. Fixup copyright.

---
 cloudinit/util.py | 113 ++++++++++++++++++++++++++++++++++++----------
 1 file changed, 88 insertions(+), 25 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 265a3a97..5930ff3f 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -1,10 +1,12 @@
 # vi: ts=4 expandtab
 #
-#    Copyright (C) 2009-2010 Canonical Ltd.
+#    Copyright (C) 2012 Canonical Ltd.
 #    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Hafliger <juerg.haefliger@hp.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -21,13 +23,16 @@
 from StringIO import StringIO
 
 import contextlib
+import glob
 import grp
 import gzip
 import os
 import platform
 import pwd
 import shutil
+import socket
 import subprocess
+import types
 import urlparse
 
 import yaml
@@ -96,7 +101,7 @@ class ProcessExecutionError(IOError):
         self.reason = reason
 
 
-class _SeLinuxGuard(object):
+class SeLinuxGuard(object):
     def __init__(self, path, recursive=False):
         self.path = path
         self.recursive = recursive
@@ -149,6 +154,18 @@ def decomp_str(data):
         return data
 
 
+def find_modules(root_dir):
+    entries = dict()
+    for fname in glob.glob(os.path.join(root_dir, "*.py")):
+        if not os.path.isfile(fname):
+            continue
+        modname = os.path.basename(fname)[0:-3]
+        modname = modname.strip()
+        if modname and modname.find(".") == -1:
+            entries[fname] = modname
+    return entries
+
+
 def is_ipv4(instr):
     """ determine if input string is a ipv4 address. return boolean"""
     toks = instr.split('.')
@@ -163,15 +180,16 @@ def is_ipv4(instr):
     return (len(toks) == 4)
 
 
-def get_base_cfg(cfgfile, cfg_builtin=None, parsed_cfgs=None):
-    if parsed_cfgs and cfgfile in parsed_cfgs:
-        return parsed_cfgs[cfgfile]
-
+def get_base_cfg(cfgfile, cfg_builtin=None):
     syscfg = read_conf_with_confd(cfgfile)
+
     kern_contents = read_cc_from_cmdline()
     kerncfg = {}
     if kern_contents:
-        kerncfg = yaml.load(kern_contents)
+        try:
+            kerncfg = yaml.load(kern_contents)
+        except:
+            pass
 
     # kernel parameters override system config
     combined = mergedict(kerncfg, syscfg)
@@ -180,9 +198,6 @@ def get_base_cfg(cfgfile, cfg_builtin=None, parsed_cfgs=None):
     else:
         fin = combined
 
-    # Cache it?
-    if parsed_cfgs:
-        parsed_cfgs[cfgfile] = fin
     return fin
 
 
@@ -223,7 +238,7 @@ def get_cfg_option_list_or_str(yobj, key, default=None):
         return default
     if yobj[key] is None:
         return []
-    if isinstance(yobj[key], list):
+    if isinstance(yobj[key], (list)):
         return yobj[key]
     return [yobj[key]]
 
@@ -239,6 +254,15 @@ def get_cfg_by_path(yobj, keyp, default=None):
     return cur
 
 
+def obj_name(obj):
+    if isinstance(obj, (types.TypeType,
+                        types.ModuleType,
+                        types.FunctionType,
+                        types.LambdaType)):
+        return str(obj.__name__)
+    return obj_name(obj.__class__)
+
+
 def mergedict(src, cand):
     """
     Merge values from C{cand} into C{src}. If C{src} has a key C{cand} will
@@ -258,6 +282,15 @@ def mergedict(src, cand):
     return src
 
 
+@contextlib.contextmanager
+def umask(n_msk):
+    old = os.umask(n_msk)
+    try:
+        yield old
+    finally:
+        os.umask(old)
+
+
 @contextlib.contextmanager
 def tempdir(**kwargs):
     # This seems like it was only added in python 3.2
@@ -379,13 +412,15 @@ def read_conf_with_confd(cfgfile):
     if "conf_d" in cfg:
         if cfg['conf_d'] is not None:
             confd = cfg['conf_d']
-            if not isinstance(confd, str):
-                raise RuntimeError("cfgfile %s contains 'conf_d' "
-                                "with non-string" % cfgfile)
+            if not isinstance(confd, (str)):
+                raise RuntimeError(("Config file %s contains 'conf_d' "
+                                    "with non-string") % (cfgfile))
+            else:
+                confd = confd.strip()
     elif os.path.isdir("%s.d" % cfgfile):
         confd = "%s.d" % cfgfile
 
-    if not confd:
+    if not confd or not os.path.isdir(confd):
         return cfg
 
     return mergedict(read_conf_d(confd), cfg)
@@ -479,6 +514,32 @@ def get_fqdn_from_hosts(hostname, filename="/etc/hosts"):
     return fqdn
 
 
+def get_cmdline_url(names=None, starts=None, cmdline=None):
+    if cmdline is None:
+        cmdline = get_cmdline()
+    if not names:
+        names = ('cloud-config-url', 'url')
+    if not starts:
+        starts = "#cloud-config"
+
+    data = keyval_str_to_dict(cmdline)
+    url = None
+    key = None
+    for key in names:
+        if key in data:
+            url = data[key]
+            break
+
+    if not url:
+        return (None, None, None)
+
+    (contents, sc) = uhelp.readurl(url)
+    if contents.startswith(starts) and uhelp.ok_http_code(sc):
+        return (key, url, contents)
+
+    return (key, url, None)
+
+
 def is_resolvable(name):
     """ determine if a url is resolvable, return a boolean """
     try:
@@ -488,6 +549,11 @@ def is_resolvable(name):
         return False
 
 
+def get_hostname():
+    hostname = socket.gethostname()
+    return hostname
+
+
 def is_resolvable_url(url):
     """ determine if this url is resolvable (existing or ip) """
     return (is_resolvable(urlparse.urlparse(url).hostname))
@@ -634,7 +700,7 @@ def write_file(filename, content, mode=0644, omode="wb"):
     ensure_dir(os.path.dirname(filename))
     LOG.debug("Writing to %s - %s (perms=%s) %s bytes", filename, omode, mode, len(content))
     with open(filename, omode) as fh:
-        with _SeLinuxGuard(filename):
+        with SeLinuxGuard(filename):
             fh.write(content)
             fh.flush()
             if mode is not None:
@@ -711,11 +777,8 @@ def is_container():
             cmd = [helper]
             (stdout, stderr) = subp(cmd, allowed_rc=[0])
             return True
-        except IOError as e:
+        except (IOError, OSError):
             pass
-            # Is this really needed?
-            # if e.errno != errno.ENOENT:
-            #     raise
 
     # this code is largely from the logic in
     # ubuntu's /etc/init/container-detect.conf
@@ -727,7 +790,7 @@ def is_container():
             return True
         if "LIBVIRT_LXC_UUID" in pid1env:
             return True
-    except IOError as e:
+    except (IOError, OSError):
         pass
 
     # Detect OpenVZ containers
@@ -742,7 +805,7 @@ def is_container():
                 (_key, val) = line.strip().split(":", 1)
                 if val != "0":
                     return True
-    except IOError as e:
+    except (IOError, OSError):
         pass
 
     return False
@@ -759,9 +822,9 @@ def get_proc_env(pid):
             if tok == "":
                 continue
             (name, val) = tok.split("=", 1)
-            if not name:
+            if name:
                 env[name] = val
-    except IOError:
+    except (IOError, OSError):
         pass
     return env
 

From 4bb7bb370675fce24939a4e489347a5d67fd08c6 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:37:40 -0700
Subject: [PATCH 048/434] Add copyright

---
 cloudinit/url_helper.py | 23 +++++++++++++++++++++++
 1 file changed, 23 insertions(+)

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index ed78c92e..6fa3e44b 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -1,3 +1,26 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+
 import errno
 import time
 import urllib

From a72b2cf0b5df98c6a92772edcd14c8f87541cb4a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:38:19 -0700
Subject: [PATCH 049/434] Initial cleanups

---
 cloudinit/sources/__init__.py | 188 +++++++++++++++++-----------------
 1 file changed, 93 insertions(+), 95 deletions(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 9a9c1316..05c8bfad 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -1,10 +1,12 @@
 # vi: ts=4 expandtab
 #
-#    Copyright (C) 2009-2010 Canonical Ltd.
+#    Copyright (C) 2012 Canonical Ltd.
 #    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Hafliger <juerg.haefliger@hp.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -18,78 +20,78 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-from cloudinit import user_data as ud
+from cloudinit import importer
+from cloudinit import log as logging
 from cloudinit import util
 
-import socket
-
 DEP_FILESYSTEM = "FILESYSTEM"
 DEP_NETWORK = "NETWORK"
+DS_PREFIX = 'DataSource'
+LOG = logging.getLogger(__name__)
+
 
 class DataSourceNotFoundException(Exception):
     pass
 
 
-class DataSource:
-    userdata = None
-    metadata = None
-    userdata_raw = None
-    cfgname = ""
-    # system config (passed in from cloudinit,
-    # cloud-config before input from the DataSource)
-    sys_cfg = {}
-    # datasource config, the cloud-config['datasource']['__name__']
-    ds_cfg = {}  # datasource config
-
-    def __init__(self, sys_cfg=None):
-        if not self.cfgname:
-            name = str(self.__class__).split(".")[-1]
-            if name.startswith("DataSource"):
-                name = name[len("DataSource"):]
-            self.cfgname = name
+class DataSource(object):
+    def __init__(self, ud_proc, cfg):
+        name = util.obj_name(self)
+        if name.startswith(DS_PREFIX):
+            name = name[DS_PREFIX:]
+        self.cfgname = name
         if sys_cfg:
             self.sys_cfg = sys_cfg
-
+        else:
+            self.sys_cfg = {}
+        self.ud_proc = ud_proc
+        self.userdata = None
+        self.metadata = None
+        self.userdata_raw = None
         self.ds_cfg = util.get_cfg_by_path(self.sys_cfg,
                           ("datasource", self.cfgname), self.ds_cfg)
 
     def get_userdata(self):
-        if self.userdata == None:
-            self.userdata = ud.preprocess_userdata(self.userdata_raw)
+        if self.userdata is None:
+            raw_data = self.get_userdata_raw()
+            self.userdata = self.ud_proc.process(raw_data)
         return self.userdata
 
     def get_userdata_raw(self):
-        return(self.userdata_raw)
+        return self.userdata_raw
 
     # the data sources' config_obj is a cloud-config formated
     # object that came to it from ways other than cloud-config
     # because cloud-config content would be handled elsewhere
     def get_config_obj(self):
-        return({})
+        return {}
 
     def get_public_ssh_keys(self):
         keys = []
-        if 'public-keys' not in self.metadata:
-            return([])
 
-        if isinstance(self.metadata['public-keys'], str):
-            return(str(self.metadata['public-keys']).splitlines())
+        if not self.metadata or 'public-keys' not in self.metadata:
+            return keys
 
-        if isinstance(self.metadata['public-keys'], list):
-            return(self.metadata['public-keys'])
+        if isinstance(self.metadata['public-keys'], (str)):
+            return str(self.metadata['public-keys']).splitlines()
 
-        for _keyname, klist in self.metadata['public-keys'].items():
-            # lp:506332 uec metadata service responds with
-            # data that makes boto populate a string for 'klist' rather
-            # than a list.
-            if isinstance(klist, str):
-                klist = [klist]
-            for pkey in klist:
-                # there is an empty string at the end of the keylist, trim it
-                if pkey:
-                    keys.append(pkey)
+        if isinstance(self.metadata['public-keys'], (list, set)):
+            return list(self.metadata['public-keys'])
 
-        return(keys)
+        if isinstance(self.metadata['public-keys'], (dict)):
+            for _keyname, klist in self.metadata['public-keys'].items():
+                # lp:506332 uec metadata service responds with
+                # data that makes boto populate a string for 'klist' rather
+                # than a list.
+                if isinstance(klist, (str)):
+                    klist = [klist]
+                if isinstance(klist, (list)):
+                    for pkey in klist:
+                        # there is an empty string at the end of the keylist, trim it
+                        if pkey:
+                            keys.append(pkey)
+
+        return keys
 
     def device_name_to_device(self, _name):
         # translate a 'name' to a device
@@ -97,48 +99,43 @@ class DataSource:
         # to consult metadata service, that has
         #  ephemeral0: sdb
         # and return 'sdb' for input 'ephemeral0'
-        return(None)
+        return None
 
     def get_locale(self):
-        return('en_US.UTF-8')
+        return 'en_US.UTF-8'
 
     def get_local_mirror(self):
         return None
 
     def get_instance_id(self):
-        if 'instance-id' not in self.metadata:
+        if not self.metadata or 'instance-id' not in self.metadata:
             return "iid-datasource"
-        return(self.metadata['instance-id'])
+        return str(self.metadata['instance-id'])
 
     def get_hostname(self, fqdn=False):
         defdomain = "localdomain"
         defhost = "localhost"
-
         domain = defdomain
-        if not 'local-hostname' in self.metadata:
 
+        if not self.metadata or not 'local-hostname' in self.metadata:
             # this is somewhat questionable really.
             # the cloud datasource was asked for a hostname
             # and didn't have one. raising error might be more appropriate
             # but instead, basically look up the existing hostname
             toks = []
-
-            hostname = socket.gethostname()
-
+            hostname = util.get_hostname()
             fqdn = util.get_fqdn_from_hosts(hostname)
-
             if fqdn and fqdn.find(".") > 0:
                 toks = str(fqdn).split(".")
             elif hostname:
                 toks = [hostname, defdomain]
             else:
                 toks = [defhost, defdomain]
-
         else:
             # if there is an ipv4 address in 'local-hostname', then
             # make up a hostname (LP: #475354) in format ip-xx.xx.xx.xx
             lhost = self.metadata['local-hostname']
-            if is_ipv4(lhost):
+            if util.is_ipv4(lhost):
                 toks = "ip-%s" % lhost.replace(".", "-")
             else:
                 toks = lhost.split(".")
@@ -155,22 +152,22 @@ class DataSource:
             return hostname
 
 
-def find_source(cfg, ds_deps):
-    cfglist = cfg.get('datasource_list') or []
-    dslist = list_sources(cfglist, ds_deps)
-    dsnames = [f.__name__ for f in dslist]
-    
-    LOG.debug("Searching for data source in %s", dsnames)
-    for cls in dslist:
-        ds = cls.__name__
+def find_source(cfg, ds_deps, cfg_list, pkg_list, **kwargs):
+    ds_list = list_sources(cfg_list, ds_deps, pkg_list)
+    ds_names = [util.obj_name(f) for f in ds_list]
+    ds_args = dict(kwargs)
+    ds_args['cfg'] = cfg
+    LOG.info("Searching for data source in: %s", ds_names)
+    for cls in ds_list:
+        ds = util.obj_name(cls)
         try:
-            s = cls(sys_cfg=cfg)
+            s = cls(**ds_args)
             if s.get_data():
                 return (s, ds)
         except Exception as e:
-            LOG.exception("Getting data from %s raised %s", ds, e)
+            LOG.exception("Getting data from %s failed", ds)
 
-    msg = "Did not find any data source, searched classes: %s" % dsnames
+    msg = "Did not find any data source, searched classes: %s" % (ds_names)
     raise DataSourceNotFoundException(msg)
 
 
@@ -178,31 +175,33 @@ def find_source(cfg, ds_deps):
 # iterate through cfg_list, loading "DataSourceCollections" modules
 # and calling their "get_datasource_list".
 # return an ordered list of classes that match
-#
-# - modules must be named "DataSource<item>", where 'item' is an entry
-#   in cfg_list
-# - if pkglist is given, it will iterate try loading from that package
-#   ie, pkglist=[ "foo", "" ]
-#     will first try to load foo.DataSource<item>
-#     then DataSource<item>
-def list_sources(cfg_list, depends, pkglist=None):
-    if pkglist is None:
-        pkglist = []
-    retlist = []
+def list_sources(cfg_list, depends, pkg_list):
+    src_list = []
+    LOG.info("Looking for for data source in: %s, %s that match %s", cfg_list, pkg_list, depends)
     for ds_coll in cfg_list:
-        for pkg in pkglist:
+        ds_name = str(ds_coll)
+        if not ds_name.startswith(DS_PREFIX):
+            ds_name = '%s%s' % (DS_PREFIX, ds_name)
+        for pkg in pkg_list:
+            pkg_name = []
             if pkg:
-                pkg = "%s." % pkg
-            try:
-                mod = __import__("%sDataSource%s" % (pkg, ds_coll))
-                if pkg:
-                    mod = getattr(mod, "DataSource%s" % ds_coll)
-                lister = getattr(mod, "get_datasource_list")
-                retlist.extend(lister(depends))
-                break
-            except:
-                raise
-    return(retlist)
+                pkg_name.append(str(pkg))
+            pkg_name.append(ds_name)
+            mod_name = ".".join(pkg_name)
+            mod = importer.import_module(mod_name)
+            if pkg:
+                mod = getattr(mod, ds_name, None)
+            if not mod:
+                continue
+            lister = getattr(mod, "get_datasource_list", None)
+            if not lister:
+                continue
+            cls_matches = lister(depends)
+            if not cls_matches:
+                continue
+            src_list.extend(cls_matches)
+            break
+    return src_list
 
 
 # depends is a list of dependencies (DEP_FILESYSTEM)
@@ -213,10 +212,9 @@ def list_sources(cfg_list, depends, pkglist=None):
 # it returns a list of 'class' that matched these deps exactly
 # it is a helper function for DataSourceCollections
 def list_from_depends(depends, dslist):
-    retlist = []
+    ret_list = []
     depset = set(depends)
-    for elem in dslist:
-        (cls, deps) = elem
+    for (cls, deps) in dslist:
         if depset == set(deps):
-            retlist.append(cls)
-    return(retlist)
+            ret_list.append(cls)
+    return ret_list

From 42b37f1029d2d03f3cc9639e0d97806bedc05031 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 9 Jun 2012 12:38:32 -0700
Subject: [PATCH 050/434] Start adding a system section.

---
 config/cloud.cfg | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/config/cloud.cfg b/config/cloud.cfg
index 3688f88d..33feec48 100644
--- a/config/cloud.cfg
+++ b/config/cloud.cfg
@@ -1,7 +1,6 @@
 user: ubuntu
 disable_root: 1
 preserve_hostname: False
-# datasource_list: ["NoCloud", "ConfigDrive", "OVF", "MAAS", "Ec2", "CloudStack"]
 
 cloud_init_modules:
  - bootcmd
@@ -40,3 +39,10 @@ cloud_final_modules:
  - keys-to-console
  - phone-home
  - final-message
+
+system_info:
+   paths:
+      cloud_dir: /var/lib/cloud/
+      templates_dir: /etc/cloud/templates/
+      upstart_dir: /etc/init/
+   distro: ubuntu

From d657c31976becf38b049396bf82c1aa596e94ad7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:09:10 -0700
Subject: [PATCH 051/434] Not needed, this functionality can go in utils.

---
 cloudinit/mounting.py | 73 -------------------------------------------
 1 file changed, 73 deletions(-)
 delete mode 100644 cloudinit/mounting.py

diff --git a/cloudinit/mounting.py b/cloudinit/mounting.py
deleted file mode 100644
index b78cb5bd..00000000
--- a/cloudinit/mounting.py
+++ /dev/null
@@ -1,73 +0,0 @@
-# vi: ts=4 expandtab
-#
-#    Copyright (C) 2012 Canonical Ltd.
-#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
-#    Copyright (C) 2012 Yahoo! Inc.
-#
-#    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
-#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
-#
-#    This program is free software: you can redistribute it and/or modify
-#    it under the terms of the GNU General Public License version 3, as
-#    published by the Free Software Foundation.
-#
-#    This program is distributed in the hope that it will be useful,
-#    but WITHOUT ANY WARRANTY; without even the implied warranty of
-#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-#    GNU General Public License for more details.
-#
-#    You should have received a copy of the GNU General Public License
-#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-import contextlib
-
-from cloudinit import util
-
-
-class MountFailedError(Exception):
-    pass
-
-
-@contextlib.contextmanager
-def unmounter(umount):
-    try:
-        yield umount
-    finally:
-        if umount:
-            sh.subp(["umount", '-l', umount])
-
-
-def mount_callback_umount(device, callback, data=None):
-    """
-    mount the device, call method 'callback' passing the directory
-    in which it was mounted, then unmount.  Return whatever 'callback'
-    returned.  If data != None, also pass data to callback.
-    """
-
-    # go through mounts to see if it was already mounted
-    mounts = sh.load_file("/proc/mounts").splitlines()
-    mounted = {}
-    for mpline in mounts:
-        (dev, mp, fstype, _opts, _freq, _passno) = mpline.split()
-        mp = mp.replace("\\040", " ")
-        mounted[dev] = (dev, fstype, mp, False)
-
-    with util.tempdir() as tmpd:
-        umount = False
-        if device in mounted:
-            mountpoint = "%s/" % mounted[device][2]
-        else:
-            try:
-                mountcmd = ["mount", "-o", "ro", device, tmpd]
-                util.subp(mountcmd)
-                umount = tmpd
-            except IOError as exc:
-                raise MountFailedError("%s" % (exc))
-            mountpoint = "%s/" % tmpd
-        with unmounter(umount):
-            if data is None:
-                ret = callback(mountpoint)
-            else:
-                ret = callback(mountpoint, data)
-            return ret

From 88e5552813e6c39031d5ded9e309edb8a04a494e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:09:24 -0700
Subject: [PATCH 052/434] Removed, not needed.

---
 pylintrc | 42 ------------------------------------------
 1 file changed, 42 deletions(-)
 delete mode 100644 pylintrc

diff --git a/pylintrc b/pylintrc
deleted file mode 100644
index a7447a19..00000000
--- a/pylintrc
+++ /dev/null
@@ -1,42 +0,0 @@
-# The format of this file isn't really documented; just use --generate-rcfile
-
-[Master]
-
-[Messages Control]
-
-# http://pylint-messages.wikidot.com/all-codes
-# NOTE(justinsb): We might want to have a 2nd strict pylintrc in future
-# C0111: Don't require docstrings on every method
-# R0912: Too many branches (huh)
-# R0914: Too many local variables is odd.
-# W0142: *args and **kwargs are fine.
-# W0511: TODOs in code comments are fine.
-# W0613: Unused argument '??' should be ok (they are useful sometimes to know intention of variable)
-# W0622: Redefining id is fine.
-disable=C0111,W0142,W0622,C0301,R0902,R0201,R0914,W0613,R0912,R0801
-
-[Basic]
-
-# Variable names can be 1 to 31 characters long, with lowercase and underscores
-variable-rgx=[a-z_][a-z0-9_]{0,30}$
-
-# Argument names can be 2 to 31 characters long, with lowercase and underscores
-argument-rgx=[a-z_][a-z0-9_]{1,30}$
-
-# Method names should be at least 3 characters long
-# and be lowercased with underscores
-method-rgx=([a-z_][a-z0-9_]{2,50}|setUp|tearDown)$
-
-# Don't require docstrings on tests.
-no-docstring-rgx=((__.*__)|([tT]est.*)|setUp|tearDown)$
-
-[Design]
-
-max-public-methods=100
-min-public-methods=0
-max-args=6
-
-[Variables]
-
-# List of additional names supposed to be defined in builtins. Remember that
-# you should avoid to define new builtins when possible.

From 460ee0a506a9cd1082b17b7370c7db5d4eae2f39 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:09:38 -0700
Subject: [PATCH 053/434] All main stage helpers go here, i.e. semaphores,
 handler registries, runners...

---
 cloudinit/helpers.py | 204 +++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 204 insertions(+)
 create mode 100644 cloudinit/helpers.py

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
new file mode 100644
index 00000000..cdb8a07e
--- /dev/null
+++ b/cloudinit/helpers.py
@@ -0,0 +1,204 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+from time import time
+
+import contextlib
+import os
+
+from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS, PER_ONCE)
+
+from cloudinit import log as logging
+from cloudinit import util
+
+from cloudinit.user_data import boot_hook as bh_part
+from cloudinit.user_data import cloud_config as cc_part
+from cloudinit.user_data import shell_script as ss_part
+from cloudinit.user_data import upstart_job as up_part
+
+LOG = logging.getLogger(__name__)
+
+
+class DummySemaphores(object):
+    def __init__(self):
+        pass
+
+    @contextlib.contextmanager
+    def lock(self, _name, _freq, _clear_on_fail):
+        yield True
+
+    def has_run(self, _name, _freq):
+        return False
+
+
+class Semaphores(object):
+    def __init__(self, sem_path):
+        self.sem_path = sem_path
+
+    @contextlib.contextmanager
+    def lock(self, name, freq, clear_on_fail):
+        try:
+            yield self._acquire(name, freq)
+        except:
+            if clear_on_fail:
+                self.clear(name, freq)
+            raise
+
+    def clear(self, name, freq):
+        sem_file = self._get_path(name, freq)
+        try:
+            util.del_file(sem_file)
+        except (IOError, OSError):
+            return False
+        return True
+
+    def _acquire(self, name, freq):
+        if self.has_run(name, freq):
+            return None
+        # This is a race condition since nothing atomic is happening
+        # here, but this should be ok due to the nature of when
+        # and where cloud-init runs... (file writing is not a lock..)
+        sem_file = self._get_path(name, freq)
+        contents = "%s: %s\n" % (os.getpid(), time())
+        try:
+            util.write_file(sem_file, contents)
+        except (IOError, OSError):
+            return None
+        return sem_file
+
+    def has_run(self, name, freq):
+        if freq == PER_ALWAYS:
+            return False
+        sem_file = self._get_path(name, freq)
+        if os.path.exists(sem_file):
+            return True
+        return False
+
+    def _get_path(self, name, freq):
+        sem_path = self.sem_path
+        if not freq or freq == PER_INSTANCE:
+            return os.path.join(sem_path, name)
+        else:
+            return os.path.join(sem_path, "%s.%s" % (name, freq))
+
+
+class Runners(object):
+    def __init__(self, paths):
+        self.paths = paths
+        self.sems = {}
+
+    def _get_sem(self, freq):
+        if freq == PER_ALWAYS or not freq:
+            return None
+        sem_path = None
+        if freq == PER_INSTANCE:
+            sem_path = self.paths.get_ipath("sem")
+        elif freq == PER_ONCE:
+            sem_path = self.paths.get_cpath("sem")
+        if not sem_path:
+            return None
+        if sem_path not in self.sems:
+            self.sems[sem_path] = Semaphores(sem_path)
+        return self.sems[sem_path]
+
+    def run(self, name, functor, args, freq=None, clear_on_fail=False):
+        sem = self._get_sem(freq)
+        if not sem:
+            sem = DummySemaphores()
+        if not args:
+            args = []
+        if sem.has_run(name, freq):
+            LOG.info("%s already ran (freq=%s)", name, freq)
+            return None
+        with sem.lock(name, freq, clear_on_fail) as lk:
+            if not lk:
+                raise RuntimeError("Failed to acquire lock on %s" % name)
+            else:
+                LOG.debug("Running %s with args %s using lock %s",
+                          functor, args, lk)
+                return functor(*args)
+
+
+class ContentHandlers(object):
+
+    def __init__(self, paths):
+        self.paths = paths
+        self.registered = {}
+
+    def __contains__(self, item):
+        return self.is_registered(item)
+
+    def __getitem__(self, key):
+        return self._get_handler(key)
+
+    def is_registered(self, content_type):
+        return content_type in self.registered
+
+    def register(self, mod):
+        types = set()
+        for t in mod.list_types():
+            self.registered[t] = mod
+            types.add(t)
+        return types
+
+    def _get_handler(self, content_type):
+        return self.registered[content_type]
+
+    def items(self):
+        return self.registered.items()
+
+    def iteritems(self):
+        return self.registered.iteritems()
+
+    def _get_default_handlers(self):
+        def_handlers = []
+
+        cc_path = self.paths.get_ipath("cloud_config")
+        if cc_path:
+            cc_h = cc_part.CloudConfigPartHandler(cc_path)
+            def_handlers.append(cc_h)
+
+        sc_path = self.paths.get_ipath_cur('scripts')
+        if sc_path:
+            ss_h = ss_part.ShellScriptPartHandler(sc_path)
+            def_handlers.append(ss_h)
+
+        bh_path = self.paths.get_ipath("boothooks")
+        if bh_path:
+            bh_h = bh_part.BootHookPartHandler(bh_path)
+            def_handlers.append(bh_h)
+
+        upstart_pth = self.paths.upstart_conf_d
+        if upstart_pth:
+            up_h = up_part.UpstartJobPartHandler(upstart_pth)
+            def_handlers.append(up_h)
+
+        return def_handlers
+
+    def register_defaults(self):
+        registered = set()
+        for mod in self._get_default_handlers():
+            for t in mod.list_types():
+                if not self.is_registered(t):
+                    self.registered[t] = mod
+                    registered.add(t)
+        return registered

From d928c8ed16bbd5170d1cc79d7304fd558284f3fc Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:11:46 -0700
Subject: [PATCH 054/434] Move paths to here, since it also qualifies.

---
 cloudinit/helpers.py | 63 ++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 63 insertions(+)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index cdb8a07e..0bd13c78 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -202,3 +202,66 @@ class ContentHandlers(object):
                     self.registered[t] = mod
                     registered.add(t)
         return registered
+
+
+class Paths(object):
+    def __init__(self, sys_info):
+        self.cloud_dir = sys_info.get('cloud_dir', '/var/lib/cloud')
+        self.instance_link = os.path.join(self.cloud_dir, 'instance')
+        self.boot_finished = os.path.join(self.instance_link, "boot-finished")
+        self.upstart_conf_d = sys_info.get('upstart_dir')
+        template_dir = sys_info.get('templates_dir', '/etc/cloud/templates/')
+        self.template_tpl = os.path.join(template_dir, '%s.tmpl')
+        self.seed_dir = os.path.join(self.cloud_dir, 'seed')
+        self.lookups = {
+           "handlers": "handlers",
+           "scripts": "scripts",
+           "sem": "sem",
+           "boothooks": "boothooks",
+           "userdata_raw": "user-data.txt",
+           "userdata": "user-data.txt.i",
+           "obj_pkl": "obj.pkl",
+           "cloud_config": "cloud-config.txt",
+           "data": "data",
+        }
+        # Set when a datasource becomes active
+        self.datasource = None
+
+    # get_ipath_cur: get the current instance path for an item
+    def get_ipath_cur(self, name=None):
+        ipath = self.instance_link
+        add_on = self.lookups.get(name)
+        if add_on:
+            ipath = os.path.join(ipath, add_on)
+        return ipath
+
+    # get_cpath : get the "clouddir" (/var/lib/cloud/<name>)
+    # for a name in dirmap
+    def get_cpath(self, name=None):
+        cpath = self.cloud_dir
+        add_on = self.lookups.get(name)
+        if add_on:
+            cpath = os.path.join(cpath, add_on)
+        return cpath
+
+    def _get_ipath(self, name=None):
+        if not self.datasource:
+            return None
+        iid = self.datasource.get_instance_id()
+        if iid is None:
+            return None
+        ipath = os.path.join(self.cloud_dir, 'instances', iid)
+        add_on = self.lookups.get(name)
+        if add_on:
+            ipath = os.path.join(ipath, add_on)
+        return ipath
+
+    # (/var/lib/cloud/instances/<instance>/<name>)
+    def get_ipath(self, name=None):
+        ipath = self._get_ipath(name)
+        if not ipath:
+            LOG.warn(("No per instance semaphores available, "
+                              "is there an datasource/iid set?"))
+            return None
+        else:
+            return ipath

From 16e8f85be5abb8d5f37035223b27b18b1c0e2bec Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:12:00 -0700
Subject: [PATCH 055/434] Add this file, which contains the main init stage,
 and the handlers stage (as separate objects).

---
 cloudinit/stages.py | 411 ++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 411 insertions(+)
 create mode 100644 cloudinit/stages.py

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
new file mode 100644
index 00000000..55ad143d
--- /dev/null
+++ b/cloudinit/stages.py
@@ -0,0 +1,411 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+import cPickle as pickle
+
+import copy
+import os
+import sys
+
+try:
+    from configobj import ConfigObj
+except ImportError:
+    ConfigObj = None
+
+from cloudinit.settings import (PER_INSTANCE)
+from cloudinit.settings import (OLD_CLOUD_CONFIG)
+
+from cloudinit import cloud
+from cloudinit import distros
+from cloudinit import handlers
+from cloudinit import helpers
+from cloudinit import importer
+from cloudinit import log as logging
+from cloudinit import sources
+from cloudinit import util
+
+from cloudinit import user_data as ud
+
+LOG = logging.getLogger(__name__)
+
+
+class Init(object):
+    def __init__(self, ds_deps=None):
+        self.datasource = None
+        if ds_deps:
+            self.ds_deps = ds_deps
+        else:
+            self.ds_deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
+        # Created on first use
+        self.cached_cfg = None
+        self.cached_distro = None
+        self.cached_paths = None
+
+    def _read_cfg_old(self):
+        # Support reading the old ConfigObj format file and merging
+        # it into the yaml dictionary
+        if not ConfigObj:
+            return {}
+        old_cfg = ConfigObj(OLD_CLOUD_CONFIG)
+        return dict(old_cfg)
+
+    @property
+    def cfg(self):
+        if self.cached_cfg is None:
+            self.cached_cfg = self._read_cfg()
+        return self.cached_cfg
+
+    @property
+    def paths(self):
+        if not self.cached_paths:
+            sys_info = self.cfg.get('system_info', {})
+            self.cached_paths = helpers.Paths(copy.deepcopy(sys_info),
+                                          self.datasource)
+        return self.cached_paths
+
+    def _initial_subdirs(self):
+        c_dir = self.paths.cloud_dir
+        initial_dirs = [
+            os.path.join(c_dir, 'scripts'),
+            os.path.join(c_dir, 'scripts', 'per-instance'),
+            os.path.join(c_dir, 'scripts', 'per-once'),
+            os.path.join(c_dir, 'scripts', 'per-boot'),
+            os.path.join(c_dir, 'seed'),
+            os.path.join(c_dir, 'instances'),
+            os.path.join(c_dir, 'handlers'),
+            os.path.join(c_dir, 'sem'),
+            os.path.join(c_dir, 'data'),
+        ]
+        return initial_dirs
+
+    def purge_cache(self, rmcur=True):
+        rmlist = []
+        rmlist.append(self.paths.boot_finished)
+        if rmcur:
+            rmlist.append(self.paths.instance_link)
+        for f in rmlist:
+            util.del_file(f)
+        return len(rmlist)
+
+    def initialize(self):
+        self._initialize_filesystem()
+
+    def _initialize_filesystem(self):
+        util.ensure_dirs(self._initial_subdirs())
+        log_file = util.get_cfg_option_str(self.cfg, 'def_log_file')
+        perms = util.get_cfg_option_str(self.cfg, 'syslog_fix_perms')
+        if log_file:
+            util.ensure_file(log_file)
+            if perms:
+                (u, g) = perms.split(':', 1)
+                if u == "-1" or u == "None":
+                    u = None
+                if g == "-1" or g == "None":
+                    g = None
+                util.chownbyname(log_file, u, g)
+
+    def _read_cfg(self):
+        # Deep copy so that
+        b_config = util.get_builtin_cfg()
+        try:
+            conf = util.get_base_cfg()
+        except Exception:
+            conf = b_config
+        return util.mergedict(conf, self._read_cfg_old())
+
+    def _restore_from_cache(self):
+        pickled_fn = self.paths.get_ipath_cur('obj_pkl')
+        try:
+            # we try to restore from a current link and static path
+            # by using the instance link, if purge_cache was called
+            # the file wont exist
+            return pickle.loads(util.load_file(pickled_fn))
+        except Exception as e:
+            LOG.exception(("Failed loading pickled datasource from"
+                           " %s due to: %s"), pickled_fn, e)
+            return None
+
+    def _write_to_cache(self):
+        pickled_fn = self.paths.get_ipath_cur("obj_pkl")
+        try:
+            contents = pickle.dumps(self.datasource)
+            util.write_file(pickled_fn, contents, mode=0400)
+        except Exception as e:
+            LOG.exception(("Failed pickling datasource to"
+                          " %s due to: %s"), pickled_fn, e)
+            return False
+
+    def _get_datasources(self):
+        # Any config provided???
+        pkg_list = self.cfg.get('datasource_pkg_list') or []
+        # Add the defaults at the end
+        for n in [util.obj_name(sources), '']:
+            if n not in pkg_list:
+                pkg_list.append(n)
+        cfg_list = self.cfg.get('datasource_list') or []
+        return (cfg_list, pkg_list)
+
+    def _get_data_source(self):
+        if self.datasource:
+            return self.datasource
+        ds = self._restore_from_cache()
+        if ds:
+            LOG.debug("Restored from cache datasource: %s" % ds)
+        else:
+            (cfg_list, pkg_list) = self._get_datasources()
+            # Deep copy so that handlers can not modify (which will
+            # affect handlers down the line...)
+            sys_cfg = copy.deepcopy(self.cfg)
+            ds_deps = copy.deepcopy(self.ds_deps)
+            distro = distros.fetch(sys_cfg,
+                                   cloud.Cloud(self.datasource,
+                                               self.paths, sys_cfg))
+            (ds, dsname) = sources.find_source(sys_cfg, distro, self.paths,
+                                               ds_deps, cfg_list, pkg_list)
+            LOG.debug("Loaded datasource %s - %s", dsname, ds)
+        self.datasource = ds
+        if self.cached_paths:
+            self.cached_paths.datasource = ds
+        return ds
+
+    def _reflect_cur_instance(self):
+        # Ensure we are hooked into the right symlink for the current instance
+        idir = self.paths.get_ipath()
+        util.del_file(self.paths.instance_link)
+        util.sym_link(idir, self.paths.instance_link)
+
+        # Ensures these dirs exist
+        dir_list = []
+        for d in ["handlers", "scripts", "sem"]:
+            dir_list.append(os.path.join(idir, d))
+        util.ensure_dirs(dir_list)
+
+        # Write out information on what is being used for the current instance
+        # and what may have been used for a previous instance...
+        dp = self.paths.get_cpath('data')
+
+        # Write what the datasource was and is..
+        ds = "%s: %s" % (util.obj_name(self.datasource), self.datasource)
+        previous_ds = ''
+        ds_fn = os.path.join(idir, 'datasource')
+        try:
+            previous_ds = util.load_file(ds_fn).strip()
+        except Exception:
+            pass
+        if not previous_ds:
+            # TODO: ?? is this right
+            previous_ds = ds
+        util.write_file(ds_fn, "%s\n" % ds)
+        util.write_file(os.path.join(dp, 'previous-datasource'),
+                        "%s\n" % (previous_ds))
+
+        # What the instance id was and is...
+        iid = self.datasource.get_instance_id()
+        previous_iid = ''
+        p_iid_fn = os.path.join(dp, 'previous-instance-id')
+        c_iid_fn = os.path.join(dp, 'instance-id')
+        try:
+            previous_iid = util.load_file(p_iid_fn).strip()
+        except Exception:
+            pass
+        if not previous_iid:
+            # TODO: ?? is this right
+            previous_iid = iid
+        util.write_file(c_iid_fn, "%s\n" % iid)
+        util.write_file(p_iid_fn, "%s\n" % previous_iid)
+
+    def fetch(self):
+        return self._get_data_source()
+
+    def instancify(self):
+        self._reflect_cur_instance()
+
+    def update(self):
+        self._write_to_cache()
+        self._store_userdata()
+
+    def _store_userdata(self):
+        raw_ud = "%s" % (self.datasource.get_userdata_raw())
+        util.write_file(self.paths.get_ipath('userdata_raw'), raw_ud, 0600)
+        processed_ud = "%s" % (self.datasource.get_userdata())
+        util.write_file(self.paths.get_ipath('userdata'), processed_ud, 0600)
+
+    def consume(self, frequency=PER_INSTANCE):
+        cdir = self.paths.get_cpath("handlers")
+        idir = self.paths.get_ipath("handlers")
+    
+        # Add the path to the plugins dir to the top of our list for import
+        # instance dir should be read before cloud-dir
+        sys.path.insert(0, cdir)
+        sys.path.insert(0, idir)
+
+        # This keeps track of all the active handlers
+        c_handlers = helpers.ContentHandlers(self.paths)
+
+        # Add handlers in cdir
+        potential_handlers = util.find_modules(cdir)
+        for (fname, modname) in potential_handlers.iteritems():
+            try:
+                mod = ud.fixup_module(importer.import_module(modname))
+                types = c_handlers.register(mod)
+                LOG.debug("Added handler for [%s] from %s", types, fname)
+            except:
+                LOG.exception("Failed to register handler from %s", fname)
+
+        def_handlers = c_handlers.register_defaults()
+        if def_handlers:
+            LOG.debug("Registered default handlers for [%s]", def_handlers)
+
+        # Form our cloud proxy
+        data = cloud.Cloud(self.datasource,
+                           self.paths, copy.deepcopy(self.cfg))
+
+        # Init the handlers first
+        # Ensure userdata fetched before activation
+        called = []
+        for (_mtype, mod) in c_handlers.iteritems():
+            if mod in called:
+                continue
+            ud.call_begin(mod, data, frequency)
+            called.append(mod)
+
+        # Walk the user data
+        part_data = {
+            'handlers': c_handlers,
+            'handlerdir': idir,
+            'data': data, 
+            'frequency': frequency,
+            'handlercount': 0,
+        }
+        ud.walk(data.get_userdata(), ud.walker_callback, data=part_data)
+
+        # Give callbacks opportunity to finalize
+        called = []
+        for (_mtype, mod) in c_handlers.iteritems():
+            if mod in called:
+                continue
+            ud.call_end(mod, data, frequency)
+            called.append(mod)
+
+
+class Handlers(object):
+    def __init__(self, datasource, h_cloud, cfgfile=None, basecfg=None):
+        self.datasource = datasource
+        self.cfgfile = cfgfile
+        self.basecfg = basecfg
+        self.h_cloud = h_cloud
+        self.cachedcfg = None
+
+    @property
+    def cfg(self):
+        if self.cachedcfg is None:
+            self.cachedcfg = self._get_config(self.cfgfile)
+        return self.cachedcfg
+
+    def _get_config(self, cfgfile):
+        mcfg = None
+
+        if self.cfgfile:
+            try:
+                mcfg = util.read_conf(cfgfile)
+            except:
+                LOG.exception(("Failed loading of cloud config '%s'. "
+                              "Continuing with an empty config."), cfgfile)
+        if not mcfg:
+            mcfg = {}
+
+        ds_cfg = None
+        try:
+            ds_cfg = self.datasource.get_config_obj()
+        except:
+            LOG.exception("Failed loading of datasource config.")
+        if not ds_cfg:
+            ds_cfg = {}
+
+        mcfg = util.mergedict(mcfg, ds_cfg)
+        if self.basecfg:
+            return util.mergedict(mcfg, self.basecfg)
+        else:
+            return mcfg
+
+
+    def _read_modules(self, name):
+        module_list = []
+        if name not in self.cfg:
+            return module_list
+        cfg_mods = self.cfg[name]
+        # Create 'module_list', an array of arrays
+        # Where array[0] = module name
+        #       array[1] = frequency
+        #       array[2:] = arguments
+        for item in cfg_mods:
+            if not item:
+                continue
+            if isinstance(item, str):
+                module_list.append([item])
+            elif isinstance(item, list):
+                module_list.append(item)
+            else:
+                raise TypeError("Failed to read '%s' item in config")
+        return module_list
+
+    def _form_modules(self, raw_mods):
+        mostly_mods = []
+        for raw_mod in raw_mods:
+            raw_name = raw_mod[0]
+            freq = None
+            run_args = None
+            if len(raw_mod) > 1:
+                freq = raw_mod[1]
+            if len(raw_mod) > 2:
+                run_args = raw_mod[2:]
+            if not run_args:
+                run_args = []
+            mod_name = handlers.form_module_name(raw_name)
+            if not mod_name:
+                continue
+            mod = handlers.fixup_module(importer.import_module(mod_name))
+            mostly_mods.append([mod, raw_name, freq, run_args])
+        return mostly_mods
+
+    def _run_modules(self, mostly_mods):
+        failures = []
+        for (mod, name, freq, args) in mostly_mods:
+            try:
+                if not freq:
+                    freq = mod.frequency
+                if not freq:
+                    freq = PER_INSTANCE
+                func_args = [name, copy.deepcopy(self.cfg),
+                             self.h_cloud, LOG,
+                             args]
+                run_name = "config-" + name        
+                self.h_cloud.run(run_name, mod.handle, func_args, freq=freq)
+            except:
+                LOG.exception("Running %s failed", mod)
+                failures.append(name)
+        return failures
+
+    def run(self, name):
+        raw_mods = self._read_modules(name)
+        mostly_mods = self._form_modules(raw_mods)
+        return self._run_modules(mostly_mods)

From 802d9f5886843031459c3abba2cac4188651b61b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:12:29 -0700
Subject: [PATCH 056/434] Moved these functions to utils.

---
 cloudinit/__init__.py | 14 --------------
 1 file changed, 14 deletions(-)

diff --git a/cloudinit/__init__.py b/cloudinit/__init__.py
index ab0603e0..da124641 100644
--- a/cloudinit/__init__.py
+++ b/cloudinit/__init__.py
@@ -19,17 +19,3 @@
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-from cloudinit import util
-
-from cloudinit.settings import (CFG_BUILTIN, CLOUD_CONFIG)
-
-
-def get_base_cfg(cfg_path=None):
-    if not cfg_path:
-        cfg_path = CLOUD_CONFIG
-    return util.get_base_cfg(cfg_path, get_builtin_cfg())
-
-
-def get_builtin_cfg():
-    return dict(CFG_BUILTIN)

From 006e4d65136e084482cd0c9e3e0096901dfecca7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:12:49 -0700
Subject: [PATCH 057/434] This will now just contain the "public" view of the
 cloud objects, backed by whatever other set of objects.

---
 cloudinit/cloud.py | 482 ++-------------------------------------------
 1 file changed, 11 insertions(+), 471 deletions(-)

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index 80d4f1ce..765e7d3a 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -20,158 +20,23 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-from time import time
-
-import cPickle as pickle
-
-import contextlib
-import copy
-import os
-import sys
-import weakref
-
-from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS)
-from cloudinit.settings import (OLD_CLOUD_CONFIG, CLOUD_CONFIG)
-
-from cloudinit import (get_builtin_cfg, get_base_cfg)
+from cloudinit import distros
+from cloudinit import helpers
 from cloudinit import log as logging
-from cloudinit import sources
-from cloudinit import util
-from cloudinit import handlers
-
-from cloudinit import user_data as ud
-from cloudinit.user_data import boot_hook as bh_part
-from cloudinit.user_data import cloud_config as cc_part
-from cloudinit.user_data import processor as ud_proc
-from cloudinit.user_data import shell_script as ss_part
-from cloudinit.user_data import upstart_job as up_part
 
 LOG = logging.getLogger(__name__)
 
 
-class CloudSemaphores(object):
-    def __init__(self, sem_path):
-        self.sem_path = sem_path
+class Cloud(object):
+    def __init__(self, datasource, paths, cfg):
+        self.datasource = datasource
+        self.paths = paths
+        self.cfg = cfg
+        self.distro = distros.fetch(cfg, self)
+        self.runners = helpers.Runners(paths)
 
-    # acquire lock on 'name' for given 'freq' and run function 'func'
-    # if 'clear_on_fail' is True and 'func' throws an exception
-    # then remove the lock (so it would run again)
-    def run_functor(self, name, freq, functor, args=None, clear_on_fail=False):
-        if not args:
-            args = []
-        if self.has_run(name, freq):
-            LOG.debug("%s already ran %s", name, freq)
-            return False
-        with self.lock(name, freq, clear_on_fail) as lock:
-            if not lock:
-                raise RuntimeError("Failed to acquire lock on %s" % name)
-            else:
-                LOG.debug("Running %s with args %s using lock %s", func, args, lock)
-                func(*args)
-        return True
-
-    @contextlib.contextmanager
-    def lock(self, name, freq, clear_on_fail=False):
-        try:
-            yield self._acquire(name, freq)
-        except:
-            if clear_on_fail:
-                self.clear(name, freq)
-            raise
-
-    def clear(self, name, freq):
-        sem_file = self._getpath(name, freq)
-        try:
-            util.del_file(sem_file)
-        except IOError:
-            return False
-        return True
-
-    def _acquire(self, name, freq):
-        if self.has_run(name, freq):
-            return None
-        # This is a race condition since nothing atomic is happening
-        # here, but this should be ok due to the nature of when
-        # and where cloud-init runs... (file writing is not a lock..)
-        sem_file = self._getpath(name, freq)
-        contents = "%s: %s\n" % (os.getpid(), time())
-        try:
-            util.write_file(sem_file, contents)
-        except (IOError, OSError):
-            return None
-        return sem_file
-
-    def has_run(self, name, freq):
-        if freq == PER_ALWAYS:
-            return False
-        sem_file = self._get_path(name, freq)
-        if os.path.exists(sem_file):
-            return True
-        return False
-
-    def _get_path(self, name, freq):
-        sem_path = self.sem_path
-        if freq == PER_INSTANCE:
-            return os.path.join(sem_path, name)
-        return os.path.join(sem_path, "%s.%s" % (name, freq))
-
-
-class CloudPaths(object):
-    def __init__(self, sys_info):
-        self.cloud_dir = sys_info['cloud_dir']
-        self.instance_link = os.path.join(self.cloud_dir, 'instance')
-        self.boot_finished = os.path.join(self.instance_link, "boot-finished")
-        self.upstart_conf_d = sys_info.get('upstart_dir')
-        self.template_dir = sys_info['templates_dir']
-        self.seed_dir = os.path.join(self.cloud_dir, 'seed')
-        self.datasource = None
-        self.lookups = {
-           "handlers": "handlers",
-           "scripts": "scripts",
-           "sem": "sem",
-           "boothooks": "boothooks",
-           "userdata_raw": "user-data.txt",
-           "userdata": "user-data.txt.i",
-           "obj_pkl": "obj.pkl",
-           "cloud_config": "cloud-config.txt",
-           "data": "data",
-        }
-
-    # get_ipath_cur: get the current instance path for an item
-    def get_ipath_cur(self, name=None):
-        ipath = os.path.join(self.cloud_dir, 'instance')
-        add_on = self.lookups.get(name)
-        if add_on:
-            ipath = os.path.join(ipath, add_on)
-        return ipath
-
-    # get_cpath : get the "clouddir" (/var/lib/cloud/<name>)
-    # for a name in dirmap
-    def get_cpath(self, name=None):
-        cpath = self.var_dir
-        add_on = self.lookups.get(name)
-        if add_on:
-            cpath = os.path.join(cpath, add_on)
-        return cpath
-
-    # get_ipath : get the instance path for a name in pathmap
-    # (/var/lib/cloud/instances/<instance>/<name>)
-    def get_ipath(self, name=None):
-        if not self.datasource:
-            raise RuntimeError("Unable to get instance path, datasource not available/set.")
-        iid = self.datasource.get_instance_id()
-        ipath = os.path.join(self.cloud_dir, 'instances', iid)
-        add_on = self.lookups.get(name)
-        if add_on:
-            ipath = os.path.join(ipath, add_on)
-        return ipath
-
-
-class CloudSimple(object):
-    def __init__(self, ci):
-        self.datasource = init.datasource
-        self.paths = init.paths
-        self.cfg = copy.deepcopy(ci.cfg)
+    def run(self, name, functor, args, freq=None, clear_on_fail=False):
+        return self.runners.run(name, functor, args, freq, clear_on_fail)
 
     def get_userdata(self):
         return self.datasource.get_userdata()
@@ -199,328 +64,3 @@ class CloudSimple(object):
 
     def get_ipath(self, name=None):
         return self.paths.get_ipath(name)
-
-
-class CloudInit(object):
-    def __init__(self, ds_deps=None):
-        self.datasource = None
-        if ds_deps:
-            self.ds_deps = ds_deps
-        else:
-            self.ds_deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
-        self.cfg = self._read_cfg()
-        self.paths = CloudPaths(self.cfg['system_info'])
-
-    def _read_cfg_old(self):
-        # support reading the old ConfigObj format file and merging
-        # it into the yaml dictionary
-        try:
-            from configobj import ConfigObj
-        except ImportError:
-            ConfigObj = None
-        if not ConfigObj:
-            return {}
-        old_cfg = ConfigObj(OLD_CLOUD_CONFIG)
-        return dict(old_cfg)
-
-    def _initial_subdirs(self):
-        c_dir = self.paths.cloud_dir
-        initial_dirs = [
-            os.path.join(c_dir, 'scripts'),
-            os.path.join(c_dir, 'scripts', 'per-instance'),
-            os.path.join(c_dir, 'scripts', 'per-once'),
-            os.path.join(c_dir, 'scripts', 'per-boot'),
-            os.path.join(c_dir, 'seed'),
-            os.path.join(c_dir, 'instances'),
-            os.path.join(c_dir, 'handlers'),
-            os.path.join(c_dir, 'sem'),
-            os.path.join(c_dir, 'data'),
-        ]
-        return initial_dirs
-
-    def purge_cache(self, rmcur=True):
-        rmlist = []
-        rmlist.append(self.paths.boot_finished)
-        if rmcur:
-            rmlist.append(self.paths.instance_link)
-        for f in rmlist:
-            util.unlink(f)
-        return len(rmlist)
-
-    def init_fs(self):
-        util.ensure_dirs(self._initial_subdirs())
-        log_file = util.get_cfg_option_str(self.cfg, 'def_log_file', None)
-        perms = util.get_cfg_option_str(self.cfg, 'syslog_fix_perms', None)
-        if log_file:
-            util.ensure_file(log_file)
-            if perms:
-                (u, g) = perms.split(':', 1)
-                if u == "-1" or u == "None":
-                    u = None
-                if g == "-1" or g == "None":
-                    g = None
-                util.chownbyname(log_file, u, g)
-
-    def _read_cfg(self):
-        starting_config = get_builtin_cfg()
-        try:
-            conf = get_base_cfg(CLOUD_CONFIG, starting_config)
-        except Exception:
-            conf = starting_config
-        old_conf = self._read_cfg_old()
-        conf = util.mergedict(conf, old_conf)
-        return conf
-    
-    def _restore_from_cache(self):
-        pickled_fn = self.paths.get_ipath_cur('obj_pkl')
-        try:
-            # we try to restore from a current link and static path
-            # by using the instance link, if purge_cache was called
-            # the file wont exist
-            return pickle.loads(util.load_file(pickled_fn))
-        except Exception as e:
-            LOG.debug("Failed loading pickled datasource from %s due to %s", pickled_fn, e)
-            return False
-
-    def write_to_cache(self):
-        pickled_fn = self.paths.get_ipath_cur("obj_pkl")
-        try:
-            contents = pickle.dumps(self.datasource)
-            util.write_file(pickled_fn, contents, mode=0400)
-        except Exception as e:
-            LOG.debug("Failed pickling datasource to %s due to: %s", pickled_fn, e)
-            return False
-
-    def _get_processor(self):
-        return ud_proc.UserDataProcessor(self.paths)
-
-    def _get_datasources(self):
-        # Any config provided???
-        pkg_list = self.cfg.get('datasource_pkg_list') or []
-        # Add the defaults at the end
-        for n in [util.obj_name(sources), '']:
-            if n not in pkg_list:
-                pkg_list.append(n)
-        cfg_list = self.cfg.get('datasource_list') or []
-        return (cfg_list, pkg_list)
-
-    def get_data_source(self):
-        if self.datasource:
-            return True
-        ds = self._restore_from_cache()
-        if ds:
-            LOG.debug("Restored from cache datasource: %s" % ds)
-        else:
-            (cfg_list, pkg_list) = self._get_datasources()
-            ud_proc = self._get_processor()
-            (ds, dsname) = sources.find_source(self.cfg,
-                                               self.ds_deps,
-                                               cfg_list=cfg_list,
-                                               pkg_list=pkg_list,
-                                               ud_proc=ud_proc)
-            LOG.debug("Loaded datasource %s - %s", dsname, ds)
-        self.datasource = ds
-        # This allows the paths obj to have an ipath function that works
-        self.paths.datasource = ds
-        return True
-
-    def set_cur_instance(self):
-        # Ensure we are hooked into the right symlink for the current instance
-        idir = self.paths.get_ipath()
-        util.del_file(self.paths.instance_link)
-        util.sym_link(idir, self.paths.instance_link)
-
-        dlist = []
-        for d in ["handlers", "scripts", "sem"]:
-            dlist.append(os.path.join(idir, d))
-        util.ensure_dirs(dlist)
-
-        # Write out information on what is being used for the current instance
-        # and what may have been used for a previous instance...
-        dp = self.paths.get_cpath('data')
-        ds = "%s: %s\n" % (self.datasource.__class__, self.datasource)
-        previous_ds = ''
-        ds_fn = os.path.join(idir, 'datasource')
-        try:
-            previous_ds = util.load_file(ds_fn).strip()
-        except IOError as e:
-            pass
-        if not previous_ds:
-            # TODO: ?? is this right
-            previous_ds = ds
-        util.write_file(ds_fn, ds)
-        util.write_file(os.path.join(dp, 'previous-datasource'), previous_ds)
-        iid = self.datasource.get_instance_id()
-        previous_iid = ''
-        p_iid_fn = os.path.join(dp, 'previous-instance-id')
-        try:
-            previous_iid = util.load_file(p_iid_fn).strip()
-        except IOError as e:
-            pass
-        if not previous_iid:
-            # TODO: ?? is this right
-            previous_iid = iid
-        util.write_file(p_iid_fn, "%s\n" % previous_iid)
-
-    def update_cache(self):
-        self.write_to_cache()
-        self.store_userdata()
-
-    def store_userdata(self):
-        raw_ud = "%s" % (self.datasource.get_userdata_raw())
-        util.write_file(self.paths.get_ipath('userdata_raw'), raw_ud, 0600)
-        ud = "%s" % (self.datasource.get_userdata())
-        util.write_file(self.paths.get_ipath('userdata'), ud, 0600)
-
-    def consume_userdata(self, frequency=PER_INSTANCE):
-        cdir = self.paths.get_cpath("handlers")
-        idir = self.paths.get_ipath("handlers")
-    
-        # Add the path to the plugins dir to the top of our list for import
-        # instance dir should be read before cloud-dir
-        sys.path.insert(0, cdir)
-        sys.path.insert(0, idir)
-
-        # Data will be a little proxy that modules can use
-        data = CloudSimple(self)
-
-        # This keeps track of all the active handlers
-        handlers = CloudHandlers(self)
-
-        # Add handlers in cdir
-        potential_handlers = utils.find_modules(cdir)
-        for (fname, modname) in potential_handlers.iteritems():
-            try:
-                mod = parts.fixup_module(importer.import_module(modname))
-                types = handlers.register(mod)
-                LOG.debug("Added handler for [%s] from %s", types, fname)
-            except:
-                LOG.exception("Failed to register handler from %s", fname)
-
-        def_handlers = handlers.register_defaults()
-        if def_handlers:
-            LOG.debug("Registered default handlers for [%s]", def_handlers)
-
-        # Init the handlers first
-        # Ensure userdata fetched before activation
-        called = []
-        for (_mtype, mod) in handlers.iteritems():
-            if mod in called:
-                continue
-            parts.call_begin(mod, data, frequency)
-            called.append(mod)
-
-        # Walk the user data
-        part_data = {
-            'handlers': handlers,
-            'handlerdir': idir,
-            'data': data, 
-            'frequency': frequency,
-            'handlercount': 0,
-        }
-        ud.walk(data.get_userdata(), parts.walker_callback, data=part_data)
-
-        # Give callbacks opportunity to finalize
-        called = []
-        for (_mtype, mod) in handlers.iteritems():
-            if mod in called:
-                continue
-            parts.call_end(mod, data, frequency)
-            called.append(mod)
-
-
-class CloudHandlers(object):
-
-    def __init__(self, paths):
-        self.paths = paths
-        self.registered = {}
-
-    def __contains__(self, item):
-        return self.is_registered(item)
-
-    def __getitem__(self, key):
-        return self._get_handler(key)
-
-    def is_registered(self, content_type):
-        return content_type in self.registered
-
-    def register(self, mod):
-        types = set()
-        for t in mod.list_types():
-            self.registered[t] = handler
-            types.add(t)
-        return types
-
-    def _get_handler(self, content_type):
-        return self.registered[content_type]
-
-    def items(self):
-        return self.registered.items()
-
-    def iteritems(self):
-        return self.registered.iteritems()
-
-    def _get_default_handlers(self):
-        def_handlers = []
-        if self.paths.get_ipath("cloud_config"):
-            def_handlers.append(cc_part.CloudConfigPartHandler(self.paths.get_ipath("cloud_config")))
-        if self.paths.get_ipath_cur('scripts'):
-            def_handlers.append(ss_part.ShellScriptPartHandler(self.paths.get_ipath_cur('scripts')))
-        if self.paths.get_ipath("boothooks"):
-            def_handlers.append(bh_part.BootHookPartHandler(self.paths.get_ipath("boothooks")))
-        if self.paths.upstart_conf_d:
-            def_handlers.append(up_part.UpstartJobPartHandler(self.paths.upstart_conf_d))
-        return def_handlers
-
-    def register_defaults(self):
-        registered = set()
-        for h in self._get_default_handlers():
-            for t in h.list_types():
-                if not self.is_registered(t)
-                    self.register_handler(t, h)
-                    registered.add(t)
-        return registered
-
-
-class CloudConfig(object):
-    def __init__(self, cfgfile, cloud):
-        self.cloud = cloud
-        self.cfg = self._get_config(cfgfile)
-        self.paths = cloud.paths
-        self.sems = CloudSemaphores(self.paths.get_ipath("sem"))
-
-    def _get_config(self, cfgfile):
-        cfg = None
-        try:
-            cfg = util.read_conf(cfgfile)
-        except:
-            LOG.exception(("Failed loading of cloud config '%s'. "
-                          "Continuing with empty config."), cfgfile)
-        if not cfg:
-            cfg = {}
-
-        ds_cfg = None
-        try:
-            ds_cfg = self.cloud.datasource.get_config_obj()
-        except:
-            LOG.exception("Failed loading of datasource config.")
-        if not ds_cfg:
-            ds_cfg = {}
-
-        cfg = util.mergedict(cfg, ds_cfg)
-        cloud_cfg = self.cloud.cfg or {}
-        return util.mergedict(cfg, cloud_cfg)
-
-    def extract(self, name):
-        modname = handlers.form_module_name(name)
-        if not modname:
-            return None
-        return handlers.fixup_module(importer.import_module(modname))
-
-    def handle(self, name, mod, args, freq=None):
-        def_freq = mod.frequency 
-        if not freq:
-            freq = def_freq
-        c_name = "config-%s" % (name)
-        real_args = [name, copy.deepcopy(self.cfg), CloudSimple(self.cloud), LOG, copy.deepcopy(args)]
-        return self.sems.run_functor(c_name, freq, mod.handle, real_args)

From 0c636bfad4c9989af3fdb1221050c0febf86d418 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:13:19 -0700
Subject: [PATCH 058/434] Adding in the root distro class + a util function to
 fetch various distros.

---
 cloudinit/distros/__init__.py | 45 +++++++++++++++++++++++++++++++++++
 1 file changed, 45 insertions(+)

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index e69de29b..f7f48d1f 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -0,0 +1,45 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+import contextlib
+
+from cloudinit import importer
+
+
+class Distro(object):
+    def __init__(self, cloud):
+        self.cloud = cloud
+
+    def install_packages(self, pkglist):
+        raise NotImplementedError()
+
+    def apply_network(self, settings):
+        raise NotImplementedError()
+
+
+def fetch(cfg, cloud):
+    sys_info = cfg.get('system_info', {})
+    distro = sys_info.get('distro', 'ubuntu')
+    mod_name = "%s.%s" % (__name__, distro)
+    mod = importer.import_module(mod_name)
+    distro_cls = getattr(mod, 'Distro')
+    return distro_cls(cloud)
\ No newline at end of file

From 08313c0d7c3c9efcef058426bc38a84eea3c8931 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:14:46 -0700
Subject: [PATCH 059/434] Adding in the base of a ubuntu distro subclass that
 can install pkgs (right now).

---
 cloudinit/distros/ubuntu.py | 55 +++++++++++++++++++++++++++++++++++++
 1 file changed, 55 insertions(+)

diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index e69de29b..d19ef63e 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -0,0 +1,55 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+import os
+
+from cloudinit import distros
+from cloudinit import log as logging
+from cloudinit import util
+
+from cloudinit.settings import (PER_INSTANCE)
+
+
+LOG = logging.getLogger(__name__)
+
+
+class Distro(distros.Distro):
+
+    def install_packages(self, pkglist):
+        self.update_package_sources()
+        self.apt_get('install', pkglist)
+
+    def apply_network(self, settings):
+        pass
+
+    # apt_get top level command (install, update...), and args to pass it
+    def apt_get(self, tlc, args=None):
+        e = os.environ.copy()
+        e['DEBIAN_FRONTEND'] = 'noninteractive'
+        cmd = ['apt-get', '--option', 'Dpkg::Options::=--force-confold',
+               '--assume-yes', tlc]
+        if args:
+            cmd.extend(args)
+        util.subp(cmd, env=e)
+
+    def update_package_sources(self):
+        self.cloud.run("update-sources", self.apt_get, ["update"], freq=PER_INSTANCE)
\ No newline at end of file

From 37e46182b7a635907c23fef65607dbd1c6f0c9b6 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:15:16 -0700
Subject: [PATCH 060/434] Removing distro specifics from here, as well as
 running functionality (which is now elsewhere).

---
 cloudinit/handlers/__init__.py | 40 +++-------------------------------
 1 file changed, 3 insertions(+), 37 deletions(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index ae74b683..5d70ac43 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -36,7 +36,6 @@ LOG = logging.getLogger(__name__)
 
 DEF_HANDLER_VERSION = 1
 DEF_FREQ = PER_INSTANCE
-HANDLER_TPL = "cc_%s"
 
 
 # reads a cloudconfig module list, returns
@@ -198,41 +197,6 @@ def redirect_output(outfmt, errfmt, o_out=sys.stdout, o_err=sys.stderr):
     return
 
 
-def run_per_instance(name, func, args, clear_on_fail=False):
-    semfile = "%s/%s" % (cloudinit.get_ipath_cur("data"), name)
-    if os.path.exists(semfile):
-        return
-
-    util.write_file(semfile, str(time.time()))
-    try:
-        func(*args)
-    except:
-        if clear_on_fail:
-            os.unlink(semfile)
-        raise
-
-
-# apt_get top level command (install, update...), and args to pass it
-def apt_get(tlc, args=None):
-    if args is None:
-        args = []
-    e = os.environ.copy()
-    e['DEBIAN_FRONTEND'] = 'noninteractive'
-    cmd = ['apt-get', '--option', 'Dpkg::Options::=--force-confold',
-           '--assume-yes', tlc]
-    cmd.extend(args)
-    subprocess.check_call(cmd, env=e)
-
-
-def update_package_sources():
-    run_per_instance("update-sources", apt_get, ("update",))
-
-
-def install_packages(pkglist):
-    update_package_sources()
-    apt_get("install", pkglist)
-
-
 def form_module_name(name):
     canon_name = name.replace("-", "_")
     if canon_name.endswith(".py"):
@@ -240,7 +204,9 @@ def form_module_name(name):
     canon_name = canon_name.strip()
     if not canon_name:
         return None
-    return HANDLER_TPL % (canon_name)
+    if not canon_name.startswith("cc_"):
+        canon_name = 'cc_%s' % (canon_name)
+    return canon_name
 
 
 def fixup_module(mod):

From bfa0fd6c7e46eedefb2e904a206b51a2e6709580 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:15:39 -0700
Subject: [PATCH 061/434] Added log setup and a basic log (for when one is not
 enabled)

---
 cloudinit/log.py | 72 +++++++++++++++++++++++++-----------------------
 1 file changed, 38 insertions(+), 34 deletions(-)

diff --git a/cloudinit/log.py b/cloudinit/log.py
index 341b329b..6e7424e1 100644
--- a/cloudinit/log.py
+++ b/cloudinit/log.py
@@ -40,52 +40,56 @@ INFO = logging.INFO
 DEBUG = logging.DEBUG
 NOTSET = logging.NOTSET
 
-
-class ConsoleFormatter(logging.Formatter):
-
-    def _get_mini_level(self, record):
-        if record.levelno in [INFO, NOTSET] or not record.levelname:
-            return ''
-        lvlname = record.levelname
-        return lvlname[0].upper() + ": "
-
-    def format(self, record):
-        record.message = record.getMessage()
-        rdict = dict(record.__dict__)
-        rdict['minilevelname'] = self._get_mini_level(record)
-        return self._fmt % (rdict)
+# Default basic format
+DEF_FORMAT = '%(levelname)s: @%(name)s : %(message)s'
 
 
-def setupLogging(cfg):
+def setupBasicLogging(level=INFO, fmt=DEF_FORMAT):
+    root = getLogger()
+    console = logging.StreamHandler(sys.stdout)
+    console.setFormatter(logging.Formatter(fmt))
+    console.setLevel(level)
+    root.addHandler(console)
+    root.setLevel(level)
+
+
+def setupLogging(cfg=None):
+    # See if the config provides any logging conf...
+    if not cfg:
+        cfg = {}
+
     log_cfgs = []
     log_cfg = cfg.get('logcfg')
-    if log_cfg:
-        # if there is a 'logcfg' entry in the config, respect
-        # it, it is the old keyname
-        log_cfgs = [log_cfg]
-    elif "log_cfgs" in cfg:
-        for cfg in cfg['log_cfgs']:
-            if isinstance(cfg, list):
-                log_cfgs.append('\n'.join(cfg))
+    if log_cfg and isinstance(log_cfg, (str, basestring)):
+        # Ff there is a 'logcfg' entry in the config,
+        # respect it, it is the old keyname
+        log_cfgs.append(str(log_cfg))
+    elif "log_cfgs" in cfg and isinstance(cfg['log_cfgs'], (set, list)):
+        for a_cfg in cfg['log_cfgs']:
+            if isinstance(a_cfg, (list, set, dict)):
+                cfg_str = [str(c) for c in a_cfg]
+                log_cfgs.append('\n'.join(cfg_str))
             else:
-                log_cfgs.append(cfg)
-
-    if not len(log_cfgs):
-        sys.stderr.write("Warning, no logging configured\n")
-        return
+                log_cfgs.append(str(a_cfg))
 
+    # See if any of them actually load...
     am_worked = 0
-    for logcfg in log_cfgs:
+    for log_cfg in log_cfgs:
         try:
-            if not os.path.isfile(logcfg):
-                logcfg = StringIO(logcfg)
-            logging.config.fileConfig(logcfg)
+            if not os.path.isfile(log_cfg):
+                log_cfg = StringIO(log_cfg)
+            logging.config.fileConfig(log_cfg)
             am_worked += 1
-        except:
+        except Exception:
             pass
 
+    # If it didn't work, at least setup a basic logger
+    basic_enabled = cfg.get('log_basic', True)
     if not am_worked:
-        sys.stderr.write("Warning, no logging configured\n")
+        sys.stderr.write("Warning, no logging configured!\n")
+        if basic_enabled:
+            sys.stderr.write("Setting up basic logging...\n")
+            setupBasicLogging()
 
 
 def getLogger(name='cloudinit'):

From 8cb0882dd411a9be2f4972ac7ab6ee50ead61416 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:16:07 -0700
Subject: [PATCH 062/434] Start of cleaning this up.

---
 cloudinit/netinfo.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/cloudinit/netinfo.py b/cloudinit/netinfo.py
index 1f0fa571..541d2911 100644
--- a/cloudinit/netinfo.py
+++ b/cloudinit/netinfo.py
@@ -22,6 +22,11 @@
 import cloudinit.util as util
 
 
+class NetInfo(object):
+    def __init__(self):
+        pass
+
+
 def netdev_info(empty=""):
     fields = ("hwaddr", "addr", "bcast", "mask")
     (ifcfg_out, _err) = util.subp(["ifconfig", "-a"])

From 09273ee69b69418f683b5f98d1f01243c3c5638b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:16:19 -0700
Subject: [PATCH 063/434] Fix this up to use the new datasource class hierarchy,
 as well as other new objects/logging added...

---
 cloudinit/sources/DataSourceCloudStack.py | 78 +++++++++++++----------
 1 file changed, 43 insertions(+), 35 deletions(-)

diff --git a/cloudinit/sources/DataSourceCloudStack.py b/cloudinit/sources/DataSourceCloudStack.py
index 5afdf7b6..33fb3491 100644
--- a/cloudinit/sources/DataSourceCloudStack.py
+++ b/cloudinit/sources/DataSourceCloudStack.py
@@ -18,62 +18,68 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.DataSource as DataSource
-
-from cloudinit import seeddir as base_seeddir
-from cloudinit import log
-import cloudinit.util as util
 from socket import inet_ntoa
-import time
-import boto.utils as boto_utils
 from struct import pack
 
+import os
+import time
 
-class DataSourceCloudStack(DataSource.DataSource):
-    api_ver = 'latest'
-    seeddir = base_seeddir + '/cs'
-    metadata_address = None
+import boto.utils as boto_utils
 
-    def __init__(self, sys_cfg=None):
-        DataSource.DataSource.__init__(self, sys_cfg)
+from cloudinit import log as logging
+from cloudinit import sources
+from cloudinit import util
+
+LOG = logging.getLogger(__name__)
+
+
+class DataSourceCloudStack(sources.DataSource):
+    def __init__(self, sys_cfg, distro, paths):
+        sources.DataSource.__init__(self, sys_cfg, distro, paths)
+        self.seed_dir = os.path.join(paths.seed_dir, 'cs')
         # Cloudstack has its metadata/userdata URLs located at
         # http://<default-gateway-ip>/latest/
-        self.metadata_address = "http://%s/" % self.get_default_gateway()
+        self.api_ver = 'latest'
+        gw_addr = self.get_default_gateway()
+        if not gw_addr:
+            raise RuntimeError("No default gateway found!")
+        self.metadata_address = "http://%s/" % (gw_addr)
 
     def get_default_gateway(self):
         """ Returns the default gateway ip address in the dotted format
         """
-        with open("/proc/net/route", "r") as f:
-            for line in f.readlines():
-                items = line.split("\t")
-                if items[1] == "00000000":
-                    # found the default route, get the gateway
-                    gw = inet_ntoa(pack("<L", int(items[2], 16)))
-                    log.debug("found default route, gateway is %s" % gw)
-                    return gw
+        lines = util.load_file("/proc/net/route").splitlines()
+        for line in lines:
+            items = line.split("\t")
+            if items[1] == "00000000":
+                # Found the default route, get the gateway
+                gw = inet_ntoa(pack("<L", int(items[2], 16)))
+                LOG.debug("Found default route, gateway is %s", gw)
+                return gw
+        return None
 
     def __str__(self):
-        return "DataSourceCloudStack"
+        return util.obj_name(self)
 
     def get_data(self):
-        seedret = {}
-        if util.read_optional_seed(seedret, base=self.seeddir + "/"):
-            self.userdata_raw = seedret['user-data']
-            self.metadata = seedret['meta-data']
-            log.debug("using seeded cs data in %s" % self.seeddir)
+        seed_ret = {}
+        if util.read_optional_seed(seed_ret, base=(self.seed_dir + "/")):
+            self.userdata_raw = seed_ret['user-data']
+            self.metadata = seed_ret['meta-data']
+            LOG.info("Using seeded cloudstack data from: %s", self.seed_dir)
             return True
-
         try:
             start = time.time()
             self.userdata_raw = boto_utils.get_instance_userdata(self.api_ver,
                 None, self.metadata_address)
             self.metadata = boto_utils.get_instance_metadata(self.api_ver,
                 self.metadata_address)
-            log.debug("crawl of metadata service took %ds" %
-                (time.time() - start))
+            LOG.debug("Crawl of metadata service took %ds",
+                      (time.time() - start))
             return True
         except Exception as e:
-            log.exception(e)
+            LOG.exception(('Failed fetching from metadata '
+                           'service %s due to: %s'), self.metadata_address, e)
             return False
 
     def get_instance_id(self):
@@ -82,11 +88,13 @@ class DataSourceCloudStack(DataSource.DataSource):
     def get_availability_zone(self):
         return self.metadata['availability-zone']
 
+
+# Used to match classes to dependencies
 datasources = [
-  (DataSourceCloudStack, (DataSource.DEP_FILESYSTEM, DataSource.DEP_NETWORK)),
+  (DataSourceCloudStack, (sources.DEP_FILESYSTEM, sources.DEP_NETWORK)),
 ]
 
 
-# return a list of data sources that match this set of dependencies
+# Return a list of data sources that match this set of dependencies
 def get_datasource_list(depends):
-    return DataSource.list_from_depends(depends, datasources)
+    return sources.list_from_depends(depends, datasources)

From c776a86fcb953e1b5552edfc5ef827a24545b0b7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:17:05 -0700
Subject: [PATCH 064/434] Add more logging about what is being searched for.

---
 cloudinit/sources/__init__.py | 35 +++++++++++++++++++----------------
 1 file changed, 19 insertions(+), 16 deletions(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 05c8bfad..dfd1fff3 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -24,9 +24,12 @@ from cloudinit import importer
 from cloudinit import log as logging
 from cloudinit import util
 
+from cloudinit.user_data import processor as ud_proc
+
 DEP_FILESYSTEM = "FILESYSTEM"
 DEP_NETWORK = "NETWORK"
 DS_PREFIX = 'DataSource'
+
 LOG = logging.getLogger(__name__)
 
 
@@ -35,26 +38,25 @@ class DataSourceNotFoundException(Exception):
 
 
 class DataSource(object):
-    def __init__(self, ud_proc, cfg):
+    def __init__(self, sys_cfg, distro, paths):
         name = util.obj_name(self)
         if name.startswith(DS_PREFIX):
             name = name[DS_PREFIX:]
         self.cfgname = name
-        if sys_cfg:
-            self.sys_cfg = sys_cfg
-        else:
-            self.sys_cfg = {}
-        self.ud_proc = ud_proc
+        self.sys_cfg = sys_cfg
+        self.distro = distro
+        self.paths = paths
+        self.userdata_proc = ud_proc.UserDataProcessor(paths)
         self.userdata = None
         self.metadata = None
         self.userdata_raw = None
         self.ds_cfg = util.get_cfg_by_path(self.sys_cfg,
-                          ("datasource", self.cfgname), self.ds_cfg)
+                        ("datasource", self.cfgname), {})
 
     def get_userdata(self):
         if self.userdata is None:
             raw_data = self.get_userdata_raw()
-            self.userdata = self.ud_proc.process(raw_data)
+            self.userdata = self.userdata_proc.process(raw_data)
         return self.userdata
 
     def get_userdata_raw(self):
@@ -85,7 +87,7 @@ class DataSource(object):
                 # than a list.
                 if isinstance(klist, (str)):
                     klist = [klist]
-                if isinstance(klist, (list)):
+                if isinstance(klist, (list, set)):
                     for pkey in klist:
                         # there is an empty string at the end of the keylist, trim it
                         if pkey:
@@ -105,6 +107,7 @@ class DataSource(object):
         return 'en_US.UTF-8'
 
     def get_local_mirror(self):
+        # ??
         return None
 
     def get_instance_id(self):
@@ -152,20 +155,18 @@ class DataSource(object):
             return hostname
 
 
-def find_source(cfg, ds_deps, cfg_list, pkg_list, **kwargs):
+def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
     ds_list = list_sources(cfg_list, ds_deps, pkg_list)
     ds_names = [util.obj_name(f) for f in ds_list]
-    ds_args = dict(kwargs)
-    ds_args['cfg'] = cfg
     LOG.info("Searching for data source in: %s", ds_names)
     for cls in ds_list:
         ds = util.obj_name(cls)
         try:
-            s = cls(**ds_args)
+            s = cls(distro, sys_cfg, paths)
             if s.get_data():
                 return (s, ds)
         except Exception as e:
-            LOG.exception("Getting data from %s failed", ds)
+            LOG.exception("Getting data from %s failed due to %s", ds, e)
 
     msg = "Did not find any data source, searched classes: %s" % (ds_names)
     raise DataSourceNotFoundException(msg)
@@ -187,8 +188,7 @@ def list_sources(cfg_list, depends, pkg_list):
             if pkg:
                 pkg_name.append(str(pkg))
             pkg_name.append(ds_name)
-            mod_name = ".".join(pkg_name)
-            mod = importer.import_module(mod_name)
+            mod = importer.import_module(".".join(pkg_name))
             if pkg:
                 mod = getattr(mod, ds_name, None)
             if not mod:
@@ -196,10 +196,13 @@ def list_sources(cfg_list, depends, pkg_list):
             lister = getattr(mod, "get_datasource_list", None)
             if not lister:
                 continue
+            LOG.debug("Seeing if %s matches using function %s", mod, lister)
             cls_matches = lister(depends)
             if not cls_matches:
                 continue
             src_list.extend(cls_matches)
+            LOG.debug("Found a match for data source %s in %s with matches %s", 
+                        ds_name, mod, cls_matches)
             break
     return src_list
 

From fb98ec8831624078172358dc8b25547a272e5c28 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:17:51 -0700
Subject: [PATCH 065/434] Add comments on formats, add in function that handles
 option extraction + other pylint cleanups.

---
 cloudinit/ssh_util.py | 105 +++++++++++++++++++++++++-----------------
 1 file changed, 62 insertions(+), 43 deletions(-)

diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index 93fd55dd..c97b3819 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -19,6 +19,9 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+from StringIO import StringIO
+
+import csv
 import os
 import pwd
 
@@ -26,6 +29,7 @@ from cloudinit import log as logging
 from cloudinit import util
 
 LOG = logging.getLogger(__name__)
+DEF_SSHD_CFG = "/etc/ssh/sshd_config"
 
 
 class AuthKeyEntry(object):
@@ -52,6 +56,40 @@ class AuthKeyEntry(object):
         self.line = str(line)
         (self.value, self.components) = self._parse(self.line, def_opt)
 
+    def _extract_options(self, ent):
+        """
+        The options (if present) consist of comma-separated option specifica-
+         tions.  No spaces are permitted, except within double quotes.
+         Note that option keywords are case-insensitive.
+        """
+        quoted = False
+        i = 0
+        while (i < len(ent) and
+               ((quoted) or (ent[i] not in (" ", "\t")))):
+            curc = ent[i]
+            if i + 1 >= len(ent):
+                i = i + 1
+                break
+            nextc = ent[i + 1]
+            if curc == "\\" and nextc == '"':
+                i = i + 1
+            elif curc == '"':
+                quoted = not quoted
+            i = i + 1
+    
+        options = ent[0:i]
+        options_lst = []
+        reader = csv.reader(StringIO(options), quoting=csv.QUOTE_NONE)
+        for row in reader:
+            for e in row:
+                e = e.strip()
+                if e:
+                    options_lst.append(e)
+        toks = []
+        if i + 1 < len(ent):
+            toks = ent[i + 1:].split(None, 3)
+        return (options_lst, toks)
+
     def _form_components(self, toks):
         components = {}
         if len(toks) == 1:
@@ -81,29 +119,10 @@ class AuthKeyEntry(object):
             if len(toks) < 4:
                 tmp_components.update(self._form_components(toks))
             else:
-                # taken from auth_rsa_key_allowed in auth-rsa.c
-                i = 0
-                quoted = False
-                try:
-                    while (i < len(ent) and
-                           ((quoted) or (ent[i] not in (" ", "\t")))):
-                        curc = ent[i]
-                        nextc = ent[i + 1]
-                        if curc == "\\" and nextc == '"':
-                            i = i + 1
-                        elif curc == '"':
-                            quoted = not quoted
-                        i = i + 1
-                except IndexError:
-                    return (False, {})
-                try:
-                    options = ent[0:i]
-                    toks = ent[i + 1:].split(None, 3)
-                    if options:
-                        tmp_components['options'] = options
-                    tmp_components.update(self._form_components(toks))
-                except (IndexError, ValueError):
-                    return (False, {})
+                (options, toks) = self._extract_options(ent)
+                if options:
+                    tmp_components['options'] = ",".join(options)
+                tmp_components.update(self._form_components(toks))
             # We got some useful value!
             return (True, tmp_components)
 
@@ -125,7 +144,7 @@ class AuthKeyEntry(object):
             return ' '.join(toks)
 
 
-def update_authorized_keys(fname, keys):
+def _update_authorized_keys(fname, keys):
     lines = []
     try:
         if os.path.isfile(fname):
@@ -159,9 +178,11 @@ def update_authorized_keys(fname, keys):
     return '\n'.join(lines)
 
 
-def setup_user_keys(keys, user, key_prefix, sshd_config_fn="/etc/ssh/sshd_config"):
-    pwent = pwd.getpwnam(user)
+def setup_user_keys(keys, user, key_prefix, sshd_config_fn=None):
+    if not sshd_config_fn:
+        sshd_config_fn = DEF_SSHD_CFG
 
+    pwent = pwd.getpwnam(user)
     ssh_dir = os.path.join(pwent.pw_dir, '.ssh')
     if not os.path.exists(ssh_dir):
         util.ensure_dir(ssh_dir, mode=0700)
@@ -173,14 +194,12 @@ def setup_user_keys(keys, user, key_prefix, sshd_config_fn="/etc/ssh/sshd_config
 
     with util.SeLinuxGuard(ssh_dir, recursive=True):
         try:
-            """
-             AuthorizedKeysFile may contain tokens
-             of the form %T which are substituted during connection set-up.
-             The following tokens are defined: %% is replaced by a literal
-             '%', %h is replaced by the home directory of the user being
-             authenticated and %u is replaced by the username of that user.
-            """
-            ssh_cfg = parse_ssh_config(sshd_config_fn)
+            # AuthorizedKeysFile may contain tokens
+            # of the form %T which are substituted during connection set-up.
+            # The following tokens are defined: %% is replaced by a literal
+            # '%', %h is replaced by the home directory of the user being
+            # authenticated and %u is replaced by the username of that user.
+            ssh_cfg = _parse_ssh_config(sshd_config_fn)
             akeys = ssh_cfg.get("authorizedkeysfile", '')
             akeys = akeys.strip()
             if not akeys:
@@ -193,22 +212,22 @@ def setup_user_keys(keys, user, key_prefix, sshd_config_fn="/etc/ssh/sshd_config
             authorized_keys = akeys
         except (IOError, OSError):
             authorized_keys = os.path.join(ssh_dir, 'authorized_keys')
-            LOG.exception(("Failed extracting 'AuthorizedKeysFile' in ssh config"
-                            " from %s, using 'AuthorizedKeysFile' file %s instead."),
+            LOG.exception(("Failed extracting 'AuthorizedKeysFile'"
+                            " in ssh config"
+                            " from %s, using 'AuthorizedKeysFile' file"
+                            " %s instead"),
                            sshd_config_fn, authorized_keys)
 
-        content = update_authorized_keys(authorized_keys, key_entries)
+        content = _update_authorized_keys(authorized_keys, key_entries)
         util.ensure_dir(os.path.dirname(authorized_keys), mode=0700)
         util.write_file(authorized_keys, content, mode=0600)
         util.chownbyid(authorized_keys, pwent.pw_uid, pwent.pw_gid)
 
 
-def parse_ssh_config(fname):
-    """
-    The file contains keyword-argu-ment pairs, one per line.
-    Lines starting with '#' and empty lines are interpreted as comments.
-    Note: key-words are case-insensitive and arguments are case-sensitive
-    """
+def _parse_ssh_config(fname):
+    # The file contains keyword-argument pairs, one per line.
+    # Lines starting with '#' and empty lines are interpreted as comments.
+    # Note: key-words are case-insensitive and arguments are case-sensitive
     ret = {}
     if not os.path.isfile(fname):
         return ret

From 3a3f2c7744a9279bb2b7d5923bafcd11fd3bfe4e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:18:37 -0700
Subject: [PATCH 066/434] Start using tempita instead of the more complicated
 cheetah.

---
 cloudinit/templater.py | 17 ++++++++++++-----
 1 file changed, 12 insertions(+), 5 deletions(-)

diff --git a/cloudinit/templater.py b/cloudinit/templater.py
index 04cc5a6f..5839911c 100644
--- a/cloudinit/templater.py
+++ b/cloudinit/templater.py
@@ -20,15 +20,22 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-from Cheetah.Template import Template
+from tempita import Template
 
 from cloudinit import util
 
 
-def render_to_file(template_fn, outfile, searchList):
-    contents = Template(file=template_fn, searchList=[searchList]).respond()
+def render_from_file(fn, params):
+    return render_string(util.load_file(fn), params, name=fn)
+
+
+def render_to_file(name, outfile, params):
+    contents = render_from_file(name, params)
     util.write_file(outfile, contents)
 
 
-def render_string(template, searchList):
-    return Template(template, searchList=[searchList]).respond()
+def render_string(content, params, name=None):
+    tpl = Template(content, name=name)
+    if not params:
+        params = dict()
+    return tpl.substitute(params)

From abe89bb5bafdeb921e5d7bbe9712ab0e9915a413 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:19:19 -0700
Subject: [PATCH 067/434] Logging fixups + pylint fixups.

---
 cloudinit/url_helper.py | 92 ++++++++++++++++++++++++-----------------
 1 file changed, 54 insertions(+), 38 deletions(-)

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 6fa3e44b..1bf24c4f 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -20,14 +20,14 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+from contextlib import closing
 
 import errno
+import socket
 import time
 import urllib
 import urllib2
 
-from contextlib import closing
-
 from cloudinit import log as logging
 
 LOG = logging.getLogger(__name__)
@@ -37,46 +37,58 @@ def ok_http_code(st):
     return st in xrange(200, 400)
 
 
-def readurl(url, data=None, timeout=None, retries=0, sec_between=1, headers=None):
-    openargs = {}
-    if timeout is not None:
-        openargs['timeout'] = int(timeout)
+def readurl(url, data=None, timeout=None,
+            retries=0, sec_between=1, headers=None):
 
-    if data is None:
-        req = urllib2.Request(url, headers=headers)
-    else:
-        req = urllib2.Request(url, data=urllib.urlencode(data), headers=headers)
-
-    if retries <= 0:
-        retries = 1
+    req_args = {}
+    req_args['url'] = url
+    if data is not None:
+        req_args['data'] = urllib.urlencode(data)
+    if headers is not None:
+        req_args['headers'] = dict(headers)
+    req = urllib2.Request(**req_args)
 
+    retries = max(retries, 0)
     attempts = retries + 1
-    last_excp = None
-    LOG.debug("Attempting to read from %s with %s attempts to be performed", url, attempts)
+
+    last_excp = Exception("??")
+    LOG.info(("Attempting to read from %s with %s attempts"
+                " (%s retries) to be performed"), url, attempts, retries)
+    open_args = {}
+    if timeout is not None:
+        open_args['timeout'] = int(timeout)
     for i in range(0, attempts):
         try:
-            with closing(urllib2.urlopen(req, **openargs)) as rh:
-                return (rh.read(), rh.getcode())
+            with closing(urllib2.urlopen(req, **open_args)) as rh:
+                content = rh.read()
+                status = rh.getcode()
+                if status is None:
+                    # This seems to happen when files are read...
+                    status = 200
+                LOG.info("Read from %s (%s, %sb) after %s attempts",
+                         url, status, len(content), (i + 1))
+                return (content, status)
         except urllib2.HTTPError as e:
             last_excp = e
             LOG.exception("Failed at reading from %s.", url)
         except urllib2.URLError as e:
             # This can be a message string or
-            # another exception instance (socket.error for remote URLs, OSError for local URLs).
+            # another exception instance 
+            # (socket.error for remote URLs, OSError for local URLs).
             if (isinstance(e.reason, OSError) and
                 e.reason.errno == errno.ENOENT):
                 last_excp = e.reason
             else:
                 last_excp = e
-            LOG.exception("Failed at reading from %s.", url)
+            LOG.exception("Failed at reading from %s", url)
         if i + 1 < attempts:
-            LOG.debug("Please wait %s seconds while we wait to try again.", sec_between)
+            LOG.info("Please wait %s seconds while we wait to try again",
+                     sec_between)
             time.sleep(sec_between)
 
     # Didn't work out
-    LOG.warn("Failed downloading from %s after %s attempts", url, attempts)
-    if last_excp is not None:
-        raise last_excp
+    LOG.warn("Failed reading from %s after %s attempts", url, attempts)
+    raise last_excp
 
 
 def wait_for_url(urls, max_wait=None, timeout=None,
@@ -106,29 +118,29 @@ def wait_for_url(urls, max_wait=None, timeout=None,
     data host (169.254.169.254) may be firewalled off Entirely for a sytem,
     meaning that the connection will block forever unless a timeout is set.
     """
-    starttime = time.time()
+    start_time = time.time()
 
-    def nullstatus_cb(msg):
-        return
+    def log_status_cb(msg):
+        LOG.info(msg)
 
     if status_cb is None:
-        status_cb = nullstatus_cb
+        status_cb = log_status_cb
 
-    def timeup(max_wait, starttime):
+    def timeup(max_wait, start_time):
         return ((max_wait <= 0 or max_wait is None) or
-                (time.time() - starttime > max_wait))
+                (time.time() - start_time > max_wait))
 
     loop_n = 0
     while True:
-        sleeptime = int(loop_n / 5) + 1
+        sleep_time = int(loop_n / 5) + 1
         for url in urls:
             now = time.time()
             if loop_n != 0:
-                if timeup(max_wait, starttime):
+                if timeup(max_wait, start_time):
                     break
-                if timeout and (now + timeout > (starttime + max_wait)):
+                if timeout and (now + timeout > (start_time + max_wait)):
                     # shorten timeout to not run way over max_time
-                    timeout = int((starttime + max_wait) - now)
+                    timeout = int((start_time + max_wait) - now)
 
             reason = ""
             try:
@@ -153,14 +165,18 @@ def wait_for_url(urls, max_wait=None, timeout=None,
             except Exception as e:
                 reason = "unexpected error [%s]" % e
 
-            status_cb("'%s' failed [%s/%ss]: %s" %
-                      (url, int(time.time() - starttime), max_wait,
-                       reason))
+            time_taken = int(time.time() - start_time)
+            status_msg = "Calling '%s' failed [%s/%ss]: %s" % (url,
+                                                             time_taken,
+                                                             max_wait, reason)
+            status_cb(status_msg)
 
-        if timeup(max_wait, starttime):
+        if timeup(max_wait, start_time):
             break
 
         loop_n = loop_n + 1
-        time.sleep(sleeptime)
+        LOG.info("Please wait %s seconds while we wait to try again",
+                 sleep_time)
+        time.sleep(sleep_time)
 
     return False

From 0ea20e40ff185736e6323139fedd77c1d9e11e5d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:19:50 -0700
Subject: [PATCH 068/434] Pylint fixups.

---
 cloudinit/user_data/__init__.py | 19 ++++++++++++-------
 1 file changed, 12 insertions(+), 7 deletions(-)

diff --git a/cloudinit/user_data/__init__.py b/cloudinit/user_data/__init__.py
index 6264a6cc..1910ba28 100644
--- a/cloudinit/user_data/__init__.py
+++ b/cloudinit/user_data/__init__.py
@@ -28,6 +28,7 @@ import email
 
 from email.mime.base import MIMEBase
 
+from cloudinit import importer
 from cloudinit import log as logging
 from cloudinit import util
 
@@ -51,6 +52,7 @@ PART_FN_TPL = 'part-%03d'
 # Used as the content type when a message is not multipart
 # and it doesn't contain its own content-type
 NOT_MULTIPART_TYPE = "text/x-not-multipart"
+OCTET_TYPE = 'application/octet-stream'
 
 # Different file beginnings to there content type
 INCLUSION_TYPES_MAP = {
@@ -86,17 +88,17 @@ class PartHandler(object):
         raise NotImplementedError()
 
 
-def fixup_module(mod):
+def fixup_module(mod, def_freq=PER_INSTANCE):
     if not hasattr(mod, "handler_version"):
         setattr(mod, "handler_version", 1)
     if not hasattr(mod, 'list_types'):
         def empty_types():
             return []
         setattr(mod, 'list_types', empty_types)
-    if not hasattr(mod, frequency):
-        setattr(mod, 'frequency', PER_INSTANCE)
+    if not hasattr(mod, 'frequency'):
+        setattr(mod, 'frequency', def_freq)
     if not hasattr(mod, 'handle_part'):
-        def empty_handler(data, ctype, filename, payload):
+        def empty_handler(_data, _ctype, _filename, _payload):
             pass
         setattr(mod, 'handle_part', empty_handler)
     return mod
@@ -114,7 +116,9 @@ def run_part(mod, data, ctype, filename, payload, frequency):
         else:
             mod.handle_part(data, ctype, filename, payload, frequency)
     except:
-        LOG.exception("Failed calling mod %s (%s, %s, %s) with frequency %s", mod, ctype, filename, mod_ver, frequency)
+        LOG.exception(("Failed calling mod %s (%s, %s, %s)"
+                     " with frequency %s"), mod, ctype, filename,
+                     mod_ver, frequency)
 
 
 def call_begin(mod, data, frequency):
@@ -157,7 +161,8 @@ def walker_callback(pdata, ctype, filename, payload):
                 details = repr(payload)
             LOG.warning("Unhandled non-multipart userdata: %s", details)
         return
-    run_part(handlers[ctype], pdata['data'], ctype, filename, payload, pdata['frequency'])
+    run_part(handlers[ctype], pdata['data'], ctype, filename,
+             payload, pdata['frequency'])
 
 
 # Callback is a function that will be called with 
@@ -182,7 +187,7 @@ def walk(msg, callback, data):
 
 
 # Coverts a raw string into a mime message
-def convert_string(self, raw_data, headers=None):
+def convert_string(raw_data, headers=None):
     if not raw_data:
         raw_data = ''
     if not headers:

From a0bd655876458465150e3ce854dbd6633bdac0ab Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:20:04 -0700
Subject: [PATCH 069/434] Pylint fixups.

---
 cloudinit/user_data/boot_hook.py | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/cloudinit/user_data/boot_hook.py b/cloudinit/user_data/boot_hook.py
index 4ce398ac..87e7a3ec 100644
--- a/cloudinit/user_data/boot_hook.py
+++ b/cloudinit/user_data/boot_hook.py
@@ -60,6 +60,7 @@ class BootHookPartHandler(ud.PartHandler):
             env['INSTANCE_ID'] = str(self.instance_id)
             util.subp([filepath], env=env)
         except util.ProcessExecutionError as e:
-            LOG.error("Boothooks script %s returned %s", filepath, e.exit_code)
+            LOG.error("Boothooks script %s execution error %s", filepath, e)
         except Exception as e:
-            LOG.error("Boothooks unknown exception %s when running %s", e, filepath)
+            LOG.exception(("Boothooks unknown "
+                           "error %s when running %s"), e, filepath)

From e3dc884c46bda328f4c0cd33ae842db426fea7c9 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:20:17 -0700
Subject: [PATCH 070/434] Pylint fixups.

---
 cloudinit/user_data/cloud_config.py | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/cloudinit/user_data/cloud_config.py b/cloudinit/user_data/cloud_config.py
index 1c43f3a1..f0e88eeb 100644
--- a/cloudinit/user_data/cloud_config.py
+++ b/cloudinit/user_data/cloud_config.py
@@ -20,9 +20,6 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-
-import os
-
 from cloudinit import log as logging
 from cloudinit import user_data as ud
 from cloudinit import util
@@ -56,4 +53,4 @@ class CloudConfigPartHandler(ud.PartHandler):
 
         filename = util.clean_filename(filename)
         entry = "\n".join(["#%s" % (filename), str(payload)])
-        self.config_buf.append(entry)
+        self.cloud_buf.append(entry)

From f737e6facf23f511004660f409bf6bd6a024debc Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:20:35 -0700
Subject: [PATCH 071/434] Use common yaml loading function + pylint cleanups.

---
 cloudinit/user_data/processor.py | 31 +++++++++++++++----------------
 1 file changed, 15 insertions(+), 16 deletions(-)

diff --git a/cloudinit/user_data/processor.py b/cloudinit/user_data/processor.py
index d4de9470..6e796f1c 100644
--- a/cloudinit/user_data/processor.py
+++ b/cloudinit/user_data/processor.py
@@ -22,14 +22,12 @@
 
 import hashlib
 import os
-import urllib
 
 from email.mime.multipart import MIMEMultipart
 from email.mime.text import MIMEText
 from email.mime.base import MIMEBase
 
-import yaml
-
+from cloudinit import log as logging
 from cloudinit import url_helper
 from cloudinit import user_data as ud
 from cloudinit import util
@@ -46,8 +44,12 @@ OCTET_TYPE = 'application/octet-stream'
 ATTACHMENT_FIELD = 'Number-Attachments'
 
 # This will be used to create a filename from a url (or like) entry
-# When we want to make sure a entry isn't included more than once across sessions.
+# When we want to make sure a entry isn't included
+# more than once across sessions.
 INCLUDE_ONCE_HASHER = 'md5'
+MAX_INCLUDE_FN_LEN = 64
+
+LOG = logging.getLogger(__name__)
 
 
 class UserDataProcessor(object):
@@ -97,8 +99,10 @@ class UserDataProcessor(object):
     def _get_include_once_filename(self, entry):
         msum = hashlib.new(INCLUDE_ONCE_HASHER)
         msum.update(entry)
-        entry_fn = msum.hexdigest()[0:64]  # Don't get to long now
-        return os.path.join(self.paths.get_ipath_cur('data'), 'urlcache', entry_fn)
+        # Don't get to long now
+        entry_fn = msum.hexdigest()[0:MAX_INCLUDE_FN_LEN]
+        return os.path.join(self.paths.get_ipath_cur('data'),
+                            'urlcache', entry_fn)
 
     def _do_include(self, content, append_msg):
         # is just a list of urls, one per line
@@ -132,17 +136,11 @@ class UserDataProcessor(object):
             self._process_msg(new_msg, append_msg)
 
     def _explode_archive(self, archive, append_msg):
-        try:
-            entries = yaml.load(archive)
-        except:
-            entries = []
-        if not isinstance(entries, (list, set)):
-            # TODO raise?
-            entries = []
-
+        entries = util.load_yaml(archive, default=[], allowed=[list, set])
         for ent in entries:
             # ent can be one of:
-            #  dict { 'filename' : 'value', 'content' : 'value', 'type' : 'value' }
+            #  dict { 'filename' : 'value', 'content' :
+            #       'value', 'type' : 'value' }
             #    filename and type not be present
             # or
             #  scalar(payload)
@@ -165,7 +163,8 @@ class UserDataProcessor(object):
                 msg.set_payload(content)
 
             if 'filename' in ent:
-                msg.add_header('Content-Disposition', 'attachment', filename=ent['filename'])
+                msg.add_header('Content-Disposition', 'attachment',
+                                filename=ent['filename'])
 
             for header in ent.keys():
                 if header in ('content', 'filename', 'type'):

From 9a64b561f876c612f1fb99e1ae565f73b2a7462c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:20:57 -0700
Subject: [PATCH 072/434] Pylint cleanups.

---
 cloudinit/user_data/shell_script.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/cloudinit/user_data/shell_script.py b/cloudinit/user_data/shell_script.py
index d666b9c4..564e4623 100644
--- a/cloudinit/user_data/shell_script.py
+++ b/cloudinit/user_data/shell_script.py
@@ -20,14 +20,13 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-
 import os
 
 from cloudinit import log as logging
 from cloudinit import user_data as ud
 from cloudinit import util
 
-from cloudinit.settings import (PER_INSTANCE)
+from cloudinit.settings import (PER_ALWAYS)
 
 LOG = logging.getLogger(__name__)
 
@@ -45,9 +44,10 @@ class ShellScriptPartHandler(ud.PartHandler):
 
     def _handle_part(self, _data, ctype, filename, payload, _frequency):
         if ctype in ud.CONTENT_SIGNALS:
-            # maybe delete existing things here
+            # TODO: maybe delete existing things here
             return
 
         filename = util.clean_filename(filename)
         payload = util.dos2unix(payload)
-        util.write_file(os.path.join(self.script_dir, filename), payload, 0700)
+        path = os.path.join(self.script_dir, filename)
+        util.write_file(path, payload, 0700)

From 26d8911f40238a2c3cdba922caf84361ba405482 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:21:09 -0700
Subject: [PATCH 073/434] Pylint cleanups.

---
 cloudinit/user_data/upstart_job.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/cloudinit/user_data/upstart_job.py b/cloudinit/user_data/upstart_job.py
index d15e66c4..568a644a 100644
--- a/cloudinit/user_data/upstart_job.py
+++ b/cloudinit/user_data/upstart_job.py
@@ -46,11 +46,14 @@ class UpstartJobPartHandler(ud.PartHandler):
         if ctype in ud.CONTENT_SIGNALS:
             return
 
-        filename = utils.clean_filename(filename)
-        (name, ext) = os.path.splitext(filename)
+        filename = util.clean_filename(filename)
+        (_name, ext) = os.path.splitext(filename)
+        if not ext:
+            ext = ''
         ext = ext.lower()
         if ext != ".conf":
             filename = filename + ".conf"
 
         payload = util.dos2unix(payload)
-        util.write_file(os.path.join(self.upstart_dir, filename), payload, 0644)
+        path = os.path.join(self.upstart_dir, filename)
+        util.write_file(path, payload, 0644)

From 5b09eaa3af96f760bce23aaf470c506ad9b49bc1 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 17:21:43 -0700
Subject: [PATCH 074/434] Pylint cleanups, add a load yaml function that
 handles errors nicely + other cleanups.

---
 cloudinit/util.py | 295 ++++++++++++++++++++++++++++++++++++----------
 1 file changed, 232 insertions(+), 63 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 5930ff3f..6cf75916 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -23,6 +23,8 @@
 from StringIO import StringIO
 
 import contextlib
+import copy
+import errno
 import glob
 import grp
 import gzip
@@ -32,6 +34,8 @@ import pwd
 import shutil
 import socket
 import subprocess
+import sys
+import tempfile
 import types
 import urlparse
 
@@ -40,6 +44,8 @@ import yaml
 from cloudinit import log as logging
 from cloudinit import url_helper as uhelp
 
+from cloudinit.settings import (CFG_BUILTIN, CLOUD_CONFIG)
+
 
 try:
     import selinux
@@ -55,6 +61,9 @@ FN_REPLACEMENTS = {
     os.sep: '_',
 }
 
+# Helper utils to see if running in a container
+CONTAINER_TESTS = ['running-in-container', 'lxc-is-container']
+
 
 class ProcessExecutionError(IOError):
 
@@ -112,12 +121,17 @@ class SeLinuxGuard(object):
     def __enter__(self):
         return self.engaged
 
-    def __exit__(self, type, value, traceback):
+    def __exit__(self, excp_type, excp_value, excp_traceback):
         if self.engaged:
-            LOG.debug("Disengaging selinux mode for %s: %s", self.path, self.recursive)
+            LOG.debug("Disengaging selinux mode for %s: %s",
+                      self.path, self.recursive)
             selinux.restorecon(self.path, recursive=self.recursive)
 
 
+class MountFailedError(Exception):
+    pass
+
+
 def translate_bool(val):
     if not val:
         return False
@@ -130,14 +144,12 @@ def translate_bool(val):
 
 def read_conf(fname):
     try:
-        mp = yaml.load(load_file(fname))
-        if not isinstance(mp, (dict)):
-            return {}
-        return mp
+        return load_yaml(load_file(fname), default={})
     except IOError as e:
         if e.errno == errno.ENOENT:
             return {}
-        raise
+        else:
+            raise
 
 
 def clean_filename(fn):
@@ -148,8 +160,9 @@ def clean_filename(fn):
 
 def decomp_str(data):
     try:
-        uncomp = gzip.GzipFile(None, "rb", 1, StringIO(data)).read()
-        return uncomp
+        buf = StringIO(str(data))
+        with contextlib.closing(gzip.GzipFile(None, "rb", 1, buf)) as gh:
+            return gh.read()
     except:
         return data
 
@@ -180,16 +193,13 @@ def is_ipv4(instr):
     return (len(toks) == 4)
 
 
-def get_base_cfg(cfgfile, cfg_builtin=None):
+def merge_base_cfg(cfgfile, cfg_builtin=None):
     syscfg = read_conf_with_confd(cfgfile)
 
     kern_contents = read_cc_from_cmdline()
     kerncfg = {}
     if kern_contents:
-        try:
-            kerncfg = yaml.load(kern_contents)
-        except:
-            pass
+        kerncfg = load_yaml(kern_contents, default={})
 
     # kernel parameters override system config
     combined = mergedict(kerncfg, syscfg)
@@ -265,8 +275,9 @@ def obj_name(obj):
 
 def mergedict(src, cand):
     """
-    Merge values from C{cand} into C{src}. If C{src} has a key C{cand} will
-    not override. Nested dictionaries are merged recursively.
+    Merge values from C{cand} into C{src}.
+    If C{src} has a key C{cand} will not override.
+    Nested dictionaries are merged recursively.
     """
     if isinstance(src, dict) and isinstance(cand, dict):
         for k, v in cand.iteritems():
@@ -276,9 +287,11 @@ def mergedict(src, cand):
                 src[k] = mergedict(src[k], v)
     else:
         if not isinstance(src, dict):
-            raise TypeError("Attempting to merge a non dictionary source type: %s" % (type(src)))
+            raise TypeError(("Attempting to merge a non dictionary "
+                             "source type: %s") % (obj_name(src)))
         if not isinstance(cand, dict):
-            raise TypeError("Attempting to merge a non dictionary candiate type: %s" % (type(cand)))
+            raise TypeError(("Attempting to merge a non dictionary "
+                             "candidate type: %s") % (obj_name(cand)))
     return src
 
 
@@ -308,8 +321,9 @@ def del_dir(path):
     shutil.rmtree(path)
 
 
-# get keyid from keyserver
+# get gpg keyid from keyserver
 def getkeybyid(keyid, keyserver):
+    # TODO fix this...
     shcmd = """
     k=${1} ks=${2};
     exec 2>/dev/null
@@ -323,7 +337,7 @@ def getkeybyid(keyid, keyserver):
     [ -n "${armour}" ] && echo "${armour}"
     """
     args = ['sh', '-c', shcmd, "export-gpg-keyid", keyid, keyserver]
-    (stdout, stderr) = subp(args)
+    (stdout, _stderr) = subp(args)
     return stdout
 
 
@@ -340,11 +354,12 @@ def runparts(dirp, skip_no_exist=True):
             try:
                 subp([exe_path])
             except ProcessExecutionError as e:
-                LOG.exception("Failed running %s [%i]", exe_path, e.exit_code)
+                LOG.exception("Failed running %s [%s]", exe_path, e.exit_code)
                 failed += 1
 
     if failed and attempted:
-        raise RuntimeError('runparts: %i failures in %i attempted commands' % (failed, attempted))
+        raise RuntimeError('Runparts: %s failures in %s attempted commands'
+                           % (failed, attempted))
 
 
 # read_optional_seed
@@ -363,6 +378,32 @@ def read_optional_seed(fill, base="", ext="", timeout=5):
         raise
 
 
+def read_file_or_url(url, timeout, retries, file_retries):
+    if url.startswith("/"):
+        url = "file://%s" % url
+    if url.startswith("file://"):
+        retries = file_retries
+    return uhelp.readurl(url, timeout=timeout, retries=retries)
+
+
+def load_yaml(blob, default=None, allowed=(dict,)):
+    loaded = default
+    try:
+        blob = str(blob)
+        LOG.debug(("Attempting to load yaml from string "
+                 "of length %s with allowed root types %s"), 
+                 len(blob), allowed)
+        converted = yaml.load(blob)
+        if not isinstance(converted, allowed):
+            # Yes this will just be caught, but thats ok for now...
+            raise TypeError("Yaml load allows %s types, but got %s instead" %
+                            (allowed, obj_name(converted)))
+        loaded = converted
+    except (yaml.YAMLError, TypeError, ValueError) as exc:
+        LOG.exception("Failed loading yaml due to: %s", exc)
+    return loaded
+
+
 def read_seeded(base="", ext="", timeout=5, retries=10, file_retries=0):
     if base.startswith("/"):
         base = "file://%s" % base
@@ -378,13 +419,16 @@ def read_seeded(base="", ext="", timeout=5, retries=10, file_retries=0):
         ud_url = "%s%s%s" % (base, "user-data", ext)
         md_url = "%s%s%s" % (base, "meta-data", ext)
 
-    (md_str, msc) = uhelp.readurl(md_url, timeout=timeout, retries=retries)
-    (ud, usc) = uhelp.readurl(ud_url, timeout=timeout, retries=retries)
+    (md_str, msc) = read_file_or_url(md_url, timeout, retries, file_retries)
     md = None
     if md_str and uhelp.ok_http_code(msc):
-        md = yaml.load(md_str)
-    if not uhelp.ok_http_code(usc):
-        ud = None
+        md = load_yaml(md_str, default={})
+
+    (ud_str, usc) = read_file_or_url(ud_url, timeout, retries, file_retries)
+    ud = None
+    if ud_str and uhelp.ok_http_code(usc):
+        ud = ud_str
+
     return (md, ud)
 
 
@@ -410,13 +454,14 @@ def read_conf_with_confd(cfgfile):
 
     confd = False
     if "conf_d" in cfg:
-        if cfg['conf_d'] is not None:
-            confd = cfg['conf_d']
-            if not isinstance(confd, (str)):
-                raise RuntimeError(("Config file %s contains 'conf_d' "
-                                    "with non-string") % (cfgfile))
+        confd = cfg['conf_d']
+        if confd:
+            if not isinstance(confd, (str, basestring)):
+                raise TypeError(("Config file %s contains 'conf_d' "
+                                 "with non-string type %s") %
+                                 (cfgfile, obj_name(confd)))
             else:
-                confd = confd.strip()
+                confd = str(confd).strip()
     elif os.path.isdir("%s.d" % cfgfile):
         confd = "%s.d" % cfgfile
 
@@ -490,26 +535,41 @@ def get_hostname_fqdn(cfg, cloud):
 
 
 def get_fqdn_from_hosts(hostname, filename="/etc/hosts"):
-    # this parses /etc/hosts to get a fqdn.  It should return the same
-    # result as 'hostname -f <hostname>' if /etc/hosts.conf
-    # did not have did not have 'bind' in the order attribute
+    """
+    For each host a single line should be present with
+      the following information:
+    
+	     IP_address canonical_hostname [aliases...]
+    
+      Fields of the entry are separated by any number of  blanks  and/or  tab
+      characters.  Text  from	a "#" character until the end of the line is a
+      comment, and is ignored.	 Host  names  may  contain  only  alphanumeric
+      characters, minus signs ("-"), and periods (".").  They must begin with
+      an  alphabetic  character  and  end  with  an  alphanumeric  character.
+      Optional aliases provide for name changes, alternate spellings, shorter
+      hostnames, or generic hostnames (for example, localhost).
+    """
     fqdn = None
     try:
         for line in load_file(filename).splitlines():
             hashpos = line.find("#")
             if hashpos >= 0:
                 line = line[0:hashpos]
-            toks = line.split()
-        
-            # if there there is less than 3 entries (ip, canonical, alias)
+            line = line.strip()
+            if not line:
+                continue
+
+            # If there there is less than 3 entries 
+            # (IP_address, canonical_hostname, alias)
             # then ignore this line
+            toks = line.split()
             if len(toks) < 3:
                 continue
-        
+
             if hostname in toks[2:]:
                 fqdn = toks[1]
                 break
-    except IOError as e:
+    except IOError:
         pass
     return fqdn
 
@@ -584,7 +644,7 @@ def close_stdin():
         os.dup2(fp.fileno(), sys.stdin.fileno())
 
 
-def find_devs_with(criteria):
+def find_devs_with(criteria=None):
     """
     find devices matching given criteria (via blkid)
     criteria can be *one* of:
@@ -593,10 +653,26 @@ def find_devs_with(criteria):
       UUID=<uuid>
     """
     try:
-        (out, _err) = subp(['blkid', '-t%s' % criteria, '-odevice'])
+        blk_id_cmd = ['blkid']
+        if criteria:
+            # Search for block devices with tokens named NAME that 
+            # have the value 'value' and display any devices which are found.
+            # Common values for NAME include  TYPE, LABEL, and UUID.
+            # If there are no devices specified on the command line,
+            # all block devices will be searched; otherwise, 
+            # only search the devices specified by the user.
+            blk_id_cmd.append("-t%s" % (criteria))
+        # Only print the device name
+        blk_id_cmd.append('-odevice')
+        (out, _err) = subp(blk_id_cmd)
+        entries = []
+        for line in out.splitlines():
+            line = line.strip()
+            if line:
+                entries.append(line)
+        return entries
     except ProcessExecutionError:
         return []
-    return (out.splitlines())
 
 
 def load_file(fname, read_cb=None):
@@ -604,7 +680,10 @@ def load_file(fname, read_cb=None):
     with open(fname, 'rb') as fh:
         ofh = StringIO()
         pipe_in_out(fh, ofh, chunk_cb=read_cb)
-        return ofh.getvalue()
+        ofh.flush()
+        contents = ofh.getvalue()
+        LOG.debug("Read %s bytes from %s", len(contents), fname)
+        return contents
 
 
 def get_cmdline():
@@ -620,7 +699,8 @@ def get_cmdline():
 
 def pipe_in_out(in_fh, out_fh, chunk_size=1024, chunk_cb=None):
     bytes_piped = 0
-    LOG.debug("Transferring the contents of %s to %s in chunks of size %s.", in_fh, out_fh, chunk_size)
+    LOG.debug(("Transferring the contents of %s "
+             "to %s in chunks of size %sb"), in_fh, out_fh, chunk_size)
     while True:
         data = in_fh.read(chunk_size)
         if data == '':
@@ -658,15 +738,87 @@ def ensure_dirs(dirlist, mode=0755):
 
 def ensure_dir(path, mode=0755):
     if not os.path.isdir(path):
-        fixmodes = []
-        LOG.debug("Ensuring directory exists at path %s (perms=%s)", dir_name, mode)
-        try:
-            os.makedirs(path)
-        except OSError as e:
-            if e.errno != errno.EEXIST:
-                raise e
-        if mode is not None:
-            os.chmod(path, mode)
+        # Make the dir and adjust the mode
+        LOG.debug("Ensuring directory exists at path %s", path)
+        os.makedirs(path)
+        chmod(path, mode)
+    else:
+        # Just adjust the mode
+        chmod(path, mode)
+
+
+def get_base_cfg(cfg_path=None):
+    if not cfg_path:
+        cfg_path = CLOUD_CONFIG
+    return merge_base_cfg(cfg_path, get_builtin_cfg())
+
+
+@contextlib.contextmanager
+def unmounter(umount):
+    try:
+        yield umount
+    finally:
+        if umount:
+            umount_cmd = ["umount", '-l', umount]
+            subp(umount_cmd)
+
+
+def mounts():
+    mounted = {}
+    try:
+        # Go through mounts to see if it was already mounted
+        mount_locs = load_file("/proc/mounts").splitlines()
+        for mpline in mount_locs:
+            # Format at: http://linux.die.net/man/5/fstab
+            try:
+                (dev, mp, fstype, _opts, _freq, _passno) = mpline.split()
+            except:
+                continue
+            # If the name of the mount point contains spaces these 
+            # can be escaped as '\040', so undo that..
+            mp = mp.replace("\\040", " ")
+            mounted[dev] = (dev, fstype, mp, False)
+    except (IOError, OSError):
+        pass
+    return mounted
+
+
+def mount_cb(device, callback, data=None, rw=False):
+    """
+    Mount the device, call method 'callback' passing the directory
+    in which it was mounted, then unmount.  Return whatever 'callback'
+    returned.  If data != None, also pass data to callback.
+    """
+    mounted = mounts()
+    with tempdir() as tmpd:
+        umount = False
+        if device in mounted:
+            mountpoint = "%s/" % mounted[device][2]
+        else:
+            try:
+                mountcmd = ['mount', "-o"]
+                if rw:
+                    mountcmd.append('rw')
+                else:
+                    mountcmd.append('ro')
+                mountcmd.append(device)
+                mountcmd.append(tmpd)
+                subp(mountcmd)
+                umount = tmpd
+            except IOError as exc:
+                raise MountFailedError("%s" % (exc))
+            mountpoint = "%s/" % tmpd
+        with unmounter(umount):
+            if data is None:
+                ret = callback(mountpoint)
+            else:
+                ret = callback(mountpoint, data)
+            return ret
+
+
+def get_builtin_cfg():
+    # Deep copy so that others can't modify
+    return copy.deepcopy(CFG_BUILTIN)
 
 
 def sym_link(source, link):
@@ -687,6 +839,18 @@ def ensure_file(path):
     write_file(path, content='', omode="ab")
 
 
+def chmod(path, mode):
+    real_mode = None
+    try:
+        real_mode = int(mode)
+    except (ValueError, TypeError):
+        pass
+    if path and real_mode:
+        LOG.debug("Adjusting the permissions of %s (perms=%o)",
+                 path, real_mode)
+        os.chmod(path, real_mode)
+
+
 def write_file(filename, content, mode=0644, omode="wb"):
     """
     Writes a file with the given content and sets the file mode as specified.
@@ -698,13 +862,12 @@ def write_file(filename, content, mode=0644, omode="wb"):
     @param omode: The open mode used when opening the file (r, rb, a, etc.)
     """
     ensure_dir(os.path.dirname(filename))
-    LOG.debug("Writing to %s - %s (perms=%s) %s bytes", filename, omode, mode, len(content))
+    LOG.debug("Writing to %s - %s, %s bytes", filename, omode, len(content))
     with open(filename, omode) as fh:
         with SeLinuxGuard(filename):
             fh.write(content)
             fh.flush()
-            if mode is not None:
-                os.chmod(filename, mode)
+            chmod(filename, mode)
 
 
 def delete_dir_contents(dirname):
@@ -725,7 +888,8 @@ def subp(args, input_data=None, allowed_rc=None, env=None):
     if allowed_rc is None:
         allowed_rc = [0]
     try:
-        LOG.debug("Running command %s with allowed return codes %s", args, allowed_rc)
+        LOG.debug("Running command %s with allowed return codes %s",
+                  args, allowed_rc)
         sp = subprocess.Popen(args, stdout=subprocess.PIPE,
             stderr=subprocess.PIPE, stdin=subprocess.PIPE,
             env=env)
@@ -768,14 +932,16 @@ def shellify(cmdlist, add_header=True):
 
 
 def is_container():
-    # is this code running in a container of some sort
+    """
+    Checks to see if this code running in a container of some sort
+    """
 
-    for helper in ('running-in-container', 'lxc-is-container'):
+    for helper in CONTAINER_TESTS:
         try:
             # try to run a helper program. if it returns true/zero
             # then we're inside a container. otherwise, no
             cmd = [helper]
-            (stdout, stderr) = subp(cmd, allowed_rc=[0])
+            subp(cmd, allowed_rc=[0])
             return True
         except (IOError, OSError):
             pass
@@ -812,7 +978,10 @@ def is_container():
 
 
 def get_proc_env(pid):
-    # return the environment in a dict that a given process id was started with
+    """
+    Return the environment in a dict that a given process id was started with.
+    """
+
     env = {}
     fn = os.path.join("/proc/", str(pid), "environ")
     try:

From 6418e9b2e809872a5e186176894f6e61fb3184dc Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 18:01:45 -0700
Subject: [PATCH 075/434] Add initial network writing here.

---
 cloudinit/distros/ubuntu.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index d19ef63e..ccf2cec4 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -39,7 +39,7 @@ class Distro(distros.Distro):
         self.apt_get('install', pkglist)
 
     def apply_network(self, settings):
-        pass
+        util.write_file("/etc/network/interfaces", settings)
 
     # apt_get top level command (install, update...), and args to pass it
     def apt_get(self, tlc, args=None):

From f90fbe35045513202db029b178f3391550cfdd0a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 18:01:59 -0700
Subject: [PATCH 076/434] Fix log statement.

---
 cloudinit/helpers.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 0bd13c78..16548001 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -260,8 +260,8 @@ class Paths(object):
     def get_ipath(self, name=None):
         ipath = self._get_ipath(name)
         if not ipath:
-            LOG.warn(("No per instance semaphores available, "
-                              "is there an datasource/iid set?"))
+            LOG.warn(("No per instance data available, "
+                      "is there an datasource/iid set?"))
             return None
         else:
             return ipath

From 7dc7729c24ba134bf2ddb4d38f57a317bfc6dc93 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 18:02:32 -0700
Subject: [PATCH 077/434] Fix logging + fetch user data before user data
 content handlers are activated.

---
 cloudinit/stages.py | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 55ad143d..2cb9d0ec 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -124,7 +124,6 @@ class Init(object):
                 util.chownbyname(log_file, u, g)
 
     def _read_cfg(self):
-        # Deep copy so that
         b_config = util.get_builtin_cfg()
         try:
             conf = util.get_base_cfg()
@@ -279,8 +278,10 @@ class Init(object):
         data = cloud.Cloud(self.datasource,
                            self.paths, copy.deepcopy(self.cfg))
 
-        # Init the handlers first
         # Ensure userdata fetched before activation
+        ud_obj = data.get_userdata()
+
+        # Init the handlers first
         called = []
         for (_mtype, mod) in c_handlers.iteritems():
             if mod in called:
@@ -294,9 +295,12 @@ class Init(object):
             'handlerdir': idir,
             'data': data, 
             'frequency': frequency,
+            # This will be used when new handlers are found
+            # to help write there contents to files with numbered
+            # names...
             'handlercount': 0,
         }
-        ud.walk(data.get_userdata(), ud.walker_callback, data=part_data)
+        ud.walk(ud_obj, ud.walker_callback, data=part_data)
 
         # Give callbacks opportunity to finalize
         called = []

From d4c6ebff56be48eb6282709d0a87c4c5f9a7f247 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 18:02:56 -0700
Subject: [PATCH 078/434] Fix this up to work with new
 utils/logging/datasource...

---
 cloudinit/sources/DataSourceConfigDrive.py | 216 ++++++++++-----------
 1 file changed, 108 insertions(+), 108 deletions(-)

diff --git a/cloudinit/sources/DataSourceConfigDrive.py b/cloudinit/sources/DataSourceConfigDrive.py
index 2db4a76a..ca4bb7cf 100644
--- a/cloudinit/sources/DataSourceConfigDrive.py
+++ b/cloudinit/sources/DataSourceConfigDrive.py
@@ -14,54 +14,61 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.DataSource as DataSource
-
-from cloudinit import seeddir as base_seeddir
-from cloudinit import log
-import cloudinit.util as util
-import os.path
-import os
 import json
-import subprocess
+import os
 
+from cloudinit import log as logging
+from cloudinit import sources
+from cloudinit import util
+
+LOG = logging.getLogger(__name__)
 DEFAULT_IID = "iid-dsconfigdrive"
+DEFAULT_MODE = 'pass'
+CFG_DRIVE_FILES = [
+    "etc/network/interfaces",
+    "root/.ssh/authorized_keys",
+    "meta.js",
+]
+DEFAULT_METADATA = {
+    "instance-id": DEFAULT_IID, 
+    "dsmode": DEFAULT_MODE,
+}
+IF_UP_CMD = ['ifup', '--all']
+CFG_DRIVE_DEV_ENV = 'CLOUD_INIT_CONFIG_DRIVE_DEVICE'
 
 
-class DataSourceConfigDrive(DataSource.DataSource):
-    seed = None
-    seeddir = base_seeddir + '/config_drive'
-    cfg = {}
-    userdata_raw = None
-    metadata = None
-    dsmode = "local"
+class DataSourceConfigDrive(sources.DataSource):
+    def __init__(self, sys_cfg, distro, paths):
+        sources.DataSource.__init__(self, sys_cfg, distro, paths)
+        self.seed = None
+        self.cfg = {}
+        self.dsmode = 'local'
+        self.seed_dir = os.path.join(self.paths.seed_dir, 'config_drive')
 
     def __str__(self):
-        mstr = "DataSourceConfigDrive[%s]" % self.dsmode
-        mstr = mstr + " [seed=%s]" % self.seed
-        return(mstr)
+        mstr = "%s[%s]" % (util.obj_name(self), self.dsmode)
+        mstr = mstr + " [seed=%s]" % (self.seed)
+        return mstr
 
     def get_data(self):
         found = None
         md = {}
         ud = ""
 
-        defaults = {"instance-id": DEFAULT_IID, "dsmode": "pass"}
-
-        if os.path.isdir(self.seeddir):
+        if os.path.isdir(self.seed_dir):
             try:
-                (md, ud) = read_config_drive_dir(self.seeddir)
-                found = self.seeddir
-            except nonConfigDriveDir:
-                pass
-
+                (md, ud) = read_config_drive_dir(self.seed_dir)
+                found = self.seed_dir
+            except NonConfigDriveDir:
+                LOG.exception("Failed reading config drive from %s",
+                              self.seed_dir)
         if not found:
-            dev = cfg_drive_device()
+            dev = find_cfg_drive_device()
             if dev:
                 try:
-                    (md, ud) = util.mount_callback_umount(dev,
-                        read_config_drive_dir)
+                    (md, ud) = util.mount_cb(dev, read_config_drive_dir)
                     found = dev
-                except (nonConfigDriveDir, util.mountFailedError):
+                except (NonConfigDriveDir, util.MountFailedError):
                     pass
 
         if not found:
@@ -70,25 +77,24 @@ class DataSourceConfigDrive(DataSource.DataSource):
         if 'dsconfig' in md:
             self.cfg = md['dscfg']
 
-        md = util.mergedict(md, defaults)
+        md = util.mergedict(md, DEFAULT_METADATA)
 
-        # update interfaces and ifup only on the local datasource
+        # Update interfaces and ifup only on the local datasource
         # this way the DataSourceConfigDriveNet doesn't do it also.
         if 'network-interfaces' in md and self.dsmode == "local":
             if md['dsmode'] == "pass":
-                log.info("updating network interfaces from configdrive")
+                LOG.info("Updating network interfaces from configdrive")
             else:
-                log.debug("updating network interfaces from configdrive")
+                LOG.debug("Updating network interfaces from configdrive")
 
-            util.write_file("/etc/network/interfaces",
-                md['network-interfaces'])
+            self.distro.apply_network(md['network-interfaces'])
             try:
-                (out, err) = util.subp(['ifup', '--all'])
-                if len(out) or len(err):
-                    log.warn("ifup --all had stderr: %s" % err)
-
-            except subprocess.CalledProcessError as exc:
-                log.warn("ifup --all failed: %s" % (exc.output[1]))
+                (_out, err) = util.subp(IF_UP_CMD)
+                if len(err):
+                    LOG.warn("Running %s resulted in stderr output: %s",
+                             IF_UP_CMD, err)
+            except util.ProcessExecutionError:
+                LOG.exception("Running %s failed", IF_UP_CMD)
 
         self.seed = found
         self.metadata = md
@@ -97,99 +103,107 @@ class DataSourceConfigDrive(DataSource.DataSource):
         if md['dsmode'] == self.dsmode:
             return True
 
-        log.debug("%s: not claiming datasource, dsmode=%s" %
-            (self, md['dsmode']))
+        LOG.debug("%s: not claiming datasource, dsmode=%s", self, md['dsmode'])
         return False
 
     def get_public_ssh_keys(self):
         if not 'public-keys' in self.metadata:
-            return([])
-        return(self.metadata['public-keys'])
+            return []
+        return list(self.metadata['public-keys'])
 
-    # the data sources' config_obj is a cloud-config formated
+    # The data sources' config_obj is a cloud-config formated
     # object that came to it from ways other than cloud-config
     # because cloud-config content would be handled elsewhere
     def get_config_obj(self):
-        return(self.cfg)
+        return self.cfg
 
 
 class DataSourceConfigDriveNet(DataSourceConfigDrive):
-    dsmode = "net"
+    def __init__(self, sys_cfg, paths):
+        DataSourceConfigDrive.__init__(self, sys_cfg, paths)
+        self.dsmode = 'net'
 
 
-class nonConfigDriveDir(Exception):
+class NonConfigDriveDir(Exception):
     pass
 
 
-def cfg_drive_device():
-    """ get the config drive device.  return a string like '/dev/vdb'
+def find_cfg_drive_device():
+    """ Get the config drive device.  Return a string like '/dev/vdb'
         or None (if there is no non-root device attached). This does not
         check the contents, only reports that if there *were* a config_drive
         attached, it would be this device.
-        per config_drive documentation, this is
-         "associated as the last available disk on the instance"
+        Note: per config_drive documentation, this is
+        "associated as the last available disk on the instance"
     """
 
-    if 'CLOUD_INIT_CONFIG_DRIVE_DEVICE' in os.environ:
-        return(os.environ['CLOUD_INIT_CONFIG_DRIVE_DEVICE'])
-
-    # we are looking for a raw block device (sda, not sda1) with a vfat
-    # filesystem on it.
+    # This seems to be for debugging??
+    if CFG_DRIVE_DEV_ENV in os.environ:
+        return os.environ[CFG_DRIVE_DEV_ENV]
 
+    # We are looking for a raw block device (sda, not sda1) with a vfat
+    # filesystem on it....
     letters = "abcdefghijklmnopqrstuvwxyz"
     devs = util.find_devs_with("TYPE=vfat")
 
-    # filter out anything not ending in a letter (ignore partitions)
+    # Filter out anything not ending in a letter (ignore partitions)
     devs = [f for f in devs if f[-1] in letters]
 
-    # sort them in reverse so "last" device is first
+    # Sort them in reverse so "last" device is first
     devs.sort(reverse=True)
 
-    if len(devs):
-        return(devs[0])
+    if devs:
+        return devs[0]
 
-    return(None)
+    return None
 
 
 def read_config_drive_dir(source_dir):
     """
     read_config_drive_dir(source_dir):
        read source_dir, and return a tuple with metadata dict and user-data
-       string populated.  If not a valid dir, raise a nonConfigDriveDir
+       string populated.  If not a valid dir, raise a NonConfigDriveDir
     """
-    md = {}
-    ud = ""
 
-    flist = ("etc/network/interfaces", "root/.ssh/authorized_keys", "meta.js")
-    found = [f for f in flist if os.path.isfile("%s/%s" % (source_dir, f))]
-    keydata = ""
+    # TODO: fix this for other operating systems...
+    # Ie: this is where https://fedorahosted.org/netcf/ or similar should
+    # be hooked in... (or could be)
+    found = {}
+    for af in CFG_DRIVE_FILES:
+        fn = os.path.join(source_dir, af)
+        if os.path.isfile(fn):
+            found[af] = fn
 
     if len(found) == 0:
-        raise nonConfigDriveDir("%s: %s" % (source_dir, "no files found"))
+        raise NonConfigDriveDir("%s: %s" % (source_dir, "no files found"))
 
+    md = {}
+    ud = ""
+    keydata = ""
     if "etc/network/interfaces" in found:
-        with open("%s/%s" % (source_dir, "/etc/network/interfaces")) as fp:
-            md['network-interfaces'] = fp.read()
+        fn = found["etc/network/interfaces"]
+        md['network-interfaces'] = util.load_file(fn)
 
     if "root/.ssh/authorized_keys" in found:
-        with open("%s/%s" % (source_dir, "root/.ssh/authorized_keys")) as fp:
-            keydata = fp.read()
+        fn = found["root/.ssh/authorized_keys"]
+        keydata = util.load_file(fn)
 
     meta_js = {}
-
     if "meta.js" in found:
-        content = ''
-        with open("%s/%s" % (source_dir, "meta.js")) as fp:
-            content = fp.read()
-        md['meta_js'] = content
+        fn = found['meta.js']
+        content = util.load_file(fn)
         try:
+            # Just check if its really json...
             meta_js = json.loads(content)
-        except ValueError:
-            raise nonConfigDriveDir("%s: %s" %
-                (source_dir, "invalid json in meta.js"))
+            if not isinstance(meta_js, (dict)):
+                raise TypeError("Dict expected for meta.js root node")
+        except (ValueError, TypeError) as e:
+            raise NonConfigDriveDir("%s: %s, %s" %
+                (source_dir, "invalid json in meta.js", e))
+        md['meta_js'] = content
 
+    # Key data override??
     keydata = meta_js.get('public-keys', keydata)
-
     if keydata:
         lines = keydata.splitlines()
         md['public-keys'] = [l for l in lines
@@ -202,30 +216,16 @@ def read_config_drive_dir(source_dir):
     if 'user-data' in meta_js:
         ud = meta_js['user-data']
 
-    return(md, ud)
-
-datasources = (
-  (DataSourceConfigDrive, (DataSource.DEP_FILESYSTEM, )),
-  (DataSourceConfigDriveNet,
-    (DataSource.DEP_FILESYSTEM, DataSource.DEP_NETWORK)),
-)
+    return (md, ud)
 
 
-# return a list of data sources that match this set of dependencies
+# Used to match classes to dependencies
+datasources = [
+  (DataSourceConfigDrive, (sources.DEP_FILESYSTEM, )),
+  (DataSourceConfigDriveNet, (sources.DEP_FILESYSTEM, sources.DEP_NETWORK)),
+]
+
+
+# Used to match classes to dependencies
 def get_datasource_list(depends):
-    return(DataSource.list_from_depends(depends, datasources))
-
-if __name__ == "__main__":
-    def main():
-        import sys
-        import pprint
-        print cfg_drive_device()
-        (md, ud) = read_config_drive_dir(sys.argv[1])
-        print "=== md ==="
-        pprint.pprint(md)
-        print "=== ud ==="
-        print(ud)
-
-    main()
-
-# vi: ts=4 expandtab
+    return sources.list_from_depends(depends, datasources)

From 799cb59d20bcbe0bf905982daf0a99ffe6fb9aa2 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 20:11:03 -0700
Subject: [PATCH 079/434] Add centering method + more descriptive mount failure
 exception message.

---
 cloudinit/util.py | 11 +++++++++--
 1 file changed, 9 insertions(+), 2 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 6cf75916..f02fcfe9 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -316,6 +316,11 @@ def tempdir(**kwargs):
         del_dir(tdir)
 
 
+def center(text, fill, max_len):
+    # Pad text on both sides with the fill character up to max_len columns.
+    return '{0:{pad}^{width}}'.format(text, pad=fill, width=max_len)
+
+
 def del_dir(path):
     LOG.debug("Recursively deleting %s", path)
     shutil.rmtree(path)
@@ -805,8 +810,10 @@ def mount_cb(device, callback, data=None, rw=False):
                 mountcmd.append(tmpd)
                 subp(mountcmd)
                 umount = tmpd
-            except IOError as exc:
-                raise MountFailedError("%s" % (exc))
+            except (IOError, OSError) as exc:
+                raise MountFailedError(("Failed mounting %s "
+                                        "to %s due to: %s") %
+                                       (device, tmpd, exc))
             mountpoint = "%s/" % tmpd
         with unmounter(umount):
             if data is None:

From 25b85ab42c4e47192d009ba5c220ffa14a7fbc8b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 20:11:24 -0700
Subject: [PATCH 080/434] Use pretty table to get a parseable format out.

---
 cloudinit/netinfo.py | 93 +++++++++++++++++++++++++++++++-------------
 1 file changed, 67 insertions(+), 26 deletions(-)

diff --git a/cloudinit/netinfo.py b/cloudinit/netinfo.py
index 541d2911..a211788c 100644
--- a/cloudinit/netinfo.py
+++ b/cloudinit/netinfo.py
@@ -19,12 +19,11 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+import os
+
 import cloudinit.util as util
 
-
-class NetInfo(object):
-    def __init__(self):
-        pass
+from prettytable import PrettyTable
 
 
 def netdev_info(empty=""):
@@ -71,47 +70,89 @@ def netdev_info(empty=""):
                 if dev[field] == "":
                     dev[field] = empty
 
-    return(devs)
+    return devs
 
 
 def route_info():
     (route_out, _err) = util.subp(["route", "-n"])
     routes = []
-    for line in str(route_out).splitlines()[1:]:
+    entries = route_out.splitlines()[1:]
+    for line in entries:
         if not line:
             continue
         toks = line.split()
         if toks[0] == "Kernel" or toks[0] == "Destination":
             continue
-        routes.append(toks)
-    return(routes)
+        entry = {
+            'destination': toks[0],
+            'gateway': toks[1],
+            'genmask': toks[2],
+            'flags': toks[3],
+            'metric': toks[4],
+            'ref': toks[5],
+            'use': toks[6],
+            'iface': toks[7],
+        }
+        routes.append(entry)
+    return routes
 
 
 def getgateway():
-    for r in route_info():
-        if r[3].find("G") >= 0:
-            return("%s[%s]" % (r[1], r[7]))
-    return(None)
+    """Return "gateway[iface]" for the first route flagged 'G', or None."""
+    try:
+        routes = route_info()
+    except Exception:
+        routes = []
+    for r in routes:
+        if r['flags'].find("G") >= 0:
+            return "%s[%s]" % (r['gateway'], r['iface'])
+    return None
 
 
-def debug_info(pre="ci-info: "):
+def netdev_pformat():
     lines = []
     try:
         netdev = netdev_info(empty=".")
     except Exception:
-        lines.append("netdev_info failed!")
-        netdev = {}
-    for (dev, d) in netdev.iteritems():
-        lines.append("%s%-6s: %i %-15s %-15s %s" %
-            (pre, dev, d["up"], d["addr"], d["mask"], d["hwaddr"]))
+        lines.append(util.center("Net device info failed", '!', 80))
+        netdev = None
+    if netdev is not None:
+        fields = ['Device', 'Up', 'Address', 'Mask', 'Hw-Address']
+        tbl = PrettyTable(fields)
+        for (dev, d) in netdev.iteritems():
+            tbl.add_row([dev, d["up"], d["addr"], d["mask"], d["hwaddr"]])
+        netdev_s = tbl.get_string()
+        max_len = len(max(netdev_s.splitlines(), key=len))
+        header = util.center("Net device info", "+", max_len)
+        lines.extend([header, netdev_s])
+    return os.linesep.join(lines)
+
+
+def route_pformat():
+    """Format route_info() as a titled table (or a failure banner)."""
+    lines = []
     try:
         routes = route_info()
     except Exception:
-        lines.append("route_info failed")
-        routes = []
-    n = 0
-    for r in routes:
-        lines.append("%sroute-%d: %-15s %-15s %-15s %-6s %s" %
-            (pre, n, r[0], r[1], r[2], r[7], r[3]))
-        n = n + 1
-    return('\n'.join(lines))
+        lines.append(util.center('Route info failed', '!', 80))
+        routes = None
+    if routes is not None:
+        fields = ['Route', 'Destination', 'Gateway',
+                  'Genmask', 'Interface', 'Flags']
+        tbl = PrettyTable(fields)
+        for n, r in enumerate(routes):
+            tbl.add_row([str(n), r['destination'],
+                        r['gateway'], r['genmask'],
+                        r['iface'], r['flags']])
+        route_s = tbl.get_string()
+        max_len = len(max(route_s.splitlines(), key=len))
+        header = util.center("Route info", "+", max_len)
+        lines.extend([header, route_s])
+    return os.linesep.join(lines)
+
+
+def debug_info(pre=""):
+    lines = []
+    lines.append(netdev_pformat())
+    lines.append(route_pformat())
+    return os.linesep.join(lines)

From ae466e42dff5ec0092c26c95175e1b22fbd2412d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 20:11:44 -0700
Subject: [PATCH 081/434] Rename sem class to file sem class, add clear_all
 methods, add empty methods to dummy sem class.

---
 cloudinit/helpers.py | 16 ++++++++++++++--
 1 file changed, 14 insertions(+), 2 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 16548001..e5f33a26 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -49,8 +49,14 @@ class DummySemaphores(object):
     def has_run(self, _name, _freq):
         return False
 
+    def clear(self, _name, _freq):
+        return True
 
-class Semaphores(object):
+    def clear_all(self):
+        pass
+
+
+class FileSemaphores(object):
     def __init__(self, sem_path):
         self.sem_path = sem_path
 
@@ -71,6 +77,12 @@ class Semaphores(object):
             return False
         return True
 
+    def clear_all(self):
+        try:
+            util.del_dir(self.sem_path)
+        except (IOError, OSError):
+            pass
+
     def _acquire(self, name, freq):
         if self.has_run(name, freq):
             return None
@@ -117,7 +129,7 @@ class Runners(object):
         if not sem_path:
             return None
         if sem_path not in self.sems:
-            self.sems[sem_path] = Semaphores(sem_path)
+            self.sems[sem_path] = FileSemaphores(sem_path)
         return self.sems[sem_path]
 
     def run(self, name, functor, args, freq=None, clear_on_fail=False):

From 54435c2557c9b2881cf81cfd16dab751e4fd7b10 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 20:12:36 -0700
Subject: [PATCH 082/434] Fix copyright.

---
 cloudinit/netinfo.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/netinfo.py b/cloudinit/netinfo.py
index a211788c..874c2674 100644
--- a/cloudinit/netinfo.py
+++ b/cloudinit/netinfo.py
@@ -1,11 +1,12 @@
-#!/usr/bin/python
 # vi: ts=4 expandtab
 #
 #    Copyright (C) 2012 Canonical Ltd.
 #    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Scott Moser <scott.moser@canonical.com>
 #    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as

From 473cc39708f476e141092630a4dabcf203ceac03 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 11 Jun 2012 22:15:11 -0700
Subject: [PATCH 083/434] Update with parsing of a requirements file, changelog
 for this new refactoring stuff and setup.py for both of those.

---
 ChangeLog |  2 ++
 Requires  |  2 ++
 setup.py  | 66 +++++++++++++++++++++++++++++++++++++++++++------------
 3 files changed, 56 insertions(+), 14 deletions(-)
 create mode 100644 Requires

diff --git a/ChangeLog b/ChangeLog
index 0964877e..f701927b 100644
--- a/ChangeLog
+++ b/ChangeLog
@@ -1,3 +1,5 @@
+0.7.0:
+ - Huge refactor [Joshua Harlow]
 0.6.4:
  - support relative path in AuthorizedKeysFile (LP: #970071).
 0.6.3:
diff --git a/Requires b/Requires
new file mode 100644
index 00000000..6a7064af
--- /dev/null
+++ b/Requires
@@ -0,0 +1,2 @@
+Tempita>=0.4
+PrettyTable>=0.4
diff --git a/setup.py b/setup.py
index f32662b8..96f889d8 100755
--- a/setup.py
+++ b/setup.py
@@ -1,10 +1,12 @@
-#!/usr/bin/python
 # vi: ts=4 expandtab
 #
 #    Distutils magic for ec2-init
+#
 #    Copyright (C) 2009 Canonical Ltd.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Soren Hansen <soren@canonical.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -17,24 +19,59 @@
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-#
-from distutils.core import setup
+
 from glob import glob
-import os.path
-import subprocess
+
+import os
+import re
+
+from distutils.core import setup
+from setuptools import find_packages
+
 
 def is_f(p):
-    return(os.path.isfile(p))
+    return os.path.isfile(p)
+
+
+def versions(fn="ChangeLog"):
+    """Return the version headings (e.g. "0.7.0" or "0.7") found in fn.
+
+    Headings are returned in file order; entry lines ("- ...") and any
+    other text that is not a bare version number are ignored.
+    """
+    with open(fn, 'r') as fh:
+        lines = fh.read().splitlines()
+    found = []
+    for line in lines:
+        line = line.strip().strip(":")
+        # \d+, not the class [\d+]: a component may have several digits.
+        if re.match(r"^\d+\.\d+(\.\d+)?$", line):
+            found.append(line)
+    return found
+
+
+def requires(fn='Requires'):
+    """Return the requirement specifiers listed in fn, one per entry.
+
+    Blank lines and lines whose first non-blank character is '#' are
+    dropped; every kept entry has its surrounding whitespace removed.
+    """
+    with open(fn, 'r') as fh:
+        entries = [raw.strip() for raw in fh.read().splitlines()]
+    # Keep only real requirements: skip blanks and '#' comment lines.
+    wanted = [entry for entry in entries if entry and entry[0] != '#']
+    return wanted
+
 
 setup(name='cloud-init',
-      version='0.6.3',
+      version=versions()[0],
       description='EC2 initialisation magic',
       author='Scott Moser',
       author_email='scott.moser@canonical.com',
       url='http://launchpad.net/cloud-init/',
-      packages=['cloudinit', 'cloudinit.CloudConfig' ],
-      scripts=['cloud-init.py',
-               'cloud-init-cfg.py',
+      packages=find_packages(),
+      scripts=['bin/cloud-init.py',
+               'bin/cloud-init-cfg.py',
                'tools/cloud-init-per',
                ],
       data_files=[('/etc/cloud', glob('config/*.cfg')),
@@ -42,11 +79,12 @@ setup(name='cloud-init',
                   ('/etc/cloud/templates', glob('templates/*')),
                   ('/etc/init', glob('upstart/*.conf')),
                   ('/usr/share/cloud-init', []),
-                  ('/usr/lib/cloud-init', 
+                  ('/usr/lib/cloud-init',
                     ['tools/uncloud-init', 'tools/write-ssh-key-fingerprints']),
-                  ('/usr/share/doc/cloud-init', filter(is_f,glob('doc/*'))),
-                  ('/usr/share/doc/cloud-init/examples', filter(is_f,glob('doc/examples/*'))),
-                  ('/usr/share/doc/cloud-init/examples/seed', filter(is_f,glob('doc/examples/seed/*'))),
+                  ('/usr/share/doc/cloud-init', filter(is_f, glob('doc/*'))),
+                  ('/usr/share/doc/cloud-init/examples', filter(is_f, glob('doc/examples/*'))),
+                  ('/usr/share/doc/cloud-init/examples/seed', filter(is_f, glob('doc/examples/seed/*'))),
                   ('/etc/profile.d', ['tools/Z99-cloud-locale-test.sh']),
                   ],
+      install_requires=requires(),
       )

From e526bcc736fbc0a86da774c5a2bc606ddf0359ad Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 13 Jun 2012 12:48:38 -0700
Subject: [PATCH 084/434] Add in a make url function (might be useful). Adjust
 usage of logexc to use that in the utils file for exceptions that occur. Add
 in more options to the subp function to capture outputs, shell mode and such.

---
 cloudinit/util.py | 222 ++++++++++++++++++++++++++++++++++++++++------
 1 file changed, 195 insertions(+), 27 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index f02fcfe9..7d5932c1 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -36,6 +36,7 @@ import socket
 import subprocess
 import sys
 import tempfile
+import traceback
 import types
 import urlparse
 
@@ -259,11 +260,79 @@ def get_cfg_by_path(yobj, keyp, default=None):
     cur = yobj
     for tok in keyp:
         if tok not in cur:
-            return(default)
+            return default
         cur = cur[tok]
     return cur
 
 
+# redirect_output(outfmt, errfmt, o_out, o_err)
+#  Point the file descriptors of o_out and o_err (sys.stdout and sys.stderr
+#  by default) at the targets named by outfmt and errfmt. A format can be:
+#   > FILEPATH    (truncate and write)
+#   >> FILEPATH   (append)
+#   | program [ arg1 [ arg2 [ ... ] ] ]
+#  If errfmt equals outfmt, both streams share the single target that was
+#  opened. With a '|', the arguments are passed to a shell, so one level
+#  of shell escaping is required. Any other mode raises TypeError.
+def redirect_output(outfmt, errfmt, o_out=sys.stdout, o_err=sys.stderr):
+    if outfmt:
+        (mode, arg) = outfmt.split(" ", 1)
+        if mode == ">" or mode == ">>":
+            owith = "ab"
+            if mode == ">":
+                owith = "wb"
+            new_fp = open(arg, owith)
+        elif mode == "|":
+            proc = subprocess.Popen(arg, shell=True, stdin=subprocess.PIPE)
+            new_fp = proc.stdin
+        else:
+            raise TypeError("Invalid type for outfmt: %s" % outfmt)
+
+        if o_out:
+            os.dup2(new_fp.fileno(), o_out.fileno())
+        if errfmt == outfmt:
+            os.dup2(new_fp.fileno(), o_err.fileno())
+            return
+
+    if errfmt:
+        (mode, arg) = errfmt.split(" ", 1)
+        if mode == ">" or mode == ">>":
+            owith = "ab"
+            if mode == ">":
+                owith = "wb"
+            new_fp = open(arg, owith)
+        elif mode == "|":
+            proc = subprocess.Popen(arg, shell=True, stdin=subprocess.PIPE)
+            new_fp = proc.stdin
+        else:
+            raise TypeError("Invalid type for errfmt: %s" % errfmt)
+
+        if o_err:
+            os.dup2(new_fp.fileno(), o_err.fileno())
+
+
+def make_url(scheme, host, port=None,
+                path='', params='', query='', fragment=''):
+    """Assemble a url string from its individual components.
+
+    The network location is str(host) (empty when host is falsy) followed
+    by ":<port>" whenever port is not None. Any other component that is
+    falsy (None, '') is treated as the empty string. The six resulting
+    pieces are joined with urlparse.urlunparse().
+    """
+    if host:
+        location = str(host)
+    else:
+        location = ''
+    if port is not None:
+        location += ":%s" % (port)
+
+    # Order expected by urlunparse: scheme, netloc, path, params,
+    # query and finally the fragment.
+    parts = (scheme, location, path, params, query, fragment)
+    return urlparse.urlunparse([part or '' for part in parts])
+
+
 def obj_name(obj):
     if isinstance(obj, (types.TypeType,
                         types.ModuleType,
@@ -359,7 +428,7 @@ def runparts(dirp, skip_no_exist=True):
             try:
                 subp([exe_path])
             except ProcessExecutionError as e:
-                LOG.exception("Failed running %s [%s]", exe_path, e.exit_code)
+                logexc(LOG, "Failed running %s [%s]", exe_path, e.exit_code)
                 failed += 1
 
     if failed and attempted:
@@ -405,7 +474,7 @@ def load_yaml(blob, default=None, allowed=(dict,)):
                             (allowed, obj_name(converted)))
         loaded = converted
     except (yaml.YAMLError, TypeError, ValueError) as exc:
-        LOG.exception("Failed loading yaml due to: %s", exc)
+        logexc(LOG, "Failed loading yaml blob")
     return loaded
 
 
@@ -682,9 +751,9 @@ def find_devs_with(criteria=None):
 
 def load_file(fname, read_cb=None):
     LOG.debug("Reading from %s", fname)
-    with open(fname, 'rb') as fh:
+    with open(fname, 'rb') as ifh:
         ofh = StringIO()
-        pipe_in_out(fh, ofh, chunk_cb=read_cb)
+        pipe_in_out(ifh, ofh, chunk_cb=read_cb)
         ofh.flush()
         contents = ofh.getvalue()
         LOG.debug("Read %s bytes from %s", len(contents), fname)
@@ -736,12 +805,90 @@ def chownbyname(fname, user=None, group=None):
     chownbyid(fname, uid, gid)
 
 
+# Always returns a well formatted [stdout, stderr] pair (entries may be None).
+# cfg is expected to have an entry 'output' in it, which is a dictionary
+# that includes entries for 'init', 'config', 'final' or 'all'
+#   init: /var/log/cloud.out
+#   config: [ ">> /var/log/cloud-config.out", /var/log/cloud-config.err ]
+#   final:
+#     output: "| logger -p"
+#     error: "> /dev/null"
+# The entry for 'mode' (or 'all' as fallback) is returned as "<op> <target>".
+def get_output_cfg(cfg, mode="init"):
+    ret = [None, None]
+    if not cfg or not 'output' in cfg:
+        return ret
+
+    outcfg = cfg['output']
+    if mode in outcfg:
+        modecfg = outcfg[mode]
+    else:
+        if 'all' not in outcfg:
+            return ret
+        # if there is an 'all' item in the output config
+        # then it applies to all users of this (init, config, final)
+        modecfg = outcfg['all']
+
+    # if value is a string, it specifies both stdout and stderr
+    if isinstance(modecfg, str):
+        ret = [modecfg, modecfg]
+
+    # if it's a list, then we expect (stdout, stderr)
+    if isinstance(modecfg, list):
+        if len(modecfg) > 0:
+            ret[0] = modecfg[0]
+        if len(modecfg) > 1:
+            ret[1] = modecfg[1]
+
+    # if it is a dictionary, expect 'output' and 'error'
+    # items, which indicate stdout and stderr respectively
+    if isinstance(modecfg, dict):
+        if 'output' in modecfg:
+            ret[0] = modecfg['output']
+        if 'error' in modecfg:
+            ret[1] = modecfg['error']
+
+    # if err's entry == "&1", then make it same as stdout
+    # as in shell syntax of "echo foo >/dev/null 2>&1"
+    if ret[1] == "&1":
+        ret[1] = ret[0]
+
+    swlist = [">>", ">", "|"]
+    for i in range(len(ret)):
+        if not ret[i]:
+            continue
+        val = ret[i].lstrip()
+        found = False
+        for s in swlist:
+            if val.startswith(s):
+                val = "%s %s" % (s, val[len(s):].strip())
+                found = True
+                break
+        if not found:
+            # no operator given: default behavior is append (">>")
+            val = "%s %s" % (">>", val.strip())
+        ret[i] = val
+
+    return ret
+
+
+def logexc(log, msg='', *args):
+    # Central place for reporting exceptions so the level can be changed
+    # easily: the message alone goes out as a warning (a full traceback
+    # is not always desirable on a non-debug stream), while the
+    # traceback itself is only attached to the debug record below.
+    if msg:
+        log.warn(msg, *args)
+    # Debug gets the full trace
+    log.debug(msg, exc_info=1, *args)
+
+
 def ensure_dirs(dirlist, mode=0755):
     for d in dirlist:
         ensure_dir(d, mode)
 
 
-def ensure_dir(path, mode=0755):
+def ensure_dir(path, mode=None):
     if not os.path.isdir(path):
         # Make the dir and adjust the mode
         LOG.debug("Ensuring directory exists at path %s", path)
@@ -771,24 +918,29 @@ def unmounter(umount):
 def mounts():
     mounted = {}
     try:
-        # Go through mounts to see if it was already mounted
+        # Go through mounts to see what is already mounted
         mount_locs = load_file("/proc/mounts").splitlines()
         for mpline in mount_locs:
             # Format at: http://linux.die.net/man/5/fstab
             try:
-                (dev, mp, fstype, _opts, _freq, _passno) = mpline.split()
+                (dev, mp, fstype, opts, _freq, _passno) = mpline.split()
             except:
                 continue
             # If the name of the mount point contains spaces these 
             # can be escaped as '\040', so undo that..
             mp = mp.replace("\\040", " ")
-            mounted[dev] = (dev, fstype, mp, False)
+            mounted[dev] = {
+                'fstype': fstype,
+                'mountpoint': mp,
+                'opts': opts,
+            }
+        LOG.debug("Fetched %s mounts from %s", mounted, "/proc/mounts")
     except (IOError, OSError):
-        pass
+        logexc(LOG, "Failed fetching mount points from /proc/mounts")
     return mounted
 
 
-def mount_cb(device, callback, data=None, rw=False):
+def mount_cb(device, callback, data=None, rw=False, mtype=None):
     """
     Mount the device, call method 'callback' passing the directory
     in which it was mounted, then unmount.  Return whatever 'callback'
@@ -798,7 +950,7 @@ def mount_cb(device, callback, data=None, rw=False):
     with tempdir() as tmpd:
         umount = False
         if device in mounted:
-            mountpoint = "%s/" % mounted[device][2]
+            mountpoint = "%s/" % mounted[device]['mountpoint']
         else:
             try:
                 mountcmd = ['mount', "-o"]
@@ -806,6 +958,8 @@ def mount_cb(device, callback, data=None, rw=False):
                     mountcmd.append('rw')
                 else:
                     mountcmd.append('ro')
+                if mtype:
+                    mountcmd.extend(['-t', mtype])
                 mountcmd.append(device)
                 mountcmd.append(tmpd)
                 subp(mountcmd)
@@ -891,28 +1045,42 @@ def delete_dir_contents(dirname):
             del_file(node_fullpath)
 
 
-def subp(args, input_data=None, allowed_rc=None, env=None):
-    if allowed_rc is None:
-        allowed_rc = [0]
+def subp(args, data=None, rcs=None, env=None, capture=True, shell=False):
+    if rcs is None:
+        rcs = [0]
     try:
-        LOG.debug("Running command %s with allowed return codes %s",
-                  args, allowed_rc)
-        sp = subprocess.Popen(args, stdout=subprocess.PIPE,
-            stderr=subprocess.PIPE, stdin=subprocess.PIPE,
-            env=env)
-        (out, err) = sp.communicate(input_data)
+        LOG.debug(("Running command %s with allowed return codes %s"
+                   " (shell=%s, capture=%s)"), args, rcs, shell, capture)
+        if not capture:
+            stdout = None
+            stderr = None
+        else:
+            stdout = subprocess.PIPE
+            stderr = subprocess.PIPE
+        # Always pipe stdin (for now)
+        # harlowja: I don't see why anyone would want to pipe stdin
+        # since cloud-init shuts it down (via the method close stdin)
+        stdin = subprocess.PIPE
+        sp = subprocess.Popen(args, stdout=stdout,
+                        stderr=stderr, stdin=stdin,
+                        env=env, shell=shell)
+        (out, err) = sp.communicate(data)
     except OSError as e:
         raise ProcessExecutionError(cmd=args, reason=e)
     rc = sp.returncode
-    if rc not in allowed_rc:
+    if rc not in rcs:
         raise ProcessExecutionError(stdout=out, stderr=err,
-                                         exit_code=rc,
-                                         cmd=args)
-    # Just ensure blank instead of none??
-    if not out:
+                                    exit_code=rc,
+                                    cmd=args)
+    # Just ensure blank instead of none?? (iff capturing)
+    if not out and capture:
         out = ''
-    if not err:
+    if not err and capture:
         err = ''
+    # Useful to note what happened...
+    if capture:
+        LOG.debug("Stdout: %s", out)
+        LOG.debug("Stderr: %s", err)
     return (out, err)
 
 

From 7ac25d5ec3ed06d1c0df1462c147c70cf4c5948d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:33:55 -0700
Subject: [PATCH 085/434] Moved the contents of this file back to user_data.py
 It seems to make sense to have that file, then have a handler directory for
 user data handlers.

---
 cloudinit/user_data/__init__.py | 215 --------------------------------
 1 file changed, 215 deletions(-)
 delete mode 100644 cloudinit/user_data/__init__.py

diff --git a/cloudinit/user_data/__init__.py b/cloudinit/user_data/__init__.py
deleted file mode 100644
index 1910ba28..00000000
--- a/cloudinit/user_data/__init__.py
+++ /dev/null
@@ -1,215 +0,0 @@
-# vi: ts=4 expandtab
-#
-#    Copyright (C) 2012 Canonical Ltd.
-#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
-#    Copyright (C) 2012 Yahoo! Inc.
-#
-#    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
-#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
-#
-#    This program is free software: you can redistribute it and/or modify
-#    it under the terms of the GNU General Public License version 3, as
-#    published by the Free Software Foundation.
-#
-#    This program is distributed in the hope that it will be useful,
-#    but WITHOUT ANY WARRANTY; without even the implied warranty of
-#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-#    GNU General Public License for more details.
-#
-#    You should have received a copy of the GNU General Public License
-#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-
-import os
-import glob
-
-import email
-
-from email.mime.base import MIMEBase
-
-from cloudinit import importer
-from cloudinit import log as logging
-from cloudinit import util
-
-from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
-
-LOG = logging.getLogger(__name__)
-
-# Special content types that signal the start and end of processing
-CONTENT_END = "__end__"
-CONTENT_START = "__begin__"
-CONTENT_SIGNALS = [CONTENT_START, CONTENT_END]
-
-# Used when a part-handler type is encountered
-# to allow for registration of new types.
-PART_CONTENT_TYPES = ["text/part-handler"]
-PART_HANDLER_FN_TMPL = 'part-handler-%03d'
-
-# For parts without filenames
-PART_FN_TPL = 'part-%03d'
-
-# Used as the content type when a message is not multipart
-# and it doesn't contain its own content-type
-NOT_MULTIPART_TYPE = "text/x-not-multipart"
-OCTET_TYPE = 'application/octet-stream'
-
-# Different file beginnings to there content type
-INCLUSION_TYPES_MAP = {
-    '#include': 'text/x-include-url',
-    '#include-once': 'text/x-include-once-url',
-    '#!': 'text/x-shellscript',
-    '#cloud-config': 'text/cloud-config',
-    '#upstart-job': 'text/upstart-job',
-    '#part-handler': 'text/part-handler',
-    '#cloud-boothook': 'text/cloud-boothook',
-    '#cloud-config-archive': 'text/cloud-config-archive',
-}
-
-# Sorted longest first
-INCLUSION_SRCH = sorted(INCLUSION_TYPES_MAP.keys(), key=(lambda e: 0 - len(e)))
-
-
-class PartHandler(object):
-    def __init__(self, frequency, version=2):
-        self.handler_version = version
-        self.frequency = frequency
-
-    def __repr__(self):
-        return "%s: [%s]" % (self.__class__.__name__, self.list_types())
-
-    def list_types(self):
-        raise NotImplementedError()
-
-    def handle_part(self, data, ctype, filename, payload, frequency):
-        return self._handle_part(data, ctype, filename, payload, frequency)
-
-    def _handle_part(self, data, ctype, filename, payload, frequency):
-        raise NotImplementedError()
-
-
-def fixup_module(mod, def_freq=PER_INSTANCE):
-    if not hasattr(mod, "handler_version"):
-        setattr(mod, "handler_version", 1)
-    if not hasattr(mod, 'list_types'):
-        def empty_types():
-            return []
-        setattr(mod, 'list_types', empty_types)
-    if not hasattr(mod, 'frequency'):
-        setattr(mod, 'frequency', def_freq)
-    if not hasattr(mod, 'handle_part'):
-        def empty_handler(_data, _ctype, _filename, _payload):
-            pass
-        setattr(mod, 'handle_part', empty_handler)
-    return mod
-
-
-def run_part(mod, data, ctype, filename, payload, frequency):
-    mod_freq = mod.frequency
-    if not (mod_freq == PER_ALWAYS or
-            (frequency == PER_INSTANCE and mod_freq == PER_INSTANCE)):
-        return
-    mod_ver = mod.handler_version
-    try:
-        if mod_ver == 1:
-            mod.handle_part(data, ctype, filename, payload)
-        else:
-            mod.handle_part(data, ctype, filename, payload, frequency)
-    except:
-        LOG.exception(("Failed calling mod %s (%s, %s, %s)"
-                     " with frequency %s"), mod, ctype, filename,
-                     mod_ver, frequency)
-
-
-def call_begin(mod, data, frequency):
-    run_part(mod, data, CONTENT_START, None, None, frequency)
-
-
-def call_end(mod, data, frequency):
-    run_part(mod, data, CONTENT_END, None, None, frequency)
-
-
-def walker_handle_handler(pdata, _ctype, _filename, payload):
-    curcount = pdata['handlercount']
-    modname = PART_HANDLER_FN_TMPL % (curcount)
-    frequency = pdata['frequency']
-    modfname = os.path.join(pdata['handlerdir'], "%s.py" % (modname))
-    # TODO: Check if path exists??
-    util.write_file(modfname, payload, 0600)
-    handlers = pdata['handlers']
-    try:
-        mod = fixup_module(importer.import_module(modname))
-        handlers.register(mod)
-        call_begin(mod, pdata['data'], frequency)
-        pdata['handlercount'] = curcount + 1
-    except:
-        LOG.exception("Failed at registered python file: %s", modfname)
-
-
-def walker_callback(pdata, ctype, filename, payload):
-    if ctype in PART_CONTENT_TYPES:
-        walker_handle_handler(pdata, ctype, filename, payload)
-        return
-    handlers = pdata['handlers']
-    if ctype not in handlers:
-        if ctype == NOT_MULTIPART_TYPE:
-            # Extract the first line or 24 bytes for displaying in the log
-            start = payload.split("\n", 1)[0][:24]
-            if start < payload:
-                details = "starting '%s...'" % start.encode("string-escape")
-            else:
-                details = repr(payload)
-            LOG.warning("Unhandled non-multipart userdata: %s", details)
-        return
-    run_part(handlers[ctype], pdata['data'], ctype, filename,
-             payload, pdata['frequency'])
-
-
-# Callback is a function that will be called with 
-# (data, content_type, filename, payload)
-def walk(msg, callback, data):
-    partnum = 0
-    for part in msg.walk():
-        # multipart/* are just containers
-        if part.get_content_maintype() == 'multipart':
-            continue
-
-        ctype = part.get_content_type()
-        if ctype is None:
-            ctype = OCTET_TYPE
-
-        filename = part.get_filename()
-        if not filename:
-            filename = PART_FN_TPL % (partnum)
-
-        callback(data, ctype, filename, part.get_payload(decode=True))
-        partnum = partnum + 1
-
-
-# Coverts a raw string into a mime message
-def convert_string(raw_data, headers=None):
-    if not raw_data:
-        raw_data = ''
-    if not headers:
-        headers = {}
-    data = util.decomp_str(raw_data)
-    if "mime-version:" in data[0:4096].lower():
-        msg = email.message_from_string(data)
-        for (key, val) in headers.items():
-            if key in msg:
-                msg.replace_header(key, val)
-            else:
-                msg[key] = val
-    else:
-        mtype = headers.get("Content-Type", NOT_MULTIPART_TYPE)
-        maintype, subtype = mtype.split("/", 1)
-        msg = MIMEBase(maintype, subtype, *headers)
-        msg.set_payload(data)
-    return msg
-
-
-def type_from_starts_with(payload, default=None):
-    for text in INCLUSION_SRCH:
-        if payload.startswith(text):
-            return INCLUSION_TYPES_MAP[text]
-    return default
\ No newline at end of file

From 1559180eea66d9e73ce81fcfadab252f7f5c5461 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:34:28 -0700
Subject: [PATCH 086/434] Moved this class which does the user data process
 back to the main user_data.py file. It seems to make a little more sense for
 now to move it to there.

---
 cloudinit/user_data/processor.py | 204 -------------------------------
 1 file changed, 204 deletions(-)
 delete mode 100644 cloudinit/user_data/processor.py

diff --git a/cloudinit/user_data/processor.py b/cloudinit/user_data/processor.py
deleted file mode 100644
index 6e796f1c..00000000
--- a/cloudinit/user_data/processor.py
+++ /dev/null
@@ -1,204 +0,0 @@
-# vi: ts=4 expandtab
-#
-#    Copyright (C) 2012 Canonical Ltd.
-#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
-#    Copyright (C) 2012 Yahoo! Inc.
-#
-#    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
-#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
-#
-#    This program is free software: you can redistribute it and/or modify
-#    it under the terms of the GNU General Public License version 3, as
-#    published by the Free Software Foundation.
-#
-#    This program is distributed in the hope that it will be useful,
-#    but WITHOUT ANY WARRANTY; without even the implied warranty of
-#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-#    GNU General Public License for more details.
-#
-#    You should have received a copy of the GNU General Public License
-#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-import hashlib
-import os
-
-from email.mime.multipart import MIMEMultipart
-from email.mime.text import MIMEText
-from email.mime.base import MIMEBase
-
-from cloudinit import log as logging
-from cloudinit import url_helper
-from cloudinit import user_data as ud
-from cloudinit import util
-
-# Various special content types
-TYPE_NEEDED = ["text/plain", "text/x-not-multipart"]
-INCLUDE_TYPES = ['text/x-include-url', 'text/x-include-once-url']
-ARCHIVE_TYPES = ["text/cloud-config-archive"]
-UNDEF_TYPE = "text/plain"
-ARCHIVE_UNDEF_TYPE = "text/cloud-config"
-OCTET_TYPE = 'application/octet-stream'
-
-# Msg header used to track attachments
-ATTACHMENT_FIELD = 'Number-Attachments'
-
-# This will be used to create a filename from a url (or like) entry
-# When we want to make sure a entry isn't included
-# more than once across sessions.
-INCLUDE_ONCE_HASHER = 'md5'
-MAX_INCLUDE_FN_LEN = 64
-
-LOG = logging.getLogger(__name__)
-
-
-class UserDataProcessor(object):
-    def __init__(self, paths):
-        self.paths = paths
-
-    def process(self, blob):
-        base_msg = ud.convert_string(blob)
-        process_msg = MIMEMultipart()
-        self._process_msg(base_msg, process_msg)
-        return process_msg
-
-    def _process_msg(self, base_msg, append_msg):
-        for part in base_msg.walk():
-            # multipart/* are just containers
-            if part.get_content_maintype() == 'multipart':
-                continue
-    
-            ctype = None
-            ctype_orig = part.get_content_type()
-            payload = part.get_payload(decode=True)
-    
-            if not ctype_orig:
-                ctype_orig = UNDEF_TYPE
-    
-            if ctype_orig in TYPE_NEEDED:
-                ctype = ud.type_from_starts_with(payload)
-    
-            if ctype is None:
-                ctype = ctype_orig
-    
-            if ctype in INCLUDE_TYPES:
-                self._do_include(payload, append_msg)
-                continue
-    
-            if ctype in ARCHIVE_TYPES:
-                self._explode_archive(payload, append_msg)
-                continue
-    
-            if 'Content-Type' in base_msg:
-                base_msg.replace_header('Content-Type', ctype)
-            else:
-                base_msg['Content-Type'] = ctype
-    
-            self._attach_part(append_msg, part)
-
-    def _get_include_once_filename(self, entry):
-        msum = hashlib.new(INCLUDE_ONCE_HASHER)
-        msum.update(entry)
-        # Don't get to long now
-        entry_fn = msum.hexdigest()[0:MAX_INCLUDE_FN_LEN]
-        return os.path.join(self.paths.get_ipath_cur('data'),
-                            'urlcache', entry_fn)
-
-    def _do_include(self, content, append_msg):
-        # is just a list of urls, one per line
-        # also support '#include <url here>'
-        for line in content.splitlines():
-            includeonce = False
-            if line in ("#include", "#include-once"):
-                continue
-            if line.startswith("#include-once"):
-                line = line[len("#include-once"):].lstrip()
-                includeonce = True
-            elif line.startswith("#include"):
-                line = line[len("#include"):].lstrip()
-            if line.startswith("#"):
-                continue
-            include_url = line.strip()
-            if not include_url:
-                continue
-
-            includeonce_filename = self._get_include_once_filename(include_url)
-            if includeonce and os.path.isfile(includeonce_filename):
-                content = util.load_file(includeonce_filename)
-            else:
-                (content, st) = url_helper.readurl(include_url)
-                if includeonce and url_helper.ok_http_code(st):
-                    util.write_file(includeonce_filename, content, mode=0600)
-                if not url_helper.ok_http_code(st):
-                    content = ''
-
-            new_msg = ud.convert_string(content)
-            self._process_msg(new_msg, append_msg)
-
-    def _explode_archive(self, archive, append_msg):
-        entries = util.load_yaml(archive, default=[], allowed=[list, set])
-        for ent in entries:
-            # ent can be one of:
-            #  dict { 'filename' : 'value', 'content' :
-            #       'value', 'type' : 'value' }
-            #    filename and type not be present
-            # or
-            #  scalar(payload)
-            if isinstance(ent, str):
-                ent = {'content': ent}
-            if not isinstance(ent, (dict)):
-                # TODO raise?
-                continue
-
-            content = ent.get('content', '')
-            mtype = ent.get('type')
-            if not mtype:
-                mtype = ud.type_from_starts_with(content, ARCHIVE_UNDEF_TYPE)
-
-            maintype, subtype = mtype.split('/', 1)
-            if maintype == "text":
-                msg = MIMEText(content, _subtype=subtype)
-            else:
-                msg = MIMEBase(maintype, subtype)
-                msg.set_payload(content)
-
-            if 'filename' in ent:
-                msg.add_header('Content-Disposition', 'attachment',
-                                filename=ent['filename'])
-
-            for header in ent.keys():
-                if header in ('content', 'filename', 'type'):
-                    continue
-                msg.add_header(header, ent['header'])
-
-            self._attach_part(append_msg, msg)
-
-    def _multi_part_count(self, outer_msg, new_count=None):
-        """
-        Return the number of attachments to this MIMEMultipart by looking
-        at its 'Number-Attachments' header.
-        """
-        if ATTACHMENT_FIELD not in outer_msg:
-            outer_msg[ATTACHMENT_FIELD] = str(0)
-    
-        if new_count is not None:
-            outer_msg.replace_header(ATTACHMENT_FIELD, str(new_count))
-    
-        fetched_count = 0
-        try:
-            fetched_count = int(outer_msg.get(ATTACHMENT_FIELD))
-        except (ValueError, TypeError):
-            outer_msg.replace_header(ATTACHMENT_FIELD, str(fetched_count))
-        return fetched_count
-
-    def _attach_part(self, outer_msg, part):
-        """
-        Attach an part to an outer message. outermsg must be a MIMEMultipart.
-        Modifies a header in the message to keep track of number of attachments.
-        """
-        cur = self._multi_part_count(outer_msg)
-        if not part.get_filename():
-            fn = ud.PART_FN_TPL % (cur + 1)
-            part.add_header('Content-Disposition', 'attachment', filename=fn)
-        outer_msg.attach(part)
-        self._multi_part_count(outer_msg, cur + 1)

From a4ce5195713f5d2dab5a4d84921f77549ab792e6 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:35:07 -0700
Subject: [PATCH 087/434] Moved the handlers from a user_data directory to a
 handler directory.

---
 cloudinit/{user_data => handlers}/boot_hook.py              | 6 +++---
 cloudinit/{handlers => transforms}/__init__.py              | 0
 cloudinit/{handlers => transforms}/cc_apt_pipelining.py     | 0
 cloudinit/{handlers => transforms}/cc_apt_update_upgrade.py | 0
 cloudinit/{handlers => transforms}/cc_bootcmd.py            | 0
 cloudinit/{handlers => transforms}/cc_byobu.py              | 0
 cloudinit/{handlers => transforms}/cc_ca_certs.py           | 0
 cloudinit/{handlers => transforms}/cc_chef.py               | 0
 .../{handlers => transforms}/cc_disable_ec2_metadata.py     | 0
 cloudinit/{handlers => transforms}/cc_final_message.py      | 0
 cloudinit/{handlers => transforms}/cc_foo.py                | 0
 cloudinit/{handlers => transforms}/cc_grub_dpkg.py          | 0
 cloudinit/{handlers => transforms}/cc_keys_to_console.py    | 0
 cloudinit/{handlers => transforms}/cc_landscape.py          | 0
 cloudinit/{handlers => transforms}/cc_locale.py             | 0
 cloudinit/{handlers => transforms}/cc_mcollective.py        | 0
 cloudinit/{handlers => transforms}/cc_mounts.py             | 0
 cloudinit/{handlers => transforms}/cc_phone_home.py         | 0
 cloudinit/{handlers => transforms}/cc_puppet.py             | 0
 cloudinit/{handlers => transforms}/cc_resizefs.py           | 0
 .../{handlers => transforms}/cc_rightscale_userdata.py      | 0
 cloudinit/{handlers => transforms}/cc_rsyslog.py            | 0
 cloudinit/{handlers => transforms}/cc_runcmd.py             | 0
 cloudinit/{handlers => transforms}/cc_salt_minion.py        | 0
 cloudinit/{handlers => transforms}/cc_scripts_per_boot.py   | 0
 .../{handlers => transforms}/cc_scripts_per_instance.py     | 0
 cloudinit/{handlers => transforms}/cc_scripts_per_once.py   | 0
 cloudinit/{handlers => transforms}/cc_scripts_user.py       | 0
 cloudinit/{handlers => transforms}/cc_set_hostname.py       | 0
 cloudinit/{handlers => transforms}/cc_set_passwords.py      | 0
 cloudinit/{handlers => transforms}/cc_ssh.py                | 0
 cloudinit/{handlers => transforms}/cc_ssh_import_id.py      | 0
 cloudinit/{handlers => transforms}/cc_timezone.py           | 0
 cloudinit/{handlers => transforms}/cc_update_etc_hosts.py   | 0
 cloudinit/{handlers => transforms}/cc_update_hostname.py    | 0
 35 files changed, 3 insertions(+), 3 deletions(-)
 rename cloudinit/{user_data => handlers}/boot_hook.py (91%)
 rename cloudinit/{handlers => transforms}/__init__.py (100%)
 rename cloudinit/{handlers => transforms}/cc_apt_pipelining.py (100%)
 rename cloudinit/{handlers => transforms}/cc_apt_update_upgrade.py (100%)
 rename cloudinit/{handlers => transforms}/cc_bootcmd.py (100%)
 rename cloudinit/{handlers => transforms}/cc_byobu.py (100%)
 rename cloudinit/{handlers => transforms}/cc_ca_certs.py (100%)
 rename cloudinit/{handlers => transforms}/cc_chef.py (100%)
 rename cloudinit/{handlers => transforms}/cc_disable_ec2_metadata.py (100%)
 rename cloudinit/{handlers => transforms}/cc_final_message.py (100%)
 rename cloudinit/{handlers => transforms}/cc_foo.py (100%)
 rename cloudinit/{handlers => transforms}/cc_grub_dpkg.py (100%)
 rename cloudinit/{handlers => transforms}/cc_keys_to_console.py (100%)
 rename cloudinit/{handlers => transforms}/cc_landscape.py (100%)
 rename cloudinit/{handlers => transforms}/cc_locale.py (100%)
 rename cloudinit/{handlers => transforms}/cc_mcollective.py (100%)
 rename cloudinit/{handlers => transforms}/cc_mounts.py (100%)
 rename cloudinit/{handlers => transforms}/cc_phone_home.py (100%)
 rename cloudinit/{handlers => transforms}/cc_puppet.py (100%)
 rename cloudinit/{handlers => transforms}/cc_resizefs.py (100%)
 rename cloudinit/{handlers => transforms}/cc_rightscale_userdata.py (100%)
 rename cloudinit/{handlers => transforms}/cc_rsyslog.py (100%)
 rename cloudinit/{handlers => transforms}/cc_runcmd.py (100%)
 rename cloudinit/{handlers => transforms}/cc_salt_minion.py (100%)
 rename cloudinit/{handlers => transforms}/cc_scripts_per_boot.py (100%)
 rename cloudinit/{handlers => transforms}/cc_scripts_per_instance.py (100%)
 rename cloudinit/{handlers => transforms}/cc_scripts_per_once.py (100%)
 rename cloudinit/{handlers => transforms}/cc_scripts_user.py (100%)
 rename cloudinit/{handlers => transforms}/cc_set_hostname.py (100%)
 rename cloudinit/{handlers => transforms}/cc_set_passwords.py (100%)
 rename cloudinit/{handlers => transforms}/cc_ssh.py (100%)
 rename cloudinit/{handlers => transforms}/cc_ssh_import_id.py (100%)
 rename cloudinit/{handlers => transforms}/cc_timezone.py (100%)
 rename cloudinit/{handlers => transforms}/cc_update_etc_hosts.py (100%)
 rename cloudinit/{handlers => transforms}/cc_update_hostname.py (100%)

diff --git a/cloudinit/user_data/boot_hook.py b/cloudinit/handlers/boot_hook.py
similarity index 91%
rename from cloudinit/user_data/boot_hook.py
rename to cloudinit/handlers/boot_hook.py
index 87e7a3ec..c75aeb72 100644
--- a/cloudinit/user_data/boot_hook.py
+++ b/cloudinit/handlers/boot_hook.py
@@ -60,7 +60,7 @@ class BootHookPartHandler(ud.PartHandler):
             env['INSTANCE_ID'] = str(self.instance_id)
             util.subp([filepath], env=env)
         except util.ProcessExecutionError as e:
-            LOG.error("Boothooks script %s execution error %s", filepath, e)
+            util.logexc(LOG, "Boothooks script %s execution error", filepath)
         except Exception as e:
-            LOG.exception(("Boothooks unknown "
-                           "error %s when running %s"), e, filepath)
+            util.logexc(LOG, ("Boothooks unknown "
+                              "error when running %s"), filepath)
diff --git a/cloudinit/handlers/__init__.py b/cloudinit/transforms/__init__.py
similarity index 100%
rename from cloudinit/handlers/__init__.py
rename to cloudinit/transforms/__init__.py
diff --git a/cloudinit/handlers/cc_apt_pipelining.py b/cloudinit/transforms/cc_apt_pipelining.py
similarity index 100%
rename from cloudinit/handlers/cc_apt_pipelining.py
rename to cloudinit/transforms/cc_apt_pipelining.py
diff --git a/cloudinit/handlers/cc_apt_update_upgrade.py b/cloudinit/transforms/cc_apt_update_upgrade.py
similarity index 100%
rename from cloudinit/handlers/cc_apt_update_upgrade.py
rename to cloudinit/transforms/cc_apt_update_upgrade.py
diff --git a/cloudinit/handlers/cc_bootcmd.py b/cloudinit/transforms/cc_bootcmd.py
similarity index 100%
rename from cloudinit/handlers/cc_bootcmd.py
rename to cloudinit/transforms/cc_bootcmd.py
diff --git a/cloudinit/handlers/cc_byobu.py b/cloudinit/transforms/cc_byobu.py
similarity index 100%
rename from cloudinit/handlers/cc_byobu.py
rename to cloudinit/transforms/cc_byobu.py
diff --git a/cloudinit/handlers/cc_ca_certs.py b/cloudinit/transforms/cc_ca_certs.py
similarity index 100%
rename from cloudinit/handlers/cc_ca_certs.py
rename to cloudinit/transforms/cc_ca_certs.py
diff --git a/cloudinit/handlers/cc_chef.py b/cloudinit/transforms/cc_chef.py
similarity index 100%
rename from cloudinit/handlers/cc_chef.py
rename to cloudinit/transforms/cc_chef.py
diff --git a/cloudinit/handlers/cc_disable_ec2_metadata.py b/cloudinit/transforms/cc_disable_ec2_metadata.py
similarity index 100%
rename from cloudinit/handlers/cc_disable_ec2_metadata.py
rename to cloudinit/transforms/cc_disable_ec2_metadata.py
diff --git a/cloudinit/handlers/cc_final_message.py b/cloudinit/transforms/cc_final_message.py
similarity index 100%
rename from cloudinit/handlers/cc_final_message.py
rename to cloudinit/transforms/cc_final_message.py
diff --git a/cloudinit/handlers/cc_foo.py b/cloudinit/transforms/cc_foo.py
similarity index 100%
rename from cloudinit/handlers/cc_foo.py
rename to cloudinit/transforms/cc_foo.py
diff --git a/cloudinit/handlers/cc_grub_dpkg.py b/cloudinit/transforms/cc_grub_dpkg.py
similarity index 100%
rename from cloudinit/handlers/cc_grub_dpkg.py
rename to cloudinit/transforms/cc_grub_dpkg.py
diff --git a/cloudinit/handlers/cc_keys_to_console.py b/cloudinit/transforms/cc_keys_to_console.py
similarity index 100%
rename from cloudinit/handlers/cc_keys_to_console.py
rename to cloudinit/transforms/cc_keys_to_console.py
diff --git a/cloudinit/handlers/cc_landscape.py b/cloudinit/transforms/cc_landscape.py
similarity index 100%
rename from cloudinit/handlers/cc_landscape.py
rename to cloudinit/transforms/cc_landscape.py
diff --git a/cloudinit/handlers/cc_locale.py b/cloudinit/transforms/cc_locale.py
similarity index 100%
rename from cloudinit/handlers/cc_locale.py
rename to cloudinit/transforms/cc_locale.py
diff --git a/cloudinit/handlers/cc_mcollective.py b/cloudinit/transforms/cc_mcollective.py
similarity index 100%
rename from cloudinit/handlers/cc_mcollective.py
rename to cloudinit/transforms/cc_mcollective.py
diff --git a/cloudinit/handlers/cc_mounts.py b/cloudinit/transforms/cc_mounts.py
similarity index 100%
rename from cloudinit/handlers/cc_mounts.py
rename to cloudinit/transforms/cc_mounts.py
diff --git a/cloudinit/handlers/cc_phone_home.py b/cloudinit/transforms/cc_phone_home.py
similarity index 100%
rename from cloudinit/handlers/cc_phone_home.py
rename to cloudinit/transforms/cc_phone_home.py
diff --git a/cloudinit/handlers/cc_puppet.py b/cloudinit/transforms/cc_puppet.py
similarity index 100%
rename from cloudinit/handlers/cc_puppet.py
rename to cloudinit/transforms/cc_puppet.py
diff --git a/cloudinit/handlers/cc_resizefs.py b/cloudinit/transforms/cc_resizefs.py
similarity index 100%
rename from cloudinit/handlers/cc_resizefs.py
rename to cloudinit/transforms/cc_resizefs.py
diff --git a/cloudinit/handlers/cc_rightscale_userdata.py b/cloudinit/transforms/cc_rightscale_userdata.py
similarity index 100%
rename from cloudinit/handlers/cc_rightscale_userdata.py
rename to cloudinit/transforms/cc_rightscale_userdata.py
diff --git a/cloudinit/handlers/cc_rsyslog.py b/cloudinit/transforms/cc_rsyslog.py
similarity index 100%
rename from cloudinit/handlers/cc_rsyslog.py
rename to cloudinit/transforms/cc_rsyslog.py
diff --git a/cloudinit/handlers/cc_runcmd.py b/cloudinit/transforms/cc_runcmd.py
similarity index 100%
rename from cloudinit/handlers/cc_runcmd.py
rename to cloudinit/transforms/cc_runcmd.py
diff --git a/cloudinit/handlers/cc_salt_minion.py b/cloudinit/transforms/cc_salt_minion.py
similarity index 100%
rename from cloudinit/handlers/cc_salt_minion.py
rename to cloudinit/transforms/cc_salt_minion.py
diff --git a/cloudinit/handlers/cc_scripts_per_boot.py b/cloudinit/transforms/cc_scripts_per_boot.py
similarity index 100%
rename from cloudinit/handlers/cc_scripts_per_boot.py
rename to cloudinit/transforms/cc_scripts_per_boot.py
diff --git a/cloudinit/handlers/cc_scripts_per_instance.py b/cloudinit/transforms/cc_scripts_per_instance.py
similarity index 100%
rename from cloudinit/handlers/cc_scripts_per_instance.py
rename to cloudinit/transforms/cc_scripts_per_instance.py
diff --git a/cloudinit/handlers/cc_scripts_per_once.py b/cloudinit/transforms/cc_scripts_per_once.py
similarity index 100%
rename from cloudinit/handlers/cc_scripts_per_once.py
rename to cloudinit/transforms/cc_scripts_per_once.py
diff --git a/cloudinit/handlers/cc_scripts_user.py b/cloudinit/transforms/cc_scripts_user.py
similarity index 100%
rename from cloudinit/handlers/cc_scripts_user.py
rename to cloudinit/transforms/cc_scripts_user.py
diff --git a/cloudinit/handlers/cc_set_hostname.py b/cloudinit/transforms/cc_set_hostname.py
similarity index 100%
rename from cloudinit/handlers/cc_set_hostname.py
rename to cloudinit/transforms/cc_set_hostname.py
diff --git a/cloudinit/handlers/cc_set_passwords.py b/cloudinit/transforms/cc_set_passwords.py
similarity index 100%
rename from cloudinit/handlers/cc_set_passwords.py
rename to cloudinit/transforms/cc_set_passwords.py
diff --git a/cloudinit/handlers/cc_ssh.py b/cloudinit/transforms/cc_ssh.py
similarity index 100%
rename from cloudinit/handlers/cc_ssh.py
rename to cloudinit/transforms/cc_ssh.py
diff --git a/cloudinit/handlers/cc_ssh_import_id.py b/cloudinit/transforms/cc_ssh_import_id.py
similarity index 100%
rename from cloudinit/handlers/cc_ssh_import_id.py
rename to cloudinit/transforms/cc_ssh_import_id.py
diff --git a/cloudinit/handlers/cc_timezone.py b/cloudinit/transforms/cc_timezone.py
similarity index 100%
rename from cloudinit/handlers/cc_timezone.py
rename to cloudinit/transforms/cc_timezone.py
diff --git a/cloudinit/handlers/cc_update_etc_hosts.py b/cloudinit/transforms/cc_update_etc_hosts.py
similarity index 100%
rename from cloudinit/handlers/cc_update_etc_hosts.py
rename to cloudinit/transforms/cc_update_etc_hosts.py
diff --git a/cloudinit/handlers/cc_update_hostname.py b/cloudinit/transforms/cc_update_hostname.py
similarity index 100%
rename from cloudinit/handlers/cc_update_hostname.py
rename to cloudinit/transforms/cc_update_hostname.py

From 05a5373c8cd109d7504b7df45d0225b65e2fedee Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:35:38 -0700
Subject: [PATCH 088/434] Moved the user_data directory back to a user_data.py
 and made a handler subdir for just the internal handlers.

---
 cloudinit/{user_data => handlers}/cloud_config.py | 0
 cloudinit/{user_data => handlers}/shell_script.py | 0
 cloudinit/{user_data => handlers}/upstart_job.py  | 0
 3 files changed, 0 insertions(+), 0 deletions(-)
 rename cloudinit/{user_data => handlers}/cloud_config.py (100%)
 rename cloudinit/{user_data => handlers}/shell_script.py (100%)
 rename cloudinit/{user_data => handlers}/upstart_job.py (100%)

diff --git a/cloudinit/user_data/cloud_config.py b/cloudinit/handlers/cloud_config.py
similarity index 100%
rename from cloudinit/user_data/cloud_config.py
rename to cloudinit/handlers/cloud_config.py
diff --git a/cloudinit/user_data/shell_script.py b/cloudinit/handlers/shell_script.py
similarity index 100%
rename from cloudinit/user_data/shell_script.py
rename to cloudinit/handlers/shell_script.py
diff --git a/cloudinit/user_data/upstart_job.py b/cloudinit/handlers/upstart_job.py
similarity index 100%
rename from cloudinit/user_data/upstart_job.py
rename to cloudinit/handlers/upstart_job.py

From ff0adc4337192c4955b7f8c2d2950ffcb8d62b53 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:36:07 -0700
Subject: [PATCH 089/434] This provides a nice little utility class that avoids
 the python config parser throwing when options + values are being added to
 unknown sections since it handles the creation and checking that those
 sections exist before the option is added. Also it adds a little helper that
 can turn that config into a string.

---
 cloudinit/cfg.py | 72 ++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 72 insertions(+)
 create mode 100644 cloudinit/cfg.py

diff --git a/cloudinit/cfg.py b/cloudinit/cfg.py
new file mode 100644
index 00000000..dd8f7baf
--- /dev/null
+++ b/cloudinit/cfg.py
@@ -0,0 +1,72 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+import io
+
+from ConfigParser import (NoSectionError, NoOptionError, RawConfigParser)
+
+
+class DefaultingConfigParser(RawConfigParser):
+    DEF_INT = 0
+    DEF_FLOAT = 0.0
+    DEF_BOOLEAN = False
+    DEF_BASE = None
+
+    def get(self, section, option):
+        value = self.DEF_BASE
+        try:
+            value = RawConfigParser.get(self, section, option)
+        except NoSectionError:
+            pass
+        except NoOptionError:
+            pass
+        return value
+
+    def set(self, section, option, value):
+        if not self.has_section(section) and section.lower() != 'default':
+            self.add_section(section)
+        RawConfigParser.set(self, section, option, value)
+
+    def remove_option(self, section, option):
+        if self.has_option(section, option):
+            RawConfigParser.remove_option(self, section, option)
+
+    def getboolean(self, section, option):
+        if not self.has_option(section, option):
+            return self.DEF_BOOLEAN
+        return RawConfigParser.getboolean(self, section, option)
+
+    def getfloat(self, section, option):
+        if not self.has_option(section, option):
+            return self.DEF_FLOAT
+        return RawConfigParser.getfloat(self, section, option)
+
+    def getint(self, section, option):
+        if not self.has_option(section, option):
+            return self.DEF_INT
+        return RawConfigParser.getint(self, section, option)
+
+    def stringify(self, header=None):
+        contents = ''
+        with io.BytesIO() as outputstream:
+            self.write(outputstream)
+            outputstream.flush()
+            contents = outputstream.getvalue()
+            if header:
+                contents = "\n".join([header, contents])
+        return contents

From 71ae0da5833ef68447668a30808d1d5b3cb5fb62 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:37:17 -0700
Subject: [PATCH 090/434] Added a new transform that can be used to show an
 initial welcome message to users. It is similar to the final msg one, but is
 used at the start of cloud init instead.

---
 cloudinit/transforms/cc_welcome.py | 64 ++++++++++++++++++++++++++++++
 templates/welcome_msg.tmpl         | 15 +++++++
 2 files changed, 79 insertions(+)
 create mode 100644 cloudinit/transforms/cc_welcome.py
 create mode 100644 templates/welcome_msg.tmpl

diff --git a/cloudinit/transforms/cc_welcome.py b/cloudinit/transforms/cc_welcome.py
new file mode 100644
index 00000000..0db71125
--- /dev/null
+++ b/cloudinit/transforms/cc_welcome.py
@@ -0,0 +1,64 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+from cloudinit.settings import PER_ALWAYS
+
+from cloudinit import templater
+from cloudinit import util
+from cloudinit import version
+
+import sys
+
+welcome_message_def = ("Cloud-init v. {{version}} starting stage {{stage}} at "
+                       "{{timestamp}}. Up {{uptime}} seconds.")
+
+
+frequency = PER_ALWAYS
+
+
+def handle(name, cfg, cloud, log, args):
+
+    welcome_msg = util.get_cfg_option_str(cfg, "welcome_msg"):
+    if not welcome_msg:
+        tpl_fn = cloud.get_template_filename("welcome_msg")
+        if tpl_fn:
+            welcome_msg = util.load_file(tpl_fn)
+
+    if not welcome_msg:
+        welcome_msg = welcome_message_def
+
+    stage = "??"
+    if args:
+        stage = args[0]
+
+    tpl_params = {
+        'stage': stage,
+        'version': version.version_string(),
+        'uptime': util.uptime(),
+        'timestamp', util.time_rfc2822(),
+    }
+    try:
+        contents = templater.render_string(welcome_msg, tpl_params)
+        # TODO use log or sys.stderr??
+        sys.stderr.write("%s\n" % (contents))
+    except:
+        util.logexc(log, "Failed to render welcome message template")
diff --git a/templates/welcome_msg.tmpl b/templates/welcome_msg.tmpl
new file mode 100644
index 00000000..999202cc
--- /dev/null
+++ b/templates/welcome_msg.tmpl
@@ -0,0 +1,15 @@
+             _
+           _( )_
+          (     )
+         (_______)
+    _     \ \ \ \
+  _( )_        _
+ (     )     _( )_
+(_______)   (     )
+ \ \ \ \   (_______)
+            \ \ \ \
+
+Cloud-init v. {{version}}
+Starting stage: {{stage}} on {{timestamp}}
+System uptime: {{uptime}} seconds
+--

From a2a0bb8998e818444bfcecf1981d715a51281a07 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:38:32 -0700
Subject: [PATCH 091/434] Moved the common user data classes and functionality
 back to this file since for now it seems to make organizational sense to put
 it here.

---
 cloudinit/user_data.py | 383 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 383 insertions(+)
 create mode 100644 cloudinit/user_data.py

diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
new file mode 100644
index 00000000..64fc2734
--- /dev/null
+++ b/cloudinit/user_data.py
@@ -0,0 +1,383 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+
+import email
+import glob
+import os
+from email.mime.base import MIMEBase
+from email.mime.multipart import MIMEMultipart
+from email.mime.text import MIMEText
+
+from cloudinit import importer
+from cloudinit import log as logging
+from cloudinit import url_helper
+from cloudinit import util
+from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE, FREQUENCIES)
+
+LOG = logging.getLogger(__name__)
+
+# Special content types that signal the start and end of processing
+CONTENT_END = "__end__"
+CONTENT_START = "__begin__"
+CONTENT_SIGNALS = [CONTENT_START, CONTENT_END]
+
+# Used when a part-handler type is encountered
+# to allow for registration of new types.
+PART_CONTENT_TYPES = ["text/part-handler"]
+PART_HANDLER_FN_TMPL = 'part-handler-%03d'
+
+# For parts without filenames
+PART_FN_TPL = 'part-%03d'
+
+# Used as the content type when a message is not multipart
+# and it doesn't contain its own content-type
+NOT_MULTIPART_TYPE = "text/x-not-multipart"
+OCTET_TYPE = 'application/octet-stream'
+
+# Maps different file beginnings to their content type
+INCLUSION_TYPES_MAP = {
+    '#include': 'text/x-include-url',
+    '#include-once': 'text/x-include-once-url',
+    '#!': 'text/x-shellscript',
+    '#cloud-config': 'text/cloud-config',
+    '#upstart-job': 'text/upstart-job',
+    '#part-handler': 'text/part-handler',
+    '#cloud-boothook': 'text/cloud-boothook',
+    '#cloud-config-archive': 'text/cloud-config-archive',
+}
+
+# Sorted longest first
+INCLUSION_SRCH = sorted(INCLUSION_TYPES_MAP.keys(), key=(lambda e: 0 - len(e)))
+
+# Various special content types
+TYPE_NEEDED = ["text/plain", "text/x-not-multipart"]
+INCLUDE_TYPES = ['text/x-include-url', 'text/x-include-once-url']
+ARCHIVE_TYPES = ["text/cloud-config-archive"]
+UNDEF_TYPE = "text/plain"
+ARCHIVE_UNDEF_TYPE = "text/cloud-config"
+OCTET_TYPE = 'application/octet-stream'
+
+# Msg header used to track attachments
+ATTACHMENT_FIELD = 'Number-Attachments'
+
+
+class UserDataProcessor(object):
+    """Expands a raw user-data blob into a single MIME multipart message."""
+    def __init__(self, paths):
+        self.paths = paths
+
+    def process(self, blob):
+        base_msg = convert_string(blob)
+        process_msg = MIMEMultipart()
+        self._process_msg(base_msg, process_msg)
+        return process_msg
+
+    def _process_msg(self, base_msg, append_msg):
+        """Walk base_msg, attaching its expanded parts to append_msg."""
+        for part in base_msg.walk():
+            # multipart/* are just containers
+            if part.get_content_maintype() == 'multipart':
+                continue
+
+            ctype = None
+            ctype_orig = part.get_content_type()
+            payload = part.get_payload(decode=True)
+            if not ctype_orig:
+                ctype_orig = UNDEF_TYPE
+
+            # Plain/untyped parts get their type from how the payload begins
+            if ctype_orig in TYPE_NEEDED:
+                ctype = type_from_starts_with(payload)
+            if ctype is None:
+                ctype = ctype_orig
+
+            if ctype in INCLUDE_TYPES:
+                self._do_include(payload, append_msg)
+                continue
+
+            if ctype in ARCHIVE_TYPES:
+                self._explode_archive(payload, append_msg)
+                continue
+
+            # Tag the part itself (not its container) with the final type
+            if 'Content-Type' in part:
+                part.replace_header('Content-Type', ctype)
+            else:
+                part['Content-Type'] = ctype
+            self._attach_part(append_msg, part)
+
+    def _get_include_once_filename(self, entry):
+        cache_dir = os.path.join(self.paths.get_ipath_cur('data'), 'urlcache')
+        return os.path.join(cache_dir, util.hash_blob(entry, 'md5', 64))
+
+    def _do_include(self, content, append_msg):
+        """Fetch each url listed in content (one per line, '#include <url>'
+        is also supported) and process the fetched data as user-data."""
+        for line in content.splitlines():
+            includeonce = False
+            if line in ("#include", "#include-once"):
+                continue
+            if line.startswith("#include-once"):
+                line = line[len("#include-once"):].lstrip()
+                includeonce = True
+            elif line.startswith("#include"):
+                line = line[len("#include"):].lstrip()
+            if line.startswith("#"):
+                continue
+            include_url = line.strip()
+            if not include_url:
+                continue
+
+            cache_fn = self._get_include_once_filename(include_url)
+            if includeonce and os.path.isfile(cache_fn):
+                fetched = util.load_file(cache_fn)
+            else:
+                (fetched, st) = url_helper.readurl(include_url)
+                if not url_helper.ok_http_code(st):
+                    fetched = ''
+                elif includeonce:
+                    util.write_file(cache_fn, fetched, mode=0o600)
+
+            new_msg = convert_string(fetched)
+            self._process_msg(new_msg, append_msg)
+
+    def _explode_archive(self, archive, append_msg):
+        """Attach every entry of a yaml cloud-config-archive to append_msg."""
+        entries = util.load_yaml(archive, default=[], allowed=[list, set])
+        for ent in entries:
+            # ent can be one of:
+            #  dict { 'filename' : 'value', 'content' :
+            #       'value', 'type' : 'value' }
+            #    filename and type may not be present
+            # or
+            #  scalar(payload)
+            if isinstance(ent, (str, basestring)):
+                ent = {'content': ent}
+            if not isinstance(ent, (dict)):
+                # TODO raise?
+                continue
+            content = ent.get('content', '')
+            mtype = ent.get('type')
+            if not mtype:
+                mtype = type_from_starts_with(content, ARCHIVE_UNDEF_TYPE)
+
+            maintype, subtype = mtype.split('/', 1)
+            if maintype == "text":
+                msg = MIMEText(content, _subtype=subtype)
+            else:
+                msg = MIMEBase(maintype, subtype)
+                msg.set_payload(content)
+
+            if 'filename' in ent:
+                msg.add_header('Content-Disposition', 'attachment',
+                               filename=ent['filename'])
+
+            for header in ent.keys():
+                if header in ('content', 'filename', 'type'):
+                    continue
+                msg.add_header(header, ent[header])
+
+            self._attach_part(append_msg, msg)
+
+    def _multi_part_count(self, outer_msg, new_count=None):
+        """
+        Return the attachment count kept in the 'Number-Attachments' header
+        of outer_msg, first storing new_count there when one is given.
+        """
+        if ATTACHMENT_FIELD not in outer_msg:
+            outer_msg[ATTACHMENT_FIELD] = '0'
+
+        if new_count is not None:
+            outer_msg.replace_header(ATTACHMENT_FIELD, str(new_count))
+
+        fetched_count = 0
+        try:
+            fetched_count = int(outer_msg.get(ATTACHMENT_FIELD))
+        except (ValueError, TypeError):
+            outer_msg.replace_header(ATTACHMENT_FIELD, str(fetched_count))
+        return fetched_count
+
+    def _attach_part(self, outer_msg, part):
+        """
+        Attach a part to an outer message. outer_msg must be a MIMEMultipart.
+        Updates the header that tracks the number of attachments.
+        """
+        cur = self._multi_part_count(outer_msg)
+        if not part.get_filename():
+            fn = PART_FN_TPL % (cur + 1)
+            part.add_header('Content-Disposition', 'attachment', filename=fn)
+        outer_msg.attach(part)
+        self._multi_part_count(outer_msg, cur + 1)
+
+
+class PartHandler(object):
+    def __init__(self, frequency, version=2):
+        self.handler_version = version
+        self.frequency = frequency
+
+    def __repr__(self):
+        return "%s: [%s]" % (util.obj_name(self), self.list_types())
+
+    def list_types(self):
+        raise NotImplementedError()
+
+    def handle_part(self, data, ctype, filename, payload, frequency):
+        return self._handle_part(data, ctype, filename, payload, frequency)
+
+    def _handle_part(self, data, ctype, filename, payload, frequency):
+        raise NotImplementedError()
+
+
+def fixup_module(mod, def_freq=PER_INSTANCE):
+    if not hasattr(mod, "handler_version"):
+        setattr(mod, "handler_version", 1)
+    if not hasattr(mod, 'list_types'):
+        def empty_types():
+            return []
+        setattr(mod, 'list_types', empty_types)
+    if not hasattr(mod, 'frequency'):
+        setattr(mod, 'frequency', def_freq)
+    else:
+        freq = mod.frequency
+        if freq and freq not in FREQUENCIES:
+            LOG.warn("Module %s has an unknown frequency %s", mod, freq)
+    if not hasattr(mod, 'handle_part'):
+        def empty_handler(_data, _ctype, _filename, _payload):
+            pass
+        setattr(mod, 'handle_part', empty_handler)
+    return mod
+
+
+def run_part(mod, data, ctype, filename, payload, frequency):
+    """Call mod.handle_part when frequencies allow, logging any failure."""
+    mod_freq = mod.frequency
+    if not (mod_freq == PER_ALWAYS or
+            (frequency == PER_INSTANCE and mod_freq == PER_INSTANCE)):
+        return
+    mod_ver = mod.handler_version
+    try:
+        if mod_ver == 1:
+            mod.handle_part(data, ctype, filename, payload)
+        else:
+            mod.handle_part(data, ctype, filename, payload, frequency)
+    except Exception:
+        util.logexc(LOG, ("Failed calling mod %s (%s, %s, %s)"
+                          " with frequency %s"),
+                    mod, ctype, filename, mod_ver, frequency)
+
+
+def call_begin(mod, data, frequency):
+    run_part(mod, data, CONTENT_START, None, None, frequency)
+
+
+def call_end(mod, data, frequency):
+    run_part(mod, data, CONTENT_END, None, None, frequency)
+
+
+def walker_handle_handler(pdata, _ctype, _filename, payload):
+    """Write out a part-handler payload as a module, then register it."""
+    curcount = pdata['handlercount']
+    modname = PART_HANDLER_FN_TMPL % (curcount)
+    frequency = pdata['frequency']
+    # modname never carries an extension, so always add the python one
+    modfname = os.path.join(pdata['handlerdir'], "%s.py" % (modname))
+    # TODO: Check if path exists??
+    util.write_file(modfname, payload, 0o600)
+    handlers = pdata['handlers']
+    try:
+        mod = fixup_module(importer.import_module(modname))
+        handlers.register(mod)
+        call_begin(mod, pdata['data'], frequency)
+        pdata['handlercount'] = curcount + 1
+    except Exception:
+        util.logexc(LOG, "Failed at registered python file: %s", modfname)
+
+
+def walker_callback(pdata, ctype, filename, payload):
+    if ctype in PART_CONTENT_TYPES:
+        walker_handle_handler(pdata, ctype, filename, payload)
+        return
+    handlers = pdata['handlers']
+    if ctype not in handlers:
+        if ctype == NOT_MULTIPART_TYPE:
+            # Extract the first line or 24 bytes for displaying in the log
+            start = payload.split("\n", 1)[0][:24]
+            if start < payload:
+                details = "starting '%s...'" % start.encode("string-escape")
+            else:
+                details = repr(payload)
+            LOG.warning("Unhandled non-multipart userdata: %s", details)
+        return
+    run_part(handlers[ctype], pdata['data'], ctype, filename,
+             payload, pdata['frequency'])
+
+
+# Callback is a function that will be called with 
+# (data, content_type, filename, payload)
+def walk(msg, callback, data):
+    partnum = 0
+    for part in msg.walk():
+        # multipart/* are just containers
+        if part.get_content_maintype() == 'multipart':
+            continue
+
+        ctype = part.get_content_type()
+        if ctype is None:
+            ctype = OCTET_TYPE
+
+        filename = part.get_filename()
+        if not filename:
+            filename = PART_FN_TPL % (partnum)
+
+        callback(data, ctype, filename, part.get_payload(decode=True))
+        partnum = partnum + 1
+
+
+# Converts a raw string into a mime message
+def convert_string(raw_data, headers=None):
+    """Build a mime message from raw_data, applying headers on top of it."""
+    headers = headers or {}
+    data = util.decomp_str(raw_data or '')
+    if "mime-version:" in data[0:4096].lower():
+        msg = email.message_from_string(data)
+    else:
+        mtype = headers.get("Content-Type", NOT_MULTIPART_TYPE)
+        maintype, subtype = mtype.split("/", 1)
+        # MIMEBase only accepts content-type params, not message headers
+        msg = MIMEBase(maintype, subtype)
+        msg.set_payload(data)
+    # Caller supplied headers win over whatever the message already has
+    for (key, val) in headers.items():
+        if key in msg:
+            msg.replace_header(key, val)
+        else:
+            msg[key] = val
+    return msg
+
+
+def type_from_starts_with(payload, default=None):
+    for text in INCLUSION_SRCH:
+        if payload.startswith(text):
+            return INCLUSION_TYPES_MAP[text]
+    return default
+

From 65fd2978925b1dab595dd80dd789cd283da0f0a8 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:39:42 -0700
Subject: [PATCH 092/434] Added a python file which can be used internally to
 determine the version of cloud init that is running for internal messaging,
 if desired

---
 cloudinit/version.py | 27 +++++++++++++++++++++++++++
 1 file changed, 27 insertions(+)
 create mode 100644 cloudinit/version.py

diff --git a/cloudinit/version.py b/cloudinit/version.py
new file mode 100644
index 00000000..4599910c
--- /dev/null
+++ b/cloudinit/version.py
@@ -0,0 +1,27 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+from distutils import version as vr
+
+
+def version():
+    return vr.StrictVersion("0.7.0")
+
+
+def version_string():
+    return str(version())

From a6304508dd5f84c0f69144afcfeebfcb4aadf2ad Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:39:54 -0700
Subject: [PATCH 093/434] Added a hosts template file (in tempita format) that
 provides the base of a "/etc/hosts" file for rhel like systems.

---
 templates/hosts.redhat.tmpl | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100644 templates/hosts.redhat.tmpl

diff --git a/templates/hosts.redhat.tmpl b/templates/hosts.redhat.tmpl
new file mode 100644
index 00000000..cfc40668
--- /dev/null
+++ b/templates/hosts.redhat.tmpl
@@ -0,0 +1,22 @@
+{{# This file /etc/cloud/templates/hosts.tmpl is only utilized
+    if enabled in cloud-config.  Specifically, in order to enable it
+    you need to add the following to config:
+      manage_etc_hosts: True}}
+# 
+# Your system has configured 'manage_etc_hosts' as True.
+# As a result, if you wish for changes to this file to persist
+# then you will need to either
+# a.) make changes to the master file in /etc/cloud/templates/hosts.tmpl
+# b.) change or remove the value of 'manage_etc_hosts' in
+#     /etc/cloud/cloud.cfg or cloud-config from user-data
+# 
+# The following lines are desirable for IPv4 capable hosts
+127.0.0.1 {{fqdn}} {{hostname}} 
+127.0.0.1 localhost.localdomain localhost
+127.0.0.1 localhost4.localdomain4 localhost4
+
+# The following lines are desirable for IPv6 capable hosts
+::1 {{fqdn}} {{hostname}}
+::1 localhost.localdomain localhost
+::1 localhost6.localdomain6 localhost6
+

From 28301fc16c66352e0430f018363dcf7d1e931442 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:40:55 -0700
Subject: [PATCH 094/434] Renamed hosts to match the ubuntu distro. Also
 converted all the other templates to tempita format instead of the more
 complicated (and more dependent on other packages) cheetah format.

---
 templates/chef_client.rb.tmpl               |   8 +-
 templates/default-locale.tmpl               |   2 +-
 templates/{hosts.tmpl => hosts.ubuntu.tmpl} |  15 ++-
 templates/sources.list.tmpl                 | 101 ++++++++++----------
 4 files changed, 62 insertions(+), 64 deletions(-)
 rename templates/{hosts.tmpl => hosts.ubuntu.tmpl} (60%)

diff --git a/templates/chef_client.rb.tmpl b/templates/chef_client.rb.tmpl
index d3d9a922..35123ced 100644
--- a/templates/chef_client.rb.tmpl
+++ b/templates/chef_client.rb.tmpl
@@ -1,12 +1,12 @@
 log_level              :info
 log_location           "/var/log/chef/client.log"
 ssl_verify_mode        :verify_none
-validation_client_name "$validation_name"
+validation_client_name "{{validation_name}}"
 validation_key         "/etc/chef/validation.pem"
 client_key             "/etc/chef/client.pem"
-chef_server_url        "$server_url"
-environment            "$environment"
-node_name              "$node_name"
+chef_server_url        "{{server_url}}"
+environment            "{{environment}}"
+node_name              "{{node_name}}"
 json_attribs           "/etc/chef/firstboot.json"
 file_cache_path        "/var/cache/chef"
 file_backup_path       "/var/backups/chef"
diff --git a/templates/default-locale.tmpl b/templates/default-locale.tmpl
index 7940672b..5ee7e454 100644
--- a/templates/default-locale.tmpl
+++ b/templates/default-locale.tmpl
@@ -1 +1 @@
-LANG="$locale"
+LANG="{{locale}}"
diff --git a/templates/hosts.tmpl b/templates/hosts.ubuntu.tmpl
similarity index 60%
rename from templates/hosts.tmpl
rename to templates/hosts.ubuntu.tmpl
index ae120b02..9eebe971 100644
--- a/templates/hosts.tmpl
+++ b/templates/hosts.ubuntu.tmpl
@@ -1,9 +1,7 @@
-## This file (/etc/cloud/templates/hosts.tmpl) is only utilized
-## if enabled in cloud-config.  Specifically, in order to enable it
-## you need to add the following to config:
-##    manage_etc_hosts: True
-##
-## Note, double-hash commented lines will not appear in /etc/hosts
+{{# This file /etc/cloud/templates/hosts.tmpl is only utilized
+    if enabled in cloud-config.  Specifically, in order to enable it
+    you need to add the following to config:
+      manage_etc_hosts: True}}
 # 
 # Your system has configured 'manage_etc_hosts' as True.
 # As a result, if you wish for changes to this file to persist
@@ -12,8 +10,8 @@
 # b.) change or remove the value of 'manage_etc_hosts' in
 #     /etc/cloud/cloud.cfg or cloud-config from user-data
 # 
-## The value '$hostname' will be replaced with the local-hostname
-127.0.1.1 $fqdn $hostname
+# The following lines are desirable for IPv4 capable hosts
+127.0.1.1 {{fqdn}} {{hostname}}
 127.0.0.1 localhost
 
 # The following lines are desirable for IPv6 capable hosts
@@ -23,3 +21,4 @@ ff00::0 ip6-mcastprefix
 ff02::1 ip6-allnodes
 ff02::2 ip6-allrouters
 ff02::3 ip6-allhosts
+
diff --git a/templates/sources.list.tmpl b/templates/sources.list.tmpl
index f702025f..8acbd7d5 100644
--- a/templates/sources.list.tmpl
+++ b/templates/sources.list.tmpl
@@ -1,60 +1,59 @@
-\## Note, this file is written by cloud-init on first boot of an instance
-\## modifications made here will not survive a re-bundle.
-\## if you wish to make changes you can:
-\## a.) add 'apt_preserve_sources_list: true' to /etc/cloud/cloud.cfg
-\##     or do the same in user-data
-\## b.) add sources in /etc/apt/sources.list.d
-\## c.) make changes to template file /etc/cloud/templates/sources.list.tmpl
-\###
+# Note, this file is written by cloud-init on first boot of an instance
+# modifications made here will not survive a re-bundle.
+# if you wish to make changes you can:
+# a.) add 'apt_preserve_sources_list: true' to /etc/cloud/cloud.cfg
+#     or do the same in user-data
+# b.) add sources in /etc/apt/sources.list.d
+# c.) make changes to template file /etc/cloud/templates/sources.list.tmpl
 
 # See http://help.ubuntu.com/community/UpgradeNotes for how to upgrade to
 # newer versions of the distribution.
-deb $mirror $codename main
-deb-src $mirror $codename main
+deb {{mirror}} {{codename}} main
+deb-src {{mirror}} {{codename}} main
 
-\## Major bug fix updates produced after the final release of the
-\## distribution.
-deb $mirror $codename-updates main
-deb-src $mirror $codename-updates main
+# Major bug fix updates produced after the final release of the
+# distribution.
+deb {{mirror}} {{codename}}-updates main
+deb-src {{mirror}} {{codename}}-updates main
 
-\## N.B. software from this repository is ENTIRELY UNSUPPORTED by the Ubuntu
-\## team. Also, please note that software in universe WILL NOT receive any
-\## review or updates from the Ubuntu security team.
-deb $mirror $codename universe
-deb-src $mirror $codename universe
-deb $mirror $codename-updates universe
-deb-src $mirror $codename-updates universe
+# N.B. software from this repository is ENTIRELY UNSUPPORTED by the Ubuntu
+# team. Also, please note that software in universe WILL NOT receive any
+# review or updates from the Ubuntu security team.
+deb {{mirror}} {{codename}} universe
+deb-src {{mirror}} {{codename}} universe
+deb {{mirror}} {{codename}}-updates universe
+deb-src {{mirror}} {{codename}}-updates universe
 
-\## N.B. software from this repository is ENTIRELY UNSUPPORTED by the Ubuntu 
-\## team, and may not be under a free licence. Please satisfy yourself as to
-\## your rights to use the software. Also, please note that software in 
-\## multiverse WILL NOT receive any review or updates from the Ubuntu
-\## security team.
-# deb $mirror $codename multiverse
-# deb-src $mirror $codename multiverse
-# deb $mirror $codename-updates multiverse
-# deb-src $mirror $codename-updates multiverse
+# N.B. software from this repository is ENTIRELY UNSUPPORTED by the Ubuntu 
+# team, and may not be under a free licence. Please satisfy yourself as to
+# your rights to use the software. Also, please note that software in 
+# multiverse WILL NOT receive any review or updates from the Ubuntu
+# security team.
+# deb {{mirror}} {{codename}} multiverse
+# deb-src {{mirror}} {{codename}} multiverse
+# deb {{mirror}} {{codename}}-updates multiverse
+# deb-src {{mirror}} {{codename}}-updates multiverse
 
-\## Uncomment the following two lines to add software from the 'backports'
-\## repository.
-\## N.B. software from this repository may not have been tested as
-\## extensively as that contained in the main release, although it includes
-\## newer versions of some applications which may provide useful features.
-\## Also, please note that software in backports WILL NOT receive any review
-\## or updates from the Ubuntu security team.
-# deb $mirror $codename-backports main restricted universe multiverse
-# deb-src $mirror $codename-backports main restricted universe multiverse
+# Uncomment the following two lines to add software from the 'backports'
+# repository.
+# N.B. software from this repository may not have been tested as
+# extensively as that contained in the main release, although it includes
+# newer versions of some applications which may provide useful features.
+# Also, please note that software in backports WILL NOT receive any review
+# or updates from the Ubuntu security team.
+# deb {{mirror}} {{codename}}-backports main restricted universe multiverse
+# deb-src {{mirror}} {{codename}}-backports main restricted universe multiverse
 
-\## Uncomment the following two lines to add software from Canonical's
-\## 'partner' repository.
-\## This software is not part of Ubuntu, but is offered by Canonical and the
-\## respective vendors as a service to Ubuntu users.
-# deb http://archive.canonical.com/ubuntu $codename partner
-# deb-src http://archive.canonical.com/ubuntu $codename partner
+# Uncomment the following two lines to add software from Canonical's
+# 'partner' repository.
+# This software is not part of Ubuntu, but is offered by Canonical and the
+# respective vendors as a service to Ubuntu users.
+# deb http://archive.canonical.com/ubuntu {{codename}} partner
+# deb-src http://archive.canonical.com/ubuntu {{codename}} partner
 
-deb http://security.ubuntu.com/ubuntu $codename-security main
-deb-src http://security.ubuntu.com/ubuntu $codename-security main
-deb http://security.ubuntu.com/ubuntu $codename-security universe
-deb-src http://security.ubuntu.com/ubuntu $codename-security universe
-# deb http://security.ubuntu.com/ubuntu $codename-security multiverse
-# deb-src http://security.ubuntu.com/ubuntu $codename-security multiverse
+deb http://security.ubuntu.com/ubuntu {{codename}}-security main
+deb-src http://security.ubuntu.com/ubuntu {{codename}}-security main
+deb http://security.ubuntu.com/ubuntu {{codename}}-security universe
+deb-src http://security.ubuntu.com/ubuntu {{codename}}-security universe
+# deb http://security.ubuntu.com/ubuntu {{codename}}-security multiverse
+# deb-src http://security.ubuntu.com/ubuntu {{codename}}-security multiverse

From 1218acfd410e78dff2179b96106bad61a30cfae9 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:42:05 -0700
Subject: [PATCH 095/434] Updated so that pylint and pyflakes will now run over
 cloudinit/ and bin/ python files

---
 Makefile | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/Makefile b/Makefile
index 0fc6c46b..0a73f987 100644
--- a/Makefile
+++ b/Makefile
@@ -1,11 +1,13 @@
+CWD=$(shell pwd)
+PY_FILES=$(shell find cloudinit bin -name "*.py")
 
 all: test
 
 pylint:
-	pylint cloudinit
+	$(CWD)/tools/run-pylint $(PY_FILES)
 
 pyflakes:
-	pyflakes .
+	pyflakes $(PY_FILES)
 
 test:
 	nosetests tests/unittests/

From 92635ee5e170abd4e75a442bc499aa6cf5660b8f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:43:01 -0700
Subject: [PATCH 096/434] Enabled the oauth library, which seems needed for
 maas datasource.

---
 Requires | 1 +
 1 file changed, 1 insertion(+)

diff --git a/Requires b/Requires
index 6a7064af..dbf64baf 100644
--- a/Requires
+++ b/Requires
@@ -1,2 +1,3 @@
 Tempita>=0.4
 PrettyTable>=0.4
+oauth>=1.0

From 3b6745531eaf36128512bc131bdbe747ee7ac562 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:44:53 -0700
Subject: [PATCH 097/434] Continued adding more comments about what each
 section/option does. Continued adding more system info sections as needed for
 various components. Enabled the welcome transform.

---
 config/cloud.cfg | 40 +++++++++++++++++++++++++++++++++-------
 1 file changed, 33 insertions(+), 7 deletions(-)

diff --git a/config/cloud.cfg b/config/cloud.cfg
index 33feec48..f1c43f2f 100644
--- a/config/cloud.cfg
+++ b/config/cloud.cfg
@@ -1,8 +1,26 @@
-user: ubuntu
-disable_root: 1
-preserve_hostname: False
+# The top level settings are used as transforms
+# and system configuration.
 
+# This user will have its passwd adjusted
+user: ubuntu
+
+# If this is set, 'root' will not be able to ssh in and they 
+# will get a message to login instead as the above $user
+disable_root: true
+
+# This will cause the set+update hostname module to not operate (if true)
+preserve_hostname: false
+
+# Example datasource config
+# datasource: 
+#    Ec2: 
+#      metadata_urls: [ 'blah.com' ]
+#      timeout: 5 # (defaults to 50 seconds)
+#      max_wait: 10 # (defaults to 120 seconds)
+
+# The transform modules that run in the 'init' stage
 cloud_init_modules:
+ - welcome
  - bootcmd
  - resizefs
  - set_hostname
@@ -12,6 +30,7 @@ cloud_init_modules:
  - rsyslog
  - ssh
 
+ # The transform modules that run in the 'config' stage
 cloud_config_modules:
  - mounts
  - ssh-import-id
@@ -30,6 +49,7 @@ cloud_config_modules:
  - runcmd
  - byobu
 
+# The transform modules that run in the 'final' stage
 cloud_final_modules:
  - rightscale_userdata
  - scripts-per-once
@@ -40,9 +60,15 @@ cloud_final_modules:
  - phone-home
  - final-message
 
+# System and/or distro specific settings
 system_info:
-   paths:
-      cloud_dir: /var/lib/cloud/
-      templates_dir: /etc/cloud/templates/
-      upstart_dir: /etc/init/
+   # This will affect which distro class gets used
    distro: ubuntu
+   # Other config here will be given to the distro class and/or path classes
+   paths:
+      cloud_dir: "/var/lib/cloud/"
+      templates_dir: "/etc/cloud/templates/"
+      upstart_dir: "/etc/init/"
+   package_mirror: "http://archive.ubuntu.com/ubuntu"
+   availability_zone_template: "http://%(zone)s.ec2.archive.ubuntu.com/ubuntu/"
+   ssh_svcname: ssh

From 707c10341d30d5d4dfbb87e8e2006764149491f2 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:45:52 -0700
Subject: [PATCH 098/434] Instead of having the cloud pass large references to
 its constructor, this has been reduced to actual objects. Added a get
 template filename helper which can be used to locate template files for
 various handlers/transforms. Ensured that the config that we give back out is
 copied, so that it can't be modified by any 'malicious' handlers/transforms.
 Added helper method cycle_logging that can resetup logging, this is mainly
 used by the rsyslog transform.

---
 cloudinit/cloud.py | 37 +++++++++++++++++++++++++++++++------
 1 file changed, 31 insertions(+), 6 deletions(-)

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index 765e7d3a..b2dfc749 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -20,6 +20,9 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+import copy
+import os
+
 from cloudinit import distros
 from cloudinit import helpers
 from cloudinit import log as logging
@@ -28,18 +31,40 @@ LOG = logging.getLogger(__name__)
 
 
 class Cloud(object):
-    def __init__(self, datasource, paths, cfg):
+    def __init__(self, datasource, paths, cfg, distro, runners):
         self.datasource = datasource
         self.paths = paths
-        self.cfg = cfg
-        self.distro = distros.fetch(cfg, self)
-        self.runners = helpers.Runners(paths)
+        self.distro = distro
+        self._cfg = cfg
+        self._runners = runners
+
+    # If a transform manipulates logging or logging services
+    # it is typically useful to cause the logging to be
+    # setup again.
+    def cycle_logging(self):
+        logging.setupLogging(self.cfg)
+
+    @property
+    def cfg(self):
+        # Ensure that not indirectly modified
+        return copy.deepcopy(self._cfg)
 
     def run(self, name, functor, args, freq=None, clear_on_fail=False):
-        return self.runners.run(name, functor, args, freq, clear_on_fail)
+        return self._runners.run(name, functor, args, freq, clear_on_fail)
 
+    def get_template_filename(self, name):
+        fn = self.paths.template_tpl % (name)
+        if not os.path.isfile(fn):
+            LOG.warn("No template found at %s for template named %s", fn, name)
+            return None
+        return fn
+
+    # The rest of these are just useful proxies
     def get_userdata(self):
         return self.datasource.get_userdata()
+    
+    def get_instance_id(self):
+        return self.datasource.get_instance_id()
 
     def get_public_ssh_keys(self):
         return self.datasource.get_public_ssh_keys()
@@ -47,7 +72,7 @@ class Cloud(object):
     def get_locale(self):
         return self.datasource.get_locale()
 
-    def get_mirror(self):
+    def get_local_mirror(self):
         return self.datasource.get_local_mirror()
 
     def get_hostname(self, fqdn=False):

From 0475ced448db2b38da2f4300c8475817819e7275 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:48:09 -0700
Subject: [PATCH 099/434] Continued adding distro specific functionality to
 this new parent distro class as needed.

---
 cloudinit/distros/__init__.py | 133 +++++++++++++++++++++++++++++++---
 1 file changed, 123 insertions(+), 10 deletions(-)

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index f7f48d1f..90607668 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -20,26 +20,139 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import contextlib
+import abc
+import copy
 
 from cloudinit import importer
+from cloudinit import util
+
+from StringIO import StringIO
+
+# TODO: Make this via config??
+IFACE_ACTIONS = {
+    'up': ['ifup', '--all'],
+    'down': ['ifdown', '--all'],
+}
 
 
 class Distro(object):
-    def __init__(self, cloud):
-        self.cloud = cloud
 
+    __metaclass__ = abc.ABCMeta
+
+    def __init__(self, cfg, runner):
+        self._runner = runner
+        self._cfg = util.get_cfg_by_path(cfg, ('system_info', ), {})
+        self.name = self._cfg.pop("distro", 'generic')
+
+    @abc.abstractmethod
     def install_packages(self, pkglist):
         raise NotImplementedError()
 
-    def apply_network(self, settings):
+    @abc.abstractmethod
+    def _write_network(self, settings):
+        # In the future use the python-netcf
+        # to write this blob out in a distro format
         raise NotImplementedError()
 
+    def get_option(self, opt_name, default=None):
+        return self._cfg.get(opt_name, default)
 
-def fetch(cfg, cloud):
-    sys_info = cfg.get('system_info', {})
-    distro = sys_info.get('distro', 'ubuntu')
-    mod_name = "%s.%s" % (__name__, distro)
-    mod = importer.import_module(mod_name)
+    @abc.abstractmethod
+    def set_hostname(self, hostname):
+        raise NotImplementedError()
+
+    @abc.abstractmethod
+    def update_hostname(self, hostname, prev_hostname_fn):
+        raise NotImplementedError()
+
+    @abc.abstractmethod
+    def package_command(self, cmd, args=None):
+        raise NotImplementedError()
+
+    def get_package_mirror(self):
+        return self.get_option('package_mirror')
+
+    def get_paths(self):
+        paths = self.get_option("paths") or {}
+        return copy.deepcopy(paths)
+
+    def apply_network(self, settings, bring_up=True):
+        # Write it out
+        self._write_network(settings)
+        # Now try to bring them up
+        if bring_up:
+            self._interface_action('up')
+
+    @abc.abstractmethod
+    def set_timezone(self, tz):
+        raise NotImplementedError()
+
+    def _get_localhost_ip(self):
+        return "127.0.0.1"
+
+    def update_etc_hosts(self, hostname, fqdn):
+        # Format defined at
+        # http://unixhelp.ed.ac.uk/CGI/man-cgi?hosts
+        header = "# Added by cloud-init"
+        real_header = "%s on %s" % (header, util.time_rfc2822())
+        local_ip = self._get_localhost_ip()
+        hosts_line = "%s\t%s %s" % (local_ip, fqdn, hostname)
+        new_etchosts = StringIO()
+        need_write = False
+        need_change = True
+        for line in util.load_file("/etc/hosts").splitlines():
+            if line.strip().startswith(header):
+                continue
+            if not line.strip() or line.strip().startswith("#"):
+                new_etchosts.write("%s\n" % (line))
+                continue
+            split_line = [s.strip() for s in line.split()]
+            if len(split_line) < 2:
+                new_etchosts.write("%s\n" % (line))
+                continue
+            (ip, hosts) = split_line[0], split_line[1:]
+            if ip == local_ip:
+                if sorted([hostname, fqdn]) == sorted(hosts):
+                    need_change = False
+                if need_change:
+                    line = "%s\n%s" % (real_header, hosts_line)
+                    need_change = False
+                    need_write = True
+            new_etchosts.write("%s\n" % (line))
+        if need_change:
+            new_etchosts.write("%s\n%s\n" % (real_header, hosts_line))
+            need_write = True
+        if need_write:
+            contents = new_etchosts.getvalue()
+            util.write_file("/etc/hosts", contents)
+
+    def _interface_action(self, action):
+        if action not in IFACE_ACTIONS:
+            raise NotImplementedError("Unknown interface action %s" % (action))
+        cmd = IFACE_ACTIONS[action]
+        try:
+            LOG.info("Attempting to run %s interface action using command %s",
+                     action, cmd)
+            (_out, err) = util.subp(cmd)
+            if len(err):
+                LOG.warn("Running %s resulted in stderr output: %s",
+                         IF_UP_CMD, err)
+            return True
+        except util.ProcessExecutionError as exc:
+            util.logexc(LOG, "Running %s failed", cmd)
+            return False
+
+
+def fetch(distro_name, mods=(__name__, )):
+    mod = None
+    for m in mods:
+        try:
+            mod_name = "%s.%s" % (m, distro_name)
+            mod = importer.import_module(mod_name)
+        except RuntimeError:
+            pass
+    if not mod:
+        raise RuntimeError("No distribution found for distro %s" % (distro_name))
     distro_cls = getattr(mod, 'Distro')
-    return distro_cls(cloud)
\ No newline at end of file
+    return distro_cls
+    

From f84615d505b1732e9af8354228be8dbd5760a1e4 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:49:02 -0700
Subject: [PATCH 100/434] Change variable names to reflect usage correctly

---
 cloudinit/templater.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/cloudinit/templater.py b/cloudinit/templater.py
index 5839911c..41315adf 100644
--- a/cloudinit/templater.py
+++ b/cloudinit/templater.py
@@ -29,9 +29,9 @@ def render_from_file(fn, params):
     return render_string(util.load_file(fn), params, name=fn)
 
 
-def render_to_file(name, outfile, params):
-    contents = render_from_file(name, params)
-    util.write_file(outfile, contents)
+def render_to_file(fn, outfn, params):
+    contents = render_from_file(fn, params)
+    util.write_file(outfn, contents)
 
 
 def render_string(content, params, name=None):

From d20aba320691ccf1946d2197b2a9722e39d0f497 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:49:28 -0700
Subject: [PATCH 101/434] Moved as many distro specific actions to here as
 should be needed. Mainly this is the following:

1. Hostname updating
2. Package command invocation
3. Network settings writings
4. Timezone setting (needs cleanup)
---
 cloudinit/distros/ubuntu.py | 81 +++++++++++++++++++++++++++++++++----
 1 file changed, 73 insertions(+), 8 deletions(-)

diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index ccf2cec4..b8aff03c 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -20,36 +20,101 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+from StringIO import StringIO
+
 import os
+import socket
 
 from cloudinit import distros
 from cloudinit import log as logging
+from cloudinit import templater
 from cloudinit import util
 
 from cloudinit.settings import (PER_INSTANCE)
 
-
 LOG = logging.getLogger(__name__)
 
 
 class Distro(distros.Distro):
 
     def install_packages(self, pkglist):
-        self.update_package_sources()
-        self.apt_get('install', pkglist)
+        self._update_package_sources()
+        self._apt_get('install', pkglist)
 
-    def apply_network(self, settings):
+    def _write_network(self, settings):
         util.write_file("/etc/network/interfaces", settings)
 
+    def package_command(self, command, args=None):
+        self._apt_get(command, args)
+
+    def set_hostname(self, hostname):
+        util.write_file("/etc/hostname", "%s\n" % hostname, 0644)
+        LOG.debug("Setting hostname to %s", hostname)
+        util.subp(['hostname', hostname])
+
+    def update_hostname(self, hostname, prev_file):
+        hostname_prev = None 
+        prev_name = self._read_hostname(prev_file)
+        hostname_in_etc = self._read_hostname("/etc/hostname")
+        update_files = []
+        if not hostname_prev or hostname_prev != hostname:
+            update_files.append(prev_file)
+        if (not hostname_in_etc or
+           (hostname_in_etc == hostname_prev and hostname_in_etc != hostname)):
+            update_files.append("/etc/hostname")
+        for fn in update_files:
+            try:
+                util.write_file(fn, "%s\n" % hostname, 0644)
+            except:
+                util.logexc(LOG, "Failed to write hostname %s to %s", hostname, fn)
+        if hostname_in_etc and hostname_prev and hostname_in_etc != hostname_prev:
+             LOG.debug(("%s differs from /etc/hostname."
+                        " Assuming user maintained hostname."), prev_file)
+        if "/etc/hostname" in update_files:
+            LOG.debug("Setting hostname to %s", hostname)
+            util.subp(['hostname', hostname])
+
+    def _read_hostname(filename, default=None):
+        contents = util.load_file(filename, quiet=True)
+        for line in contents.splitlines():
+            hpos = line.find("#")
+            if hpos != -1:
+                line = line[0:hpos]
+            line = line.rstrip()
+            if line:
+                return line
+        return default
+
+    def _get_localhost_ip(self):
+        # Note: http://www.leonardoborda.com/blog/127-0-1-1-ubuntu-debian/
+        return "127.0.1.1"
+
+    def set_timezone(self, tz):
+        tz_file = os.path.join("/usr/share/zoneinfo", tz)
+        if not os.path.isfile(tz_file):
+            raise Exception("Invalid timezone %s, no file found at %s" % (tz, tz_file))
+        tz_contents = "%s\n" % tz
+        util.write_file("/etc/timezone", tz_contents)
+        # TODO, this should be in a rhel distro subclass??
+        if os.path.exists("/etc/sysconfig/clock"):
+            tz_contents = '"%s"\n' % tz
+            util.write_file("/etc/sysconfig/clock", tz_contents)
+        # This ensures that the correct tz will be used for the system
+        util.copy(tz_file, "/etc/localtime")
+
+    def name(self):
+        return "ubuntu"
+
     # apt_get top level command (install, update...), and args to pass it
-    def apt_get(self, tlc, args=None):
+    def _apt_get(self, tlc, args=None):
         e = os.environ.copy()
         e['DEBIAN_FRONTEND'] = 'noninteractive'
         cmd = ['apt-get', '--option', 'Dpkg::Options::=--force-confold',
                '--assume-yes', tlc]
         if args:
             cmd.extend(args)
-        util.subp(cmd, env=e)
+        # Allow the output of this to flow outwards (ie not be captured)
+        util.subp(cmd, env=e, capture=False)
 
-    def update_package_sources(self):
-        self.cloud.run("update-sources", self.apt_get, ["update"], freq=PER_INSTANCE)
\ No newline at end of file
+    def _update_package_sources(self):
+        self.runner.run("update-sources", self._apt_get, ["update"], freq=PER_INSTANCE)
\ No newline at end of file

From e1b300595aa57222a30474fbd1e024f6129e7dc2 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:51:27 -0700
Subject: [PATCH 102/434] 1. Handle returning values from handlers better. 2.
 Throw lock specific exception when semaphores can't be obtained 3. Make the
 paths constructor config variable named better to its actual usage.

---
 cloudinit/helpers.py | 39 ++++++++++++++++++++++++++-------------
 1 file changed, 26 insertions(+), 13 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index e5f33a26..2ecda3e9 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -38,12 +38,16 @@ from cloudinit.user_data import upstart_job as up_part
 LOG = logging.getLogger(__name__)
 
 
+class LockFailure(Exception):
+    pass
+
+
 class DummySemaphores(object):
     def __init__(self):
         pass
 
     @contextlib.contextmanager
-    def lock(self, _name, _freq, _clear_on_fail):
+    def lock(self, _name, _freq, _clear_on_fail=False):
         yield True
 
     def has_run(self, _name, _freq):
@@ -61,7 +65,7 @@ class FileSemaphores(object):
         self.sem_path = sem_path
 
     @contextlib.contextmanager
-    def lock(self, name, freq, clear_on_fail):
+    def lock(self, name, freq, clear_on_fail=False):
         try:
             yield self._acquire(name, freq)
         except:
@@ -73,15 +77,17 @@ class FileSemaphores(object):
         sem_file = self._get_path(name, freq)
         try:
             util.del_file(sem_file)
-        except (IOError, OSError):
+        except (IOError, OSError) as e:
+            util.logexc(LOG, "Failed deleting semaphore %s", sem_file)
             return False
         return True
 
     def clear_all(self):
         try:
             util.del_dir(self.sem_path)
-        except (IOError, OSError):
-            pass
+        except (IOError, OSError) as e:
+            LOG.debug("Failed deleting semaphore directory %s due to %s",
+                      self.sem_path, e)
 
     def _acquire(self, name, freq):
         if self.has_run(name, freq):
@@ -93,7 +99,8 @@ class FileSemaphores(object):
         contents = "%s: %s\n" % (os.getpid(), time())
         try:
             util.write_file(sem_file, contents)
-        except (IOError, OSError):
+        except (IOError, OSError) as e:
+            util.logexc(LOG, "Failed writing semaphore file %s", sem_file)
             return None
         return sem_file
 
@@ -143,11 +150,14 @@ class Runners(object):
             return None
         with sem.lock(name, freq, clear_on_fail) as lk:
             if not lk:
-                raise RuntimeError("Failed to acquire lock on %s" % name)
+                raise LockFailure("Failed to acquire lock for %s" % name)
             else:
                 LOG.debug("Running %s with args %s using lock %s",
                           functor, args, lk)
-                return functor(*args)
+                if isinstance(args, (dict)):
+                    return functor(**args)
+                else:
+                    return functor(*args)
 
 
 class ContentHandlers(object):
@@ -217,12 +227,12 @@ class ContentHandlers(object):
 
 
 class Paths(object):
-    def __init__(self, sys_info):
-        self.cloud_dir = sys_info.get('cloud_dir', '/var/lib/cloud')
+    def __init__(self, path_cfgs, ds=None):
+        self.cloud_dir = path_cfgs.get('cloud_dir', '/var/lib/cloud')
         self.instance_link = os.path.join(self.cloud_dir, 'instance')
         self.boot_finished = os.path.join(self.instance_link, "boot-finished")
-        self.upstart_conf_d = sys_info.get('upstart_dir')
-        template_dir = sys_info.get('templates_dir', '/etc/cloud/templates/')
+        self.upstart_conf_d = path_cfgs.get('upstart_dir')
+        template_dir = path_cfgs.get('templates_dir', '/etc/cloud/templates/')
         self.template_tpl = os.path.join(template_dir, '%s.tmpl')
         self.seed_dir = os.path.join(self.cloud_dir, 'seed')
         self.lookups = {
@@ -237,7 +247,7 @@ class Paths(object):
            "data": "data",
         }
         # Set when a datasource becomes active
-        self.datasource = None
+        self.datasource = ds
 
     # get_ipath_cur: get the current instance path for an item
     def get_ipath_cur(self, name=None):
@@ -256,6 +266,8 @@ class Paths(object):
             cpath = os.path.join(cpath, add_on)
         return cpath
 
+    # get_ipath : get the instance path for a name in pathmap
+    # (/var/lib/cloud/instances/<instance>/<name>)
     def _get_ipath(self, name=None):
         if not self.datasource:
             return None
@@ -268,6 +280,7 @@ class Paths(object):
             ipath = os.path.join(ipath, add_on)
         return ipath
 
+    # get_ipath : get the instance path for a name in pathmap
     # (/var/lib/cloud/instances/<instance>/<name>)
     def get_ipath(self, name=None):
         ipath = self._get_ipath(name)

From 61db967999f2411366dbee815f413ec17f900c6d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:54:27 -0700
Subject: [PATCH 103/434] Ensure that the root logger is manipulated instead of
 just the cloudinit logger, show how many configs were tried if none
 succeeded, and for basic logging setup try to mirror more of what is in the
 default configuration file if all else fails

---
 cloudinit/log.py | 42 ++++++++++++++++++++++++++++++------------
 1 file changed, 30 insertions(+), 12 deletions(-)

diff --git a/cloudinit/log.py b/cloudinit/log.py
index 6e7424e1..c247eb9e 100644
--- a/cloudinit/log.py
+++ b/cloudinit/log.py
@@ -41,16 +41,27 @@ DEBUG = logging.DEBUG
 NOTSET = logging.NOTSET
 
 # Default basic format
-DEF_FORMAT = '%(levelname)s: @%(name)s : %(message)s'
+DEF_CON_FORMAT = '%(asctime)s - %(filename)s[%(levelname)s]: %(message)s'
 
 
-def setupBasicLogging(level=INFO, fmt=DEF_FORMAT):
-    root = getLogger()
-    console = logging.StreamHandler(sys.stdout)
-    console.setFormatter(logging.Formatter(fmt))
-    console.setLevel(level)
+def setupBasicLogging():
+    root = logging.getLogger()
+    # Warnings go to the console
+    console = logging.StreamHandler(sys.stderr)
+    console.setFormatter(logging.Formatter(DEF_CON_FORMAT))
+    console.setLevel(WARNING)
     root.addHandler(console)
-    root.setLevel(level)
+    # Everything else goes to this file (if we can)
+    try:
+        cfile = logging.FileHandler('/var/log/cloud-init.log')
+        cfile.setFormatter(logging.Formatter(DEF_CON_FORMAT))
+        cfile.setLevel(DEBUG)
+        root.addHandle(cfile)
+    except (IOError, OSError):
+        # Likely that you can't write to that file...
+        # Make console now have DEBUG??
+        console.setLevel(DEBUG)
+    root.setLevel(DEBUG)
 
 
 def setupLogging(cfg=None):
@@ -61,7 +72,7 @@ def setupLogging(cfg=None):
     log_cfgs = []
     log_cfg = cfg.get('logcfg')
     if log_cfg and isinstance(log_cfg, (str, basestring)):
-        # Ff there is a 'logcfg' entry in the config,
+        # If there is a 'logcfg' entry in the config,
         # respect it, it is the old keyname
         log_cfgs.append(str(log_cfg))
     elif "log_cfgs" in cfg and isinstance(cfg['log_cfgs'], (set, list)):
@@ -73,20 +84,27 @@ def setupLogging(cfg=None):
                 log_cfgs.append(str(a_cfg))
 
     # See if any of them actually load...
+    am_tried = 0
     am_worked = 0
     for log_cfg in log_cfgs:
         try:
-            if not os.path.isfile(log_cfg):
+            am_tried += 1
+            # Assume it's just a string if not a filename
+            if log_cfg.startswith("/") and os.path.isfile(log_cfg):
+                pass
+            else:
                 log_cfg = StringIO(log_cfg)
+            # Attempt to load its config
             logging.config.fileConfig(log_cfg)
             am_worked += 1
         except Exception:
             pass
 
-    # If it didn't work, at least setup a basic logger
+    # If it didn't work, at least setup a basic logger (if desired)
     basic_enabled = cfg.get('log_basic', True)
     if not am_worked:
-        sys.stderr.write("Warning, no logging configured!\n")
+        sys.stderr.write(("Warning, no logging configured!"
+                          " (tried %s configs)\n") % (am_tried))
         if basic_enabled:
             sys.stderr.write("Setting up basic logging...\n")
             setupBasicLogging()
@@ -105,5 +123,5 @@ except ImportError:
         def emit(self, record):
             pass
 
-logger = getLogger()
+logger = logging.getLogger()
 logger.addHandler(NullHandler())

From 204add3020c94d62ef55364eaf2a7e033f713141 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:54:52 -0700
Subject: [PATCH 104/434] Logic test on split up line length (just in case).
 Removed un-used pre debug info option, since this is not used in the
 prettytable case.

---
 cloudinit/netinfo.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/cloudinit/netinfo.py b/cloudinit/netinfo.py
index 874c2674..0d729502 100644
--- a/cloudinit/netinfo.py
+++ b/cloudinit/netinfo.py
@@ -82,7 +82,7 @@ def route_info():
         if not line:
             continue
         toks = line.split()
-        if toks[0] == "Kernel" or toks[0] == "Destination":
+        if len(toks) < 8 or toks[0] == "Kernel" or toks[0] == "Destination":
             continue
         entry = {
             'destination': toks[0],
@@ -140,9 +140,9 @@ def route_pformat():
         fields = ['Route', 'Destination', 'Gateway',
                   'Genmask', 'Interface', 'Flags']
         tbl = PrettyTable(fields)
-        for n, r in enumerate(routes):
+        for (n, r) in enumerate(routes):
             route_id = str(n)
-            tbl.add_row([str(n), r['destination'],
+            tbl.add_row([route_id, r['destination'],
                         r['gateway'], r['genmask'],
                         r['iface'], r['flags']])
         route_s = tbl.get_string()
@@ -152,7 +152,7 @@ def route_pformat():
     return os.linesep.join(lines)
 
 
-def debug_info(pre=""):
+def debug_info():
     lines = []
     lines.append(netdev_pformat())
     lines.append(route_pformat())

From 391e88b4f74bc5702da50fd78bcc164aa6b35643 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:56:10 -0700
Subject: [PATCH 105/434] Add more comments around what the settings mean, add
 in a list that can be used to check if user provided frequencies are actually
 valid or not

---
 cloudinit/settings.py | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/cloudinit/settings.py b/cloudinit/settings.py
index f58c4b52..8a1eaeb3 100644
--- a/cloudinit/settings.py
+++ b/cloudinit/settings.py
@@ -20,10 +20,17 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+# Set and read for determining the cloud config file location
 CFG_ENV_NAME = "CLOUD_CFG"
+
+# This is expected to be a yaml formatted file
 CLOUD_CONFIG = '/etc/cloud/cloud.cfg'
+
+# This legacy format is expected to be readable by
+# configobj, see http://pypi.python.org/pypi/configobj
 OLD_CLOUD_CONFIG = '/etc/ec2-init/ec2-config.cfg'
 
+# What you get if no config is provided
 CFG_BUILTIN = {
     'datasource_list': [
         'NoCloud',
@@ -45,7 +52,10 @@ CFG_BUILTIN = {
     },
 }
 
+# Valid frequencies of handlers/modules
 PER_INSTANCE = "once-per-instance"
 PER_ALWAYS = "always"
 PER_ONCE = "once"
 
+# Used to sanity check incoming handlers/modules frequencies
+FREQUENCIES = [PER_INSTANCE, PER_ALWAYS, PER_ONCE]

From bfd3dbdc8ea05abcb7b9d2b59daf7ebbba9c11a0 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:56:56 -0700
Subject: [PATCH 106/434] Split up time calculation, use logexc instead of
 log.exception

---
 cloudinit/sources/DataSourceCloudStack.py | 12 +++++++-----
 1 file changed, 7 insertions(+), 5 deletions(-)

diff --git a/cloudinit/sources/DataSourceCloudStack.py b/cloudinit/sources/DataSourceCloudStack.py
index 33fb3491..791df68f 100644
--- a/cloudinit/sources/DataSourceCloudStack.py
+++ b/cloudinit/sources/DataSourceCloudStack.py
@@ -2,9 +2,11 @@
 #
 #    Copyright (C) 2012 Canonical Ltd.
 #    Copyright (C) 2012 Cosmin Luta
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Cosmin Luta <q4break@gmail.com>
 #    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -66,7 +68,7 @@ class DataSourceCloudStack(sources.DataSource):
         if util.read_optional_seed(seed_ret, base=(self.seed_dir + "/")):
             self.userdata_raw = seed_ret['user-data']
             self.metadata = seed_ret['meta-data']
-            LOG.info("Using seeded cloudstack data from: %s", self.seed_dir)
+            LOG.debug("Using seeded cloudstack data from: %s", self.seed_dir)
             return True
         try:
             start = time.time()
@@ -74,12 +76,12 @@ class DataSourceCloudStack(sources.DataSource):
                 None, self.metadata_address)
             self.metadata = boto_utils.get_instance_metadata(self.api_ver,
                 self.metadata_address)
-            LOG.debug("Crawl of metadata service took %ds",
-                      (time.time() - start))
+            tot_time = (time.time() - start)
+            LOG.debug("Crawl of metadata service took %s", int(tot_time))
             return True
         except Exception as e:
-            LOG.exception(('Failed fetching from metadata '
-                           'service %s due to: %s'), self.metadata_address, e)
+            util.logexc(LOG, ('Failed fetching from metadata '
+                              'service %s'), self.metadata_address)
             return False
 
     def get_instance_id(self):

From 7fe94ef97845396167d3eaa9d7969060da5dd2e7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:58:38 -0700
Subject: [PATCH 107/434] Update applying network settings to use the distro
 function to handle this, use logexc instead of log.exception

---
 cloudinit/sources/DataSourceConfigDrive.py | 27 ++++++++++------------
 1 file changed, 12 insertions(+), 15 deletions(-)

diff --git a/cloudinit/sources/DataSourceConfigDrive.py b/cloudinit/sources/DataSourceConfigDrive.py
index ca4bb7cf..176b62b0 100644
--- a/cloudinit/sources/DataSourceConfigDrive.py
+++ b/cloudinit/sources/DataSourceConfigDrive.py
@@ -1,6 +1,10 @@
+# vi: ts=4 expandtab
+#
 #    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -22,6 +26,8 @@ from cloudinit import sources
 from cloudinit import util
 
 LOG = logging.getLogger(__name__)
+
+# Various defaults/constants...
 DEFAULT_IID = "iid-dsconfigdrive"
 DEFAULT_MODE = 'pass'
 CFG_DRIVE_FILES = [
@@ -33,7 +39,6 @@ DEFAULT_METADATA = {
     "instance-id": DEFAULT_IID, 
     "dsmode": DEFAULT_MODE,
 }
-IF_UP_CMD = ['ifup', '--all']
 CFG_DRIVE_DEV_ENV = 'CLOUD_INIT_CONFIG_DRIVE_DEVICE'
 
 
@@ -43,11 +48,11 @@ class DataSourceConfigDrive(sources.DataSource):
         self.seed = None
         self.cfg = {}
         self.dsmode = 'local'
-        self.seed_dir = os.path.join(self.paths.seed_dir, 'config_drive')
+        self.seed_dir = os.path.join(paths.seed_dir, 'config_drive')
 
     def __str__(self):
         mstr = "%s[%s]" % (util.obj_name(self), self.dsmode)
-        mstr = mstr + " [seed=%s]" % (self.seed)
+        mstr += " [seed=%s]" % (self.seed)
         return mstr
 
     def get_data(self):
@@ -60,8 +65,8 @@ class DataSourceConfigDrive(sources.DataSource):
                 (md, ud) = read_config_drive_dir(self.seed_dir)
                 found = self.seed_dir
             except NonConfigDriveDir:
-                LOG.exception("Failed reading config drive from %s",
-                              self.seed_dir)
+                util.logexc(LOG, "Failed reading config drive from %s",
+                            self.seed_dir)
         if not found:
             dev = find_cfg_drive_device()
             if dev:
@@ -86,15 +91,7 @@ class DataSourceConfigDrive(sources.DataSource):
                 LOG.info("Updating network interfaces from configdrive")
             else:
                 LOG.debug("Updating network interfaces from configdrive")
-
             self.distro.apply_network(md['network-interfaces'])
-            try:
-                (_out, err) = util.subp(IF_UP_CMD)
-                if len(err):
-                    LOG.warn("Running %s resulted in stderr output: %s",
-                             IF_UP_CMD, err)
-            except util.ProcessExecutionError:
-                LOG.exception("Running %s failed", IF_UP_CMD)
 
         self.seed = found
         self.metadata = md
@@ -109,7 +106,7 @@ class DataSourceConfigDrive(sources.DataSource):
     def get_public_ssh_keys(self):
         if not 'public-keys' in self.metadata:
             return []
-        return list(self.metadata['public-keys'])
+        return self.metadata['public-keys']
 
     # The data sources' config_obj is a cloud-config formated
     # object that came to it from ways other than cloud-config
@@ -226,6 +223,6 @@ datasources = [
 ]
 
 
-# Used to match classes to dependencies
+# Return a list of data sources that match this set of dependencies
 def get_datasource_list(depends):
     return sources.list_from_depends(depends, datasources)

From f6a93d74bca2cbee832a369ed3c2518f6057d157 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 17:59:12 -0700
Subject: [PATCH 108/434] Complete cleanup for refactoring/rework that makes it
 compatible with the new structure, using unified util functions, logging and
 eliminating code and calls.

---
 cloudinit/sources/DataSourceEc2.py | 229 +++++++++++++++++------------
 1 file changed, 133 insertions(+), 96 deletions(-)

diff --git a/cloudinit/sources/DataSourceEc2.py b/cloudinit/sources/DataSourceEc2.py
index 7051ecda..38be71fa 100644
--- a/cloudinit/sources/DataSourceEc2.py
+++ b/cloudinit/sources/DataSourceEc2.py
@@ -2,9 +2,11 @@
 #
 #    Copyright (C) 2009-2010 Canonical Ltd.
 #    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Scott Moser <scott.moser@canonical.com>
 #    Author: Juerg Hafliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -18,31 +20,38 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.DataSource as DataSource
-
-from cloudinit import seeddir as base_seeddir
-from cloudinit import log
-import cloudinit.util as util
-import socket
+import os
 import time
+
 import boto.utils as boto_utils
-import os.path
+
+from cloudinit import log as logging
+from cloudinit import sources
+from cloudinit import url_helper as uhelp
+from cloudinit import util
+
+LOG = logging.getLogger(__name__)
+DEF_MD_URL = "http://169.254.169.254"
+DEF_MD_VERSION = '2009-04-04'
+DEF_MD_URLS = [DEF_MD_URL, "http://instance-data:8773"]
 
 
-class DataSourceEc2(DataSource.DataSource):
-    api_ver = '2009-04-04'
-    seeddir = base_seeddir + '/ec2'
-    metadata_address = "http://169.254.169.254"
+class DataSourceEc2(sources.DataSource):
+    def __init__(self, sys_cfg, distro, paths):
+        sources.DataSource.__init__(self, sys_cfg, distro, paths)
+        self.metadata_address = DEF_MD_URL
+        self.seed_dir = os.path.join(paths.seed_dir, "ec2")
+        self.api_ver = DEF_MD_VERSION
 
     def __str__(self):
-        return("DataSourceEc2")
+        return util.obj_name(self)
 
     def get_data(self):
-        seedret = {}
-        if util.read_optional_seed(seedret, base=self.seeddir + "/"):
-            self.userdata_raw = seedret['user-data']
-            self.metadata = seedret['meta-data']
-            log.debug("using seeded ec2 data in %s" % self.seeddir)
+        seed_ret = {}
+        if util.read_optional_seed(seed_ret, base=(self.seed_dir + "/")):
+            self.userdata_raw = seed_ret['user-data']
+            self.metadata = seed_ret['meta-data']
+            LOG.debug("Using seeded ec2 data from %s", self.seed_dir)
             return True
 
         try:
@@ -53,51 +62,61 @@ class DataSourceEc2(DataSource.DataSource):
                 None, self.metadata_address)
             self.metadata = boto_utils.get_instance_metadata(self.api_ver,
                 self.metadata_address)
-            log.debug("crawl of metadata service took %ds" % (time.time() -
-                                                              start))
+            tot_time = int(time.time() - start)
+            LOG.debug("Crawl of metadata service took %s", tot_time)
             return True
-        except Exception as e:
-            print e
+        except Exception:
+            util.logexc(LOG, "Failed reading from metadata address %s",
+                        self.metadata_address)
             return False
 
     def get_instance_id(self):
-        return(self.metadata['instance-id'])
+        return self.metadata['instance-id']
 
     def get_availability_zone(self):
-        return(self.metadata['placement']['availability-zone'])
+        return self.metadata['placement']['availability-zone']
 
     def get_local_mirror(self):
-        return(self.get_mirror_from_availability_zone())
+        return self.get_mirror_from_availability_zone()
 
     def get_mirror_from_availability_zone(self, availability_zone=None):
-        # availability is like 'us-west-1b' or 'eu-west-1a'
-        if availability_zone == None:
+        # Availability is like 'us-west-1b' or 'eu-west-1a'
+        if availability_zone is None:
             availability_zone = self.get_availability_zone()
 
-        fallback = None
-
         if self.is_vpc():
-            return fallback
+            return None
 
-        try:
-            host = "%s.ec2.archive.ubuntu.com" % availability_zone[:-1]
-            socket.getaddrinfo(host, None, 0, socket.SOCK_STREAM)
-            return 'http://%s/ubuntu/' % host
-        except:
-            return fallback
+        # Use the distro to get the mirror
+        if not availability_zone:
+            return None
 
-    def wait_for_metadata_service(self):
+        mirror_tpl = self.distro.get_option('availability_zone_template')
+        if not mirror_tpl:
+            return None
+
+        tpl_params = {
+            'zone': availability_zone.strip(),
+        }
+        mirror_url = mirror_tpl % (tpl_params)
+
+        (max_wait, timeout) = self._get_url_settings()
+        worked = uhelp.wait_for_url([mirror_url], max_wait=max_wait,
+                                timeout=timeout, status_cb=LOG.warn)
+        if not worked:
+            return None
+
+        return mirror_url
+
+    def _get_url_settings(self):
         mcfg = self.ds_cfg
-
-        if not hasattr(mcfg, "get"):
+        if not mcfg:
             mcfg = {}
-
         max_wait = 120
         try:
             max_wait = int(mcfg.get("max_wait", max_wait))
         except Exception:
-            util.logexc(log)
-            log.warn("Failed to get max wait. using %s" % max_wait)
+            util.logexc(LOG, "Failed to get max wait. using %s", max_wait)
 
         if max_wait == 0:
             return False
@@ -106,91 +125,104 @@ class DataSourceEc2(DataSource.DataSource):
         try:
             timeout = int(mcfg.get("timeout", timeout))
         except Exception:
-            util.logexc(log)
-            log.warn("Failed to get timeout, using %s" % timeout)
+            util.logexc(LOG, "Failed to get timeout, using %s", timeout)
+        return (max_wait, timeout)
 
-        def_mdurls = ["http://169.254.169.254", "http://instance-data:8773"]
-        mdurls = mcfg.get("metadata_urls", def_mdurls)
+    def wait_for_metadata_service(self):
+        mcfg = self.ds_cfg
+        if not mcfg:
+            mcfg = {}
+
+        (max_wait, timeout) = self._get_url_settings()
 
         # Remove addresses from the list that wont resolve.
+        mdurls = mcfg.get("metadata_urls", DEF_MD_URLS)
         filtered = [x for x in mdurls if util.is_resolvable_url(x)]
 
         if set(filtered) != set(mdurls):
-            log.debug("removed the following from metadata urls: %s" %
-                list((set(mdurls) - set(filtered))))
+            LOG.debug("Removed the following from metadata urls: %s",
+                      list((set(mdurls) - set(filtered))))
 
         if len(filtered):
             mdurls = filtered
         else:
-            log.warn("Empty metadata url list! using default list")
-            mdurls = def_mdurls
+            LOG.warn("Empty metadata url list! using default list")
+            mdurls = DEF_MD_URLS
 
         urls = []
-        url2base = {False: False}
+        url2base = {}
         for url in mdurls:
             cur = "%s/%s/meta-data/instance-id" % (url, self.api_ver)
             urls.append(cur)
             url2base[cur] = url
 
         starttime = time.time()
-        url = util.wait_for_url(urls=urls, max_wait=max_wait,
-                                timeout=timeout, status_cb=log.warn)
+        url = uhelp.wait_for_url(urls=urls, max_wait=max_wait,
+                                timeout=timeout, status_cb=LOG.warn)
 
         if url:
-            log.debug("Using metadata source: '%s'" % url2base[url])
+            LOG.info("Using metadata source: '%s'", url2base[url])
         else:
-            log.critical("giving up on md after %i seconds\n" %
-                         int(time.time() - starttime))
+            LOG.critical("Giving up on md from %s after %i seconds",
+                            urls, int(time.time() - starttime))
 
-        self.metadata_address = url2base[url]
-        return (bool(url))
-
-    def device_name_to_device(self, name):
-        # consult metadata service, that has
-        #  ephemeral0: sdb
-        # and return 'sdb' for input 'ephemeral0'
-        if 'block-device-mapping' not in self.metadata:
-            return(None)
-
-        found = None
-        for entname, device in self.metadata['block-device-mapping'].items():
-            if entname == name:
-                found = device
-                break
-            # LP: #513842 mapping in Euca has 'ephemeral' not 'ephemeral0'
-            if entname == "ephemeral" and name == "ephemeral0":
-                found = device
-        if found == None:
-            log.debug("unable to convert %s to a device" % name)
-            return None
+        self.metadata_address = url2base.get(url)
+        return bool(url)
 
+    def _remap_device(self, short_name):
         # LP: #611137
         # the metadata service may believe that devices are named 'sda'
         # when the kernel named them 'vda' or 'xvda'
         # we want to return the correct value for what will actually
         # exist in this instance
         mappings = {"sd": ("vd", "xvd")}
-        ofound = found
-        short = os.path.basename(found)
-
-        if not found.startswith("/"):
-            found = "/dev/%s" % found
-
-        if os.path.exists(found):
-            return(found)
-
-        for nfrom, tlist in mappings.items():
-            if not short.startswith(nfrom):
+        for (nfrom, tlist) in mappings.iteritems():
+            if not short_name.startswith(nfrom):
                 continue
             for nto in tlist:
-                cand = "/dev/%s%s" % (nto, short[len(nfrom):])
+                cand = "/dev/%s%s" % (nto, short_name[len(nfrom):])
                 if os.path.exists(cand):
-                    log.debug("remapped device name %s => %s" % (found, cand))
-                    return(cand)
+                    return cand
+        return None
 
-        # on t1.micro, ephemeral0 will appear in block-device-mapping from
+    def device_name_to_device(self, name):
+        # Consult metadata service, that has
+        #  ephemeral0: sdb
+        # and return 'sdb' for input 'ephemeral0'
+        if 'block-device-mapping' not in self.metadata:
+            return None
+
+        # Example:
+        # 'block-device-mapping': 
+        # {'ami': '/dev/sda1',
+        # 'ephemeral0': '/dev/sdb',
+        # 'root': '/dev/sda1'}
+        found = None
+        for (entname, device) in self.metadata['block-device-mapping'].items():
+            if entname == name:
+                found = device
+                break
+            # LP: #513842 mapping in Euca has 'ephemeral' not 'ephemeral0'
+            if entname == "ephemeral" and name == "ephemeral0":
+                found = device
+        if found is None:
+            LOG.debug("Unable to convert %s to a device", name)
+            return None
+
+        ofound = found
+        if not found.startswith("/"):
+            found = "/dev/%s" % found
+        if os.path.exists(found):
+            return found
+
+        remapped = self._remap_device(os.path.basename(found))
+        if remapped:
+            LOG.debug("Remapped device name %s => %s", found, remapped)
+            return remapped
+
+        # On t1.micro, ephemeral0 will appear in block-device-mapping from
         # metadata, but it will not exist on disk (and never will)
-        # at this pint, we've verified that the path did not exist
+        # at this point, we've verified that the path did not exist
         # in the special case of 'ephemeral0' return None to avoid bogus
         # fstab entry (LP: #744019)
         if name == "ephemeral0":
@@ -198,7 +230,11 @@ class DataSourceEc2(DataSource.DataSource):
         return ofound
 
     def is_vpc(self):
-        # per comment in LP: #615545
+        # See: https://bugs.launchpad.net/ubuntu/+source/cloud-init/+bug/615545
+        # Detect whether the machine was launched in a VPC.
+        # Per the bug above, when in a VPC the meta-data
+        # does not have public-ipv4 and public-hostname
+        # listed as a possibility.
         ph = "public-hostname"
         p4 = "public-ipv4"
         if ((ph not in self.metadata or self.metadata[ph] == "") and
@@ -207,11 +243,12 @@ class DataSourceEc2(DataSource.DataSource):
         return False
 
 
+# Used to match classes to dependencies
 datasources = [
-  (DataSourceEc2, (DataSource.DEP_FILESYSTEM, DataSource.DEP_NETWORK)),
+  (DataSourceEc2, (sources.DEP_FILESYSTEM, sources.DEP_NETWORK)),
 ]
 
 
-# return a list of data sources that match this set of dependencies
+# Return a list of data sources that match this set of dependencies
 def get_datasource_list(depends):
-    return(DataSource.list_from_depends(depends, datasources))
+    return sources.list_from_depends(depends, datasources)

From acc6265a2560979750925cb7c3ca1b351468fba2 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 18:01:03 -0700
Subject: [PATCH 109/434] Complete initial cleanup for refactoring/rework.

Some of the cleanups were the following

1. Using standard (logged) utility functions for sub process work, writing, reading files, and other file system/operating system options
2. Having distributions implement their own subclasses to handle system specifics (if applicable)
3. Having a cloud wrapper that provides just the functionality we want to expose (cloud.py)
4. Using a path class instead of globals for all cloud init paths (it is configured via config)
5. Removal of as much shared global state as possible (there should be none, minus a set of constants)
6. Other various cleanups that remove transforms/handlers/modules from reading/writing/chmoding their own files.
 a. They should be using util functions to take advantage of the logging that is now enabled in those util functions (very useful for debugging)
7. Urls being read and checked from a single module that serves this and only this purpose (+1 for code organization)
8. Updates to log whenever a transform decides not to run
9. Ensure that whenever an exception is thrown (and possibly captured) the util.logexc function is called
 a. For debugging and tracing, it is important not to just drop them on the floor.
10. Code shuffling into utils.py where it makes sense (and where it could serve a benefit for other code now or in the future)
---
 cloudinit/sources/DataSourceMAAS.py           | 226 +++++------------
 cloudinit/sources/DataSourceNoCloud.py        | 143 ++++++-----
 cloudinit/sources/DataSourceOVF.py            | 227 +++++++-----------
 cloudinit/sources/__init__.py                 |  12 +-
 cloudinit/transforms/__init__.py              | 190 +--------------
 cloudinit/transforms/cc_apt_pipelining.py     |   9 +-
 cloudinit/transforms/cc_apt_update_upgrade.py | 116 ++++-----
 cloudinit/transforms/cc_bootcmd.py            |  48 ++--
 cloudinit/transforms/cc_byobu.py              |  22 +-
 cloudinit/transforms/cc_ca_certs.py           |  25 +-
 cloudinit/transforms/cc_chef.py               | 101 ++++----
 .../transforms/cc_disable_ec2_metadata.py     |  14 +-
 cloudinit/transforms/cc_final_message.py      |  63 +++--
 cloudinit/transforms/cc_foo.py                |  35 ++-
 cloudinit/transforms/cc_grub_dpkg.py          |  19 +-
 cloudinit/transforms/cc_keys_to_console.py    |  14 +-
 cloudinit/transforms/cc_landscape.py          |  43 +++-
 cloudinit/transforms/cc_locale.py             |  36 +--
 cloudinit/transforms/cc_mcollective.py        |  80 +++---
 cloudinit/transforms/cc_mounts.py             |  84 ++++---
 cloudinit/transforms/cc_phone_home.py         |  53 ++--
 cloudinit/transforms/cc_puppet.py             |  94 ++++----
 cloudinit/transforms/cc_resizefs.py           | 154 +++++++-----
 .../transforms/cc_rightscale_userdata.py      |  66 +++--
 cloudinit/transforms/cc_rsyslog.py            |  52 ++--
 cloudinit/transforms/cc_runcmd.py             |  15 +-
 cloudinit/transforms/cc_salt_minion.py        |  49 ++--
 cloudinit/transforms/cc_scripts_per_boot.py   |  20 +-
 .../transforms/cc_scripts_per_instance.py     |  20 +-
 cloudinit/transforms/cc_scripts_per_once.py   |  20 +-
 cloudinit/transforms/cc_scripts_user.py       |  19 +-
 cloudinit/transforms/cc_set_hostname.py       |  23 +-
 cloudinit/transforms/cc_set_passwords.py      | 108 +++++----
 cloudinit/transforms/cc_ssh.py                |  93 ++++---
 cloudinit/transforms/cc_ssh_import_id.py      |  25 +-
 cloudinit/transforms/cc_timezone.py           |  41 +---
 cloudinit/transforms/cc_update_etc_hosts.py   |  84 ++-----
 cloudinit/transforms/cc_update_hostname.py    |  80 +-----
 38 files changed, 1121 insertions(+), 1402 deletions(-)

diff --git a/cloudinit/sources/DataSourceMAAS.py b/cloudinit/sources/DataSourceMAAS.py
index 61a0038f..27196265 100644
--- a/cloudinit/sources/DataSourceMAAS.py
+++ b/cloudinit/sources/DataSourceMAAS.py
@@ -1,8 +1,10 @@
 # vi: ts=4 expandtab
 #
 #    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -16,22 +18,22 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.DataSource as DataSource
-
-from cloudinit import seeddir as base_seeddir
-from cloudinit import log
-import cloudinit.util as util
+import os
 import errno
 import oauth.oauth as oauth
-import os.path
-import urllib2
 import time
+import urllib2
 
+from cloudinit import log as logging
+from cloudinit import sources
+from cloudinit import url_helper as uhelp
+from cloudinit import util
 
+LOG = logging.getLogger(__name__)
 MD_VERSION = "2012-03-01"
 
 
-class DataSourceMAAS(DataSource.DataSource):
+class DataSourceMAAS(sources.DataSource):
     """
     DataSourceMAAS reads instance information from MAAS.
     Given a config metadata_url, and oauth tokens, it expects to find
@@ -40,61 +42,64 @@ class DataSourceMAAS(DataSource.DataSource):
       user-data
       hostname
     """
-    seeddir = base_seeddir + '/maas'
-    baseurl = None
+    def __init__(self, sys_cfg, distro, paths):
+        sources.DataSource.__init__(self, sys_cfg, distro, paths)
+        self.base_url = None
+        self.seed_dir = os.path.join(paths.seed_dir, 'maas')
 
     def __str__(self):
-        return("DataSourceMAAS[%s]" % self.baseurl)
+        return "%s[%s]" % (util.obj_name(self), self.base_url)
 
     def get_data(self):
         mcfg = self.ds_cfg
 
         try:
-            (userdata, metadata) = read_maas_seed_dir(self.seeddir)
+            (userdata, metadata) = read_maas_seed_dir(self.seed_dir)
             self.userdata_raw = userdata
             self.metadata = metadata
-            self.baseurl = self.seeddir
+            self.base_url = self.seed_dir
             return True
         except MAASSeedDirNone:
             pass
         except MAASSeedDirMalformed as exc:
-            log.warn("%s was malformed: %s\n" % (self.seeddir, exc))
+            LOG.warn("%s was malformed: %s" % (self.seed_dir, exc))
             raise
 
-        try:
-            # if there is no metadata_url, then we're not configured
-            url = mcfg.get('metadata_url', None)
-            if url == None:
-                return False
+        # If there is no metadata_url, then we're not configured
+        url = mcfg.get('metadata_url', None)
+        if not url:
+            return False
 
+        try:
             if not self.wait_for_metadata_service(url):
                 return False
 
-            self.baseurl = url
+            self.base_url = url
 
-            (userdata, metadata) = read_maas_seed_url(self.baseurl,
-                self.md_headers)
+            (userdata, metadata) = read_maas_seed_url(self.base_url,
+                                                      self.md_headers)
             self.userdata_raw = userdata
             self.metadata = metadata
             return True
         except Exception:
-            util.logexc(log)
+            util.logexc(LOG, "Failed fetching metadata from url %s", url)
             return False
 
     def md_headers(self, url):
         mcfg = self.ds_cfg
 
-        # if we are missing token_key, token_secret or consumer_key
+        # If we are missing token_key, token_secret or consumer_key
         # then just do non-authed requests
         for required in ('token_key', 'token_secret', 'consumer_key'):
             if required not in mcfg:
-                return({})
+                return {}
 
         consumer_secret = mcfg.get('consumer_secret', "")
-
-        return(oauth_headers(url=url, consumer_key=mcfg['consumer_key'],
-            token_key=mcfg['token_key'], token_secret=mcfg['token_secret'],
-            consumer_secret=consumer_secret))
+        return oauth_headers(url=url,
+                             consumer_key=mcfg['consumer_key'],
+                             token_key=mcfg['token_key'],
+                             token_secret=mcfg['token_secret'],
+                             consumer_secret=consumer_secret)
 
     def wait_for_metadata_service(self, url):
         mcfg = self.ds_cfg
@@ -103,32 +108,31 @@ class DataSourceMAAS(DataSource.DataSource):
         try:
             max_wait = int(mcfg.get("max_wait", max_wait))
         except Exception:
-            util.logexc(log)
-            log.warn("Failed to get max wait. using %s" % max_wait)
+            util.logexc(LOG, "Failed to get max wait. using %s", max_wait)
 
         if max_wait == 0:
             return False
 
         timeout = 50
         try:
-            timeout = int(mcfg.get("timeout", timeout))
+            if "timeout" in mcfg:
+                timeout = int(mcfg.get("timeout", timeout))
         except Exception:
-            util.logexc(log)
-            log.warn("Failed to get timeout, using %s" % timeout)
+            LOG.warn("Failed to get timeout, using %s" % timeout)
 
         starttime = time.time()
         check_url = "%s/%s/meta-data/instance-id" % (url, MD_VERSION)
         url = util.wait_for_url(urls=[check_url], max_wait=max_wait,
-            timeout=timeout, status_cb=log.warn,
-            headers_cb=self.md_headers)
+                                timeout=timeout, status_cb=LOG.warn,
+                                headers_cb=self.md_headers)
 
         if url:
-            log.debug("Using metadata source: '%s'" % url)
+            LOG.info("Using metadata source: '%s'", url)
         else:
-            log.critical("giving up on md after %i seconds\n" %
-                         int(time.time() - starttime))
+            LOG.critical("Giving up on md from %s after %i seconds",
+                            check_url, int(time.time() - starttime))
 
-        return (bool(url))
+        return bool(url)
 
 
 def read_maas_seed_dir(seed_d):
@@ -139,22 +143,19 @@ def read_maas_seed_dir(seed_d):
       * local-hostname
       * user-data
     """
-    files = ('local-hostname', 'instance-id', 'user-data', 'public-keys')
-    md = {}
-
     if not os.path.isdir(seed_d):
         raise MAASSeedDirNone("%s: not a directory")
 
+    files = ('local-hostname', 'instance-id', 'user-data', 'public-keys')
+    md = {}
     for fname in files:
         try:
-            with open(os.path.join(seed_d, fname)) as fp:
-                md[fname] = fp.read()
-                fp.close()
+            md[fname] = util.load_file(os.path.join(seed_d, fname))
         except IOError as e:
             if e.errno != errno.ENOENT:
                 raise
 
-    return(check_seed_contents(md, seed_d))
+    return check_seed_contents(md, seed_d)
 
 
 def read_maas_seed_url(seed_url, header_cb=None, timeout=None,
@@ -169,29 +170,26 @@ def read_maas_seed_url(seed_url, header_cb=None, timeout=None,
       * <seed_url>/<version>/meta-data/local-hostname
       * <seed_url>/<version>/user-data
     """
-    files = ('meta-data/local-hostname',
-             'meta-data/instance-id',
-             'meta-data/public-keys',
-             'user-data')
-
     base_url = "%s/%s" % (seed_url, version)
+    files = {
+        'local-hostname': "%s/%s" % (base_url, 'meta-data/local-hostname'),
+        'instance-id': "%s/%s" % (base_url, 'meta-data/instance-id'),
+        'public-keys': "%s/%s" % (base_url, 'meta-data/public-keys'),
+        'user-data': "%s/%s" % (base_url, 'user-data'),
+    }
     md = {}
-    for fname in files:
-        url = "%s/%s" % (base_url, fname)
+    for (name, url) in files.items():
         if header_cb:
             headers = header_cb(url)
         else:
             headers = {}
-
         try:
-            req = urllib2.Request(url, data=None, headers=headers)
-            resp = urllib2.urlopen(req, timeout=timeout)
-            md[os.path.basename(fname)] = resp.read()
+            (resp, sc) = uhelp.readurl(url, headers=headers, timeout=timeout)
+            md[name] = resp
         except urllib2.HTTPError as e:
             if e.code != 404:
                 raise
-
-    return(check_seed_contents(md, seed_url))
+    return check_seed_contents(md, seed_url)
 
 
 def check_seed_contents(content, seed):
@@ -201,11 +199,10 @@ def check_seed_contents(content, seed):
        Raise MAASSeedDirMalformed or MAASSeedDirNone
     """
     md_required = ('instance-id', 'local-hostname')
-    found = content.keys()
-
     if len(content) == 0:
         raise MAASSeedDirNone("%s: no data files found" % seed)
 
+    found = content.keys()
     missing = [k for k in md_required if k not in found]
     if len(missing):
         raise MAASSeedDirMalformed("%s: missing files %s" % (seed, missing))
@@ -217,7 +214,7 @@ def check_seed_contents(content, seed):
             continue
         md[key] = val
 
-    return(userdata, md)
+    return (userdata, md)
 
 
 def oauth_headers(url, consumer_key, token_key, token_secret, consumer_secret):
@@ -232,8 +229,8 @@ def oauth_headers(url, consumer_key, token_key, token_secret, consumer_secret):
     }
     req = oauth.OAuthRequest(http_url=url, parameters=params)
     req.sign_request(oauth.OAuthSignatureMethod_PLAINTEXT(),
-        consumer, token)
-    return(req.to_header())
+                     consumer, token)
+    return req.to_header()
 
 
 class MAASSeedDirNone(Exception):
@@ -244,102 +241,11 @@ class MAASSeedDirMalformed(Exception):
     pass
 
 
+# Used to match classes to dependencies
 datasources = [
-  (DataSourceMAAS, (DataSource.DEP_FILESYSTEM, DataSource.DEP_NETWORK)),
+  (DataSourceMAAS, (sources.DEP_FILESYSTEM, sources.DEP_NETWORK)),
 ]
 
-
-# return a list of data sources that match this set of dependencies
+# Return a list of data sources that match this set of dependencies
 def get_datasource_list(depends):
-    return(DataSource.list_from_depends(depends, datasources))
-
-
-if __name__ == "__main__":
-    def main():
-        """
-        Call with single argument of directory or http or https url.
-        If url is given additional arguments are allowed, which will be
-        interpreted as consumer_key, token_key, token_secret, consumer_secret
-        """
-        import argparse
-        import pprint
-
-        parser = argparse.ArgumentParser(description='Interact with MAAS DS')
-        parser.add_argument("--config", metavar="file",
-            help="specify DS config file", default=None)
-        parser.add_argument("--ckey", metavar="key",
-            help="the consumer key to auth with", default=None)
-        parser.add_argument("--tkey", metavar="key",
-            help="the token key to auth with", default=None)
-        parser.add_argument("--csec", metavar="secret",
-            help="the consumer secret (likely '')", default="")
-        parser.add_argument("--tsec", metavar="secret",
-            help="the token secret to auth with", default=None)
-        parser.add_argument("--apiver", metavar="version",
-            help="the apiver to use ("" can be used)", default=MD_VERSION)
-
-        subcmds = parser.add_subparsers(title="subcommands", dest="subcmd")
-        subcmds.add_parser('crawl', help="crawl the datasource")
-        subcmds.add_parser('get', help="do a single GET of provided url")
-        subcmds.add_parser('check-seed', help="read andn verify seed at url")
-
-        parser.add_argument("url", help="the data source to query")
-
-        args = parser.parse_args()
-
-        creds = {'consumer_key': args.ckey, 'token_key': args.tkey,
-            'token_secret': args.tsec, 'consumer_secret': args.csec}
-
-        if args.config:
-            import yaml
-            with open(args.config) as fp:
-                cfg = yaml.load(fp)
-            if 'datasource' in cfg:
-                cfg = cfg['datasource']['MAAS']
-            for key in creds.keys():
-                if key in cfg and creds[key] == None:
-                    creds[key] = cfg[key]
-
-        def geturl(url, headers_cb):
-            req = urllib2.Request(url, data=None, headers=headers_cb(url))
-            return(urllib2.urlopen(req).read())
-
-        def printurl(url, headers_cb):
-            print "== %s ==\n%s\n" % (url, geturl(url, headers_cb))
-
-        def crawl(url, headers_cb=None):
-            if url.endswith("/"):
-                for line in geturl(url, headers_cb).splitlines():
-                    if line.endswith("/"):
-                        crawl("%s%s" % (url, line), headers_cb)
-                    else:
-                        printurl("%s%s" % (url, line), headers_cb)
-            else:
-                printurl(url, headers_cb)
-
-        def my_headers(url):
-            headers = {}
-            if creds.get('consumer_key', None) != None:
-                headers = oauth_headers(url, **creds)
-            return headers
-
-        if args.subcmd == "check-seed":
-            if args.url.startswith("http"):
-                (userdata, metadata) = read_maas_seed_url(args.url,
-                    header_cb=my_headers, version=args.apiver)
-            else:
-                (userdata, metadata) = read_maas_seed_url(args.url)
-            print "=== userdata ==="
-            print userdata
-            print "=== metadata ==="
-            pprint.pprint(metadata)
-
-        elif args.subcmd == "get":
-            printurl(args.url, my_headers)
-
-        elif args.subcmd == "crawl":
-            if not args.url.endswith("/"):
-                args.url = "%s/" % args.url
-            crawl(args.url, my_headers)
-
-    main()
+    return sources.list_from_depends(depends, datasources)
diff --git a/cloudinit/sources/DataSourceNoCloud.py b/cloudinit/sources/DataSourceNoCloud.py
index e8c56b8f..84d0f99d 100644
--- a/cloudinit/sources/DataSourceNoCloud.py
+++ b/cloudinit/sources/DataSourceNoCloud.py
@@ -2,9 +2,11 @@
 #
 #    Copyright (C) 2009-2010 Canonical Ltd.
 #    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Scott Moser <scott.moser@canonical.com>
 #    Author: Juerg Hafliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -18,33 +20,34 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.DataSource as DataSource
-
-from cloudinit import seeddir as base_seeddir
-from cloudinit import log
-import cloudinit.util as util
 import errno
-import subprocess
+import os
+
+from cloudinit import log as logging
+from cloudinit import sources
+from cloudinit import util
+
+LOG = logging.getLogger(__name__)
 
 
-class DataSourceNoCloud(DataSource.DataSource):
-    metadata = None
-    userdata = None
-    userdata_raw = None
-    supported_seed_starts = ("/", "file://")
-    dsmode = "local"
-    seed = None
-    cmdline_id = "ds=nocloud"
-    seeddir = base_seeddir + '/nocloud'
+class DataSourceNoCloud(sources.DataSource):
+    def __init__(self, sys_cfg, distro, paths):
+        sources.DataSource.__init__(self, sys_cfg, distro, paths)
+        self.dsmode = 'local'
+        self.seed = None
+        self.cmdline_id = "ds=nocloud"
+        self.seed_dir = os.path.join(paths.seed_dir, 'nocloud')
+        self.supported_seed_starts = ("/", "file://")
 
     def __str__(self):
-        mstr = "DataSourceNoCloud"
-        mstr = mstr + " [seed=%s]" % self.seed
-        return(mstr)
+        mstr = "%s [seed=%s][dsmode=%s]" % (util.obj_name(self),
+                                            self.seed, self.dsmode)
+        return mstr
 
     def get_data(self):
         defaults = {
-            "instance-id": "nocloud", "dsmode": self.dsmode
+            "instance-id": "nocloud",
+            "dsmode": self.dsmode,
         }
 
         found = []
@@ -52,24 +55,24 @@ class DataSourceNoCloud(DataSource.DataSource):
         ud = ""
 
         try:
-            # parse the kernel command line, getting data passed in
+            # Parse the kernel command line, getting data passed in
             if parse_cmdline_data(self.cmdline_id, md):
                 found.append("cmdline")
         except:
-            util.logexc(log)
+            util.logexc(LOG, "Unable to parse command line data")
             return False
 
-        # check to see if the seeddir has data.
+        # Check to see if the seed dir has data.
         seedret = {}
-        if util.read_optional_seed(seedret, base=self.seeddir + "/"):
+        if util.read_optional_seed(seedret, base=self.seed_dir + "/"):
             md = util.mergedict(md, seedret['meta-data'])
             ud = seedret['user-data']
-            found.append(self.seeddir)
-            log.debug("using seeded cache data in %s" % self.seeddir)
+            found.append(self.seed_dir)
+            LOG.debug("Using seeded cache data from %s", self.seed_dir)
 
-        # if the datasource config had a 'seedfrom' entry, then that takes
+        # If the datasource config had a 'seedfrom' entry, then that takes
         # precedence over a 'seedfrom' that was found in a filesystem
-        # but not over external medi
+        # but not over external media
         if 'seedfrom' in self.ds_cfg and self.ds_cfg['seedfrom']:
             found.append("ds_config")
             md["seedfrom"] = self.ds_cfg['seedfrom']
@@ -83,35 +86,36 @@ class DataSourceNoCloud(DataSource.DataSource):
 
         for dev in devlist:
             try:
-                (newmd, newud) = util.mount_callback_umount(dev,
-                    util.read_seeded)
+                LOG.debug("Attempting to use data from %s", dev)
+
+                (newmd, newud) = util.mount_cb(dev, util.read_seeded)
                 md = util.mergedict(newmd, md)
                 ud = newud
 
-                # for seed from a device, the default mode is 'net'.
+                # For seed from a device, the default mode is 'net'.
                 # that is more likely to be what is desired.
                 # If they want dsmode of local, then they must
                 # specify that.
                 if 'dsmode' not in md:
                     md['dsmode'] = "net"
 
-                log.debug("using data from %s" % dev)
+                LOG.debug("Using data from %s", dev)
                 found.append(dev)
                 break
-            except OSError, e:
+            except OSError as e:
                 if e.errno != errno.ENOENT:
                     raise
-            except util.mountFailedError:
-                log.warn("Failed to mount %s when looking for seed" % dev)
+            except util.MountFailedError:
+                util.logexc(LOG, "Failed to mount %s when looking for seed", dev)
 
-        # there was no indication on kernel cmdline or data
+        # There was no indication on kernel cmdline or data
         # in the seeddir suggesting this handler should be used.
         if len(found) == 0:
             return False
 
         seeded_interfaces = None
 
-        # the special argument "seedfrom" indicates we should
+        # The special argument "seedfrom" indicates we should
         # attempt to seed the userdata / metadata from its value
         # its primarily value is in allowing the user to type less
         # on the command line, ie: ds=nocloud;s=http://bit.ly/abcdefg
@@ -123,57 +127,46 @@ class DataSourceNoCloud(DataSource.DataSource):
                     seedfound = proto
                     break
             if not seedfound:
-                log.debug("seed from %s not supported by %s" %
-                    (seedfrom, self.__class__))
+                LOG.debug("Seed from %s not supported by %s", seedfrom, self)
                 return False
 
             if 'network-interfaces' in md:
                 seeded_interfaces = self.dsmode
 
-            # this could throw errors, but the user told us to do it
+            # This could throw errors, but the user told us to do it
             # so if errors are raised, let them raise
             (md_seed, ud) = util.read_seeded(seedfrom, timeout=None)
-            log.debug("using seeded cache data from %s" % seedfrom)
+            LOG.debug("Using seeded cache data from %s", seedfrom)
 
-            # values in the command line override those from the seed
+            # Values in the command line override those from the seed
             md = util.mergedict(md, md_seed)
             found.append(seedfrom)
 
+        # Now that we have exhausted any other places merge in the defaults
         md = util.mergedict(md, defaults)
 
-        # update the network-interfaces if metadata had 'network-interfaces'
+        # Update the network-interfaces if metadata had 'network-interfaces'
         # entry and this is the local datasource, or 'seedfrom' was used
         # and the source of the seed was self.dsmode
         # ('local' for NoCloud, 'net' for NoCloudNet')
         if ('network-interfaces' in md and
             (self.dsmode in ("local", seeded_interfaces))):
-            log.info("updating network interfaces from nocloud")
-
-            util.write_file("/etc/network/interfaces",
-                md['network-interfaces'])
-            try:
-                (out, err) = util.subp(['ifup', '--all'])
-                if len(out) or len(err):
-                    log.warn("ifup --all had stderr: %s" % err)
-
-            except subprocess.CalledProcessError as exc:
-                log.warn("ifup --all failed: %s" % (exc.output[1]))
-
-        self.seed = ",".join(found)
-        self.metadata = md
-        self.userdata_raw = ud
-
+            LOG.info("Updating network interfaces from %s", self)
+            self.distro.apply_network(md['network-interfaces'])
+
         if md['dsmode'] == self.dsmode:
+            self.seed = ",".join(found)
+            self.metadata = md
+            self.userdata_raw = ud
             return True
 
-        log.debug("%s: not claiming datasource, dsmode=%s" %
-            (self, md['dsmode']))
+        LOG.debug("%s: not claiming datasource, dsmode=%s", self, md['dsmode'])
         return False
 
 
-# returns true or false indicating if cmdline indicated
+# Returns true or false indicating if cmdline indicated
 # that this module should be used
-# example cmdline:
+# Example cmdline:
 #  root=LABEL=uec-rootfs ro ds=nocloud
 def parse_cmdline_data(ds_id, fill, cmdline=None):
     if cmdline is None:
@@ -210,23 +203,25 @@ def parse_cmdline_data(ds_id, fill, cmdline=None):
             k = s2l[k]
         fill[k] = v
 
-    return(True)
+    return True
 
 
 class DataSourceNoCloudNet(DataSourceNoCloud):
-    cmdline_id = "ds=nocloud-net"
-    supported_seed_starts = ("http://", "https://", "ftp://")
-    seeddir = base_seeddir + '/nocloud-net'
-    dsmode = "net"
+    def __init__(self, sys_cfg, distro, paths):
+        DataSourceNoCloud.__init__(self, sys_cfg, distro, paths)
+        self.cmdline_id = "ds=nocloud-net"
+        self.supported_seed_starts = ("http://", "https://", "ftp://")
+        self.seed_dir = os.path.join(paths.seed_dir, 'nocloud-net')
+        self.dsmode = "net"
 
 
-datasources = (
-  (DataSourceNoCloud, (DataSource.DEP_FILESYSTEM, )),
-  (DataSourceNoCloudNet,
-    (DataSource.DEP_FILESYSTEM, DataSource.DEP_NETWORK)),
-)
+# Used to match classes to dependencies
+datasources = [
+  (DataSourceNoCloud, (sources.DEP_FILESYSTEM, )),
+  (DataSourceNoCloudNet, (sources.DEP_FILESYSTEM, sources.DEP_NETWORK)),
+]
 
 
-# return a list of data sources that match this set of dependencies
+# Return a list of data sources that match this set of dependencies
 def get_datasource_list(depends):
-    return(DataSource.list_from_depends(depends, datasources))
+    return sources.list_from_depends(depends, datasources)
diff --git a/cloudinit/sources/DataSourceOVF.py b/cloudinit/sources/DataSourceOVF.py
index a0b1b518..bb0f46c2 100644
--- a/cloudinit/sources/DataSourceOVF.py
+++ b/cloudinit/sources/DataSourceOVF.py
@@ -2,9 +2,11 @@
 #
 #    Copyright (C) 2011 Canonical Ltd.
 #    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Scott Moser <scott.moser@canonical.com>
 #    Author: Juerg Hafliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -18,33 +20,30 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.DataSource as DataSource
-
-from cloudinit import seeddir as base_seeddir
-from cloudinit import log
-import cloudinit.util as util
-import os.path
-import os
 from xml.dom import minidom
 import base64
+import os
 import re
 import tempfile
-import subprocess
+
+from cloudinit import log as logging
+from cloudinit import sources
+from cloudinit import util
+
+LOG = logging.getLogger(__name__)
 
 
-class DataSourceOVF(DataSource.DataSource):
-    seed = None
-    seeddir = base_seeddir + '/ovf'
-    environment = None
-    cfg = {}
-    userdata_raw = None
-    metadata = None
-    supported_seed_starts = ("/", "file://")
+class DataSourceOVF(sources.DataSource):
+    def __init__(self, sys_cfg, distro, paths):
+        sources.DataSource.__init__(self, sys_cfg, distro, paths)
+        self.seed = None
+        self.seed_dir = os.path.join(paths.seed_dir, 'ovf')
+        self.environment = None
+        self.cfg = {}
+        self.supported_seed_starts = ("/", "file://")
 
     def __str__(self):
-        mstr = "DataSourceOVF"
-        mstr = mstr + " [seed=%s]" % self.seed
-        return(mstr)
+        return "%s [seed=%s]" % (util.obj_name(self), self.seed)
 
     def get_data(self):
         found = []
@@ -55,13 +54,12 @@ class DataSourceOVF(DataSource.DataSource):
             "instance-id": "iid-dsovf"
         }
 
-        (seedfile, contents) = get_ovf_env(base_seeddir)
+        (seedfile, contents) = get_ovf_env(self.paths.seed_dir)
         if seedfile:
-            # found a seed dir
-            seed = "%s/%s" % (base_seeddir, seedfile)
+            # Found a seed dir
+            seed = os.path.join(self.paths.seed_dir, seedfile)
             (md, ud, cfg) = read_ovf_environment(contents)
             self.environment = contents
-
             found.append(seed)
         else:
             np = {'iso': transport_iso9660,
@@ -71,7 +69,6 @@ class DataSourceOVF(DataSource.DataSource):
                 (contents, _dev, _fname) = transfunc()
                 if contents:
                     break
-
             if contents:
                 (md, ud, cfg) = read_ovf_environment(contents)
                 self.environment = contents
@@ -89,17 +86,19 @@ class DataSourceOVF(DataSource.DataSource):
                     seedfound = proto
                     break
             if not seedfound:
-                log.debug("seed from %s not supported by %s" %
-                    (seedfrom, self.__class__))
+                LOG.debug("Seed from %s not supported by %s",
+                          seedfrom, self)
                 return False
 
             (md_seed, ud) = util.read_seeded(seedfrom, timeout=None)
-            log.debug("using seeded cache data from %s" % seedfrom)
+            LOG.debug("Using seeded cache data from %s", seedfrom)
 
             md = util.mergedict(md, md_seed)
             found.append(seedfrom)
 
+        # Now that we have exhausted any other places merge in the defaults
         md = util.mergedict(md, defaults)
+
         self.seed = ",".join(found)
         self.metadata = md
         self.userdata_raw = ud
@@ -108,31 +107,37 @@ class DataSourceOVF(DataSource.DataSource):
 
     def get_public_ssh_keys(self):
         if not 'public-keys' in self.metadata:
-            return([])
-        return([self.metadata['public-keys'], ])
+            return []
+        pks = self.metadata['public-keys']
+        if isinstance(pks, (list)):
+            return pks
+        else:
+            return [pks]
 
-    # the data sources' config_obj is a cloud-config formated
+    # The data sources' config_obj is a cloud-config formatted
     # object that came to it from ways other than cloud-config
     # because cloud-config content would be handled elsewhere
     def get_config_obj(self):
-        return(self.cfg)
+        return self.cfg
 
 
 class DataSourceOVFNet(DataSourceOVF):
-    seeddir = base_seeddir + '/ovf-net'
-    supported_seed_starts = ("http://", "https://", "ftp://")
+    def __init__(self, sys_cfg, distro, paths):
+        DataSourceOVF.__init__(self, sys_cfg, distro, paths)
+        self.seed_dir = os.path.join(paths.seed_dir, 'ovf-net')
+        self.supported_seed_starts = ("http://", "https://", "ftp://")
 
 
-# this will return a dict with some content
-#  meta-data, user-data
+# This will return a dict with some content
+#  meta-data, user-data, some config
 def read_ovf_environment(contents):
-    props = getProperties(contents)
+    props = get_properties(contents)
     md = {}
     cfg = {}
     ud = ""
-    cfg_props = ['password', ]
+    cfg_props = ['password']
     md_props = ['seedfrom', 'local-hostname', 'public-keys', 'instance-id']
-    for prop, val in props.iteritems():
+    for (prop, val) in props.iteritems():
         if prop == 'hostname':
             prop = "local-hostname"
         if prop in md_props:
@@ -144,23 +149,25 @@ def read_ovf_environment(contents):
                 ud = base64.decodestring(val)
             except:
                 ud = val
-    return(md, ud, cfg)
+    return (md, ud, cfg)
 
 
-# returns tuple of filename (in 'dirname', and the contents of the file)
+# Returns a tuple of the filename (in 'dirname') and the contents of the file
 # on "not found", returns 'None' for filename and False for contents
 def get_ovf_env(dirname):
     env_names = ("ovf-env.xml", "ovf_env.xml", "OVF_ENV.XML", "OVF-ENV.XML")
     for fname in env_names:
-        if os.path.isfile("%s/%s" % (dirname, fname)):
-            fp = open("%s/%s" % (dirname, fname))
-            contents = fp.read()
-            fp.close()
-            return(fname, contents)
-    return(None, False)
+        full_fn = os.path.join(dirname, fname)
+        if os.path.isfile(full_fn):
+            try:
+                contents = util.load_file(full_fn)
+                return (fname, contents)
+            except:
+                util.logexc(LOG, "Failed loading ovf file %s", full_fn)
+    return (None, False)
 
 
-# transport functions take no input and return
+# Transport functions take no input and return
 # a 3 tuple of content, path, filename
 def transport_iso9660(require_iso=True):
 
@@ -173,79 +180,45 @@ def transport_iso9660(require_iso=True):
     devname_regex = os.environ.get(envname, default_regex)
     cdmatch = re.compile(devname_regex)
 
-    # go through mounts to see if it was already mounted
-    fp = open("/proc/mounts")
-    mounts = fp.readlines()
-    fp.close()
-
-    mounted = {}
-    for mpline in mounts:
-        (dev, mp, fstype, _opts, _freq, _passno) = mpline.split()
-        mounted[dev] = (dev, fstype, mp, False)
-        mp = mp.replace("\\040", " ")
+    # Go through mounts to see if it was already mounted
+    mounts = util.mounts()
+    for (dev, info) in mounts.iteritems():
+        fstype = info['fstype']
         if fstype != "iso9660" and require_iso:
             continue
-
         if cdmatch.match(dev[5:]) == None:  # take off '/dev/'
             continue
-
+        mp = info['mountpoint']
         (fname, contents) = get_ovf_env(mp)
         if contents is not False:
-            return(contents, dev, fname)
-
-    tmpd = None
-    dvnull = None
+            return (contents, dev, fname)
 
     devs = os.listdir("/dev/")
     devs.sort()
-
     for dev in devs:
-        fullp = "/dev/%s" % dev
+        fullp = os.path.join("/dev/", dev)
 
-        if fullp in mounted or not cdmatch.match(dev) or os.path.isdir(fullp):
+        if (fullp in mounts or
+            not cdmatch.match(dev) or os.path.isdir(fullp)):
             continue
 
-        fp = None
         try:
-            fp = open(fullp, "rb")
-            fp.read(512)
-            fp.close()
+            # See if we can read anything at all...??
+            with open(fullp, 'rb') as fp:
+                fp.read(512)
         except:
-            if fp:
-                fp.close()
             continue
 
-        if tmpd is None:
-            tmpd = tempfile.mkdtemp()
-        if dvnull is None:
-            try:
-                dvnull = open("/dev/null")
-            except:
-                pass
-
-        cmd = ["mount", "-o", "ro", fullp, tmpd]
-        if require_iso:
-            cmd.extend(('-t', 'iso9660'))
-
-        rc = subprocess.call(cmd, stderr=dvnull, stdout=dvnull, stdin=dvnull)
-        if rc:
+        try:
+            (fname, contents) = util.mount_cb(fullp, get_ovf_env, mtype="iso9660")
+        except util.MountFailedError:
+            util.logexc(LOG, "Failed mounting %s", fullp)
             continue
 
-        (fname, contents) = get_ovf_env(tmpd)
-
-        subprocess.call(["umount", tmpd])
-
         if contents is not False:
-            os.rmdir(tmpd)
-            return(contents, fullp, fname)
+            return (contents, fullp, fname)
 
-    if tmpd:
-        os.rmdir(tmpd)
-
-    if dvnull:
-        dvnull.close()
-
-    return(False, None, None)
+    return (False, None, None)
 
 
 def transport_vmware_guestd():
@@ -259,74 +232,60 @@ def transport_vmware_guestd():
     #     # would need to error check here and see why this failed
     #     # to know if log/error should be raised
     #     return(False, None, None)
-    return(False, None, None)
+    return (False, None, None)
 
 
-def findChild(node, filter_func):
+def find_child(node, filter_func):
     ret = []
     if not node.hasChildNodes():
         return ret
     for child in node.childNodes:
         if filter_func(child):
             ret.append(child)
-    return(ret)
+    return ret
 
 
-def getProperties(environString):
-    dom = minidom.parseString(environString)
+def get_properties(contents):
+
+    dom = minidom.parseString(contents)
     if dom.documentElement.localName != "Environment":
-        raise Exception("No Environment Node")
+        raise XmlError("No Environment Node")
 
     if not dom.documentElement.hasChildNodes():
-        raise Exception("No Child Nodes")
+        raise XmlError("No Child Nodes")
 
     envNsURI = "http://schemas.dmtf.org/ovf/environment/1"
 
     # could also check here that elem.namespaceURI ==
     #   "http://schemas.dmtf.org/ovf/environment/1"
-    propSections = findChild(dom.documentElement,
+    propSections = find_child(dom.documentElement,
         lambda n: n.localName == "PropertySection")
 
     if len(propSections) == 0:
-        raise Exception("No 'PropertySection's")
+        raise XmlError("No 'PropertySection's")
 
     props = {}
-    propElems = findChild(propSections[0], lambda n: n.localName == "Property")
+    propElems = find_child(propSections[0], lambda n: n.localName == "Property")
 
     for elem in propElems:
         key = elem.attributes.getNamedItemNS(envNsURI, "key").value
         val = elem.attributes.getNamedItemNS(envNsURI, "value").value
         props[key] = val
 
-    return(props)
+    return props
 
 
+class XmlError(Exception):
+    pass
+
+
+# Used to match classes to dependencies
 datasources = (
-  (DataSourceOVF, (DataSource.DEP_FILESYSTEM, )),
-  (DataSourceOVFNet,
-    (DataSource.DEP_FILESYSTEM, DataSource.DEP_NETWORK)),
+  (DataSourceOVF, (sources.DEP_FILESYSTEM, )),
+  (DataSourceOVFNet, (sources.DEP_FILESYSTEM, sources.DEP_NETWORK)),
 )
 
 
-# return a list of data sources that match this set of dependencies
+# Return a list of data sources that match this set of dependencies
 def get_datasource_list(depends):
-    return(DataSource.list_from_depends(depends, datasources))
-
-
-if __name__ == "__main__":
-    def main():
-        import sys
-        envStr = open(sys.argv[1]).read()
-        props = getProperties(envStr)
-        import pprint
-        pprint.pprint(props)
-
-        md, ud, cfg = read_ovf_environment(envStr)
-        print "=== md ==="
-        pprint.pprint(md)
-        print "=== ud ==="
-        pprint.pprint(ud)
-        print "=== cfg ==="
-        pprint.pprint(cfg)
-
-    main()
+    return sources.list_from_depends(depends, datasources)
diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index dfd1fff3..08669f5d 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -39,10 +39,6 @@ class DataSourceNotFoundException(Exception):
 
 class DataSource(object):
     def __init__(self, sys_cfg, distro, paths):
-        name = util.obj_name(self)
-        if name.startswith(DS_PREFIX):
-            name = name[DS_PREFIX:]
-        self.cfgname = name
         self.sys_cfg = sys_cfg
         self.distro = distro
         self.paths = paths
@@ -50,8 +46,11 @@ class DataSource(object):
         self.userdata = None
         self.metadata = None
         self.userdata_raw = None
+        name = util.obj_name(self)
+        if name.startswith(DS_PREFIX):
+            name = name[len(DS_PREFIX):]
         self.ds_cfg = util.get_cfg_by_path(self.sys_cfg,
-                        ("datasource", self.cfgname), {})
+                                          ("datasource", name), {})
 
     def get_userdata(self):
         if self.userdata is None:
@@ -112,6 +111,7 @@ class DataSource(object):
 
     def get_instance_id(self):
         if not self.metadata or 'instance-id' not in self.metadata:
+            # Return a placeholder string that is not a real instance id
             return "iid-datasource"
         return str(self.metadata['instance-id'])
 
@@ -166,7 +166,7 @@ def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
             if s.get_data():
                 return (s, ds)
         except Exception as e:
-            LOG.exception("Getting data from %s failed due to %s", ds, e)
+            util.logexc(LOG, "Getting data from %s failed", ds)
 
     msg = "Did not find any data source, searched classes: %s" % (ds_names)
     raise DataSourceNotFoundException(msg)
diff --git a/cloudinit/transforms/__init__.py b/cloudinit/transforms/__init__.py
index 5d70ac43..8275b375 100644
--- a/cloudinit/transforms/__init__.py
+++ b/cloudinit/transforms/__init__.py
@@ -19,183 +19,12 @@
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 #
 
-import os
-import subprocess
-import sys
-import time
-import traceback
-
-import yaml
-
-from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS, PER_ONCE)
+from cloudinit.settings import (PER_INSTANCE, FREQUENCIES)
 
 from cloudinit import log as logging
-from cloudinit import util
 
 LOG = logging.getLogger(__name__)
 
-DEF_HANDLER_VERSION = 1
-DEF_FREQ = PER_INSTANCE
-
-
-# reads a cloudconfig module list, returns
-# a 2 dimensional array suitable to pass to run_cc_modules
-def read_cc_modules(cfg, name):
-    if name not in cfg:
-        return([])
-    module_list = []
-    # create 'module_list', an array of arrays
-    # where array[0] = config
-    #       array[1] = freq
-    #       array[2:] = arguemnts
-    for item in cfg[name]:
-        if isinstance(item, str):
-            module_list.append((item,))
-        elif isinstance(item, list):
-            module_list.append(item)
-        else:
-            raise TypeError("failed to read '%s' item in config")
-    return(module_list)
-
-
-def run_cc_modules(cc, module_list, log):
-    failures = []
-    for cfg_mod in module_list:
-        name = cfg_mod[0]
-        freq = None
-        run_args = []
-        if len(cfg_mod) > 1:
-            freq = cfg_mod[1]
-        if len(cfg_mod) > 2:
-            run_args = cfg_mod[2:]
-
-        try:
-            log.debug("handling %s with freq=%s and args=%s" %
-                (name, freq, run_args))
-            cc.handle(name, run_args, freq=freq)
-        except:
-            log.warn(traceback.format_exc())
-            log.error("config handling of %s, %s, %s failed\n" %
-                (name, freq, run_args))
-            failures.append(name)
-
-    return(failures)
-
-
-# always returns well formated values
-# cfg is expected to have an entry 'output' in it, which is a dictionary
-# that includes entries for 'init', 'config', 'final' or 'all'
-#   init: /var/log/cloud.out
-#   config: [ ">> /var/log/cloud-config.out", /var/log/cloud-config.err ]
-#   final:
-#     output: "| logger -p"
-#     error: "> /dev/null"
-# this returns the specific 'mode' entry, cleanly formatted, with value
-# None if if none is given
-def get_output_cfg(cfg, mode="init"):
-    ret = [None, None]
-    if not 'output' in cfg:
-        return ret
-
-    outcfg = cfg['output']
-    if mode in outcfg:
-        modecfg = outcfg[mode]
-    else:
-        if 'all' not in outcfg:
-            return ret
-        # if there is a 'all' item in the output list
-        # then it applies to all users of this (init, config, final)
-        modecfg = outcfg['all']
-
-    # if value is a string, it specifies stdout and stderr
-    if isinstance(modecfg, str):
-        ret = [modecfg, modecfg]
-
-    # if its a list, then we expect (stdout, stderr)
-    if isinstance(modecfg, list):
-        if len(modecfg) > 0:
-            ret[0] = modecfg[0]
-        if len(modecfg) > 1:
-            ret[1] = modecfg[1]
-
-    # if it is a dictionary, expect 'out' and 'error'
-    # items, which indicate out and error
-    if isinstance(modecfg, dict):
-        if 'output' in modecfg:
-            ret[0] = modecfg['output']
-        if 'error' in modecfg:
-            ret[1] = modecfg['error']
-
-    # if err's entry == "&1", then make it same as stdout
-    # as in shell syntax of "echo foo >/dev/null 2>&1"
-    if ret[1] == "&1":
-        ret[1] = ret[0]
-
-    swlist = [">>", ">", "|"]
-    for i in range(len(ret)):
-        if not ret[i]:
-            continue
-        val = ret[i].lstrip()
-        found = False
-        for s in swlist:
-            if val.startswith(s):
-                val = "%s %s" % (s, val[len(s):].strip())
-                found = True
-                break
-        if not found:
-            # default behavior is append
-            val = "%s %s" % (">>", val.strip())
-        ret[i] = val
-
-    return(ret)
-
-
-# redirect_output(outfmt, errfmt, orig_out, orig_err)
-#  replace orig_out and orig_err with filehandles specified in outfmt or errfmt
-#  fmt can be:
-#   > FILEPATH
-#   >> FILEPATH
-#   | program [ arg1 [ arg2 [ ... ] ] ]
-#
-#   with a '|', arguments are passed to shell, so one level of
-#   shell escape is required.
-def redirect_output(outfmt, errfmt, o_out=sys.stdout, o_err=sys.stderr):
-    if outfmt:
-        (mode, arg) = outfmt.split(" ", 1)
-        if mode == ">" or mode == ">>":
-            owith = "ab"
-            if mode == ">":
-                owith = "wb"
-            new_fp = open(arg, owith)
-        elif mode == "|":
-            proc = subprocess.Popen(arg, shell=True, stdin=subprocess.PIPE)
-            new_fp = proc.stdin
-        else:
-            raise TypeError("invalid type for outfmt: %s" % outfmt)
-
-        if o_out:
-            os.dup2(new_fp.fileno(), o_out.fileno())
-        if errfmt == outfmt:
-            os.dup2(new_fp.fileno(), o_err.fileno())
-            return
-
-    if errfmt:
-        (mode, arg) = errfmt.split(" ", 1)
-        if mode == ">" or mode == ">>":
-            owith = "ab"
-            if mode == ">":
-                owith = "wb"
-            new_fp = open(arg, owith)
-        elif mode == "|":
-            proc = subprocess.Popen(arg, shell=True, stdin=subprocess.PIPE)
-            new_fp = proc.stdin
-        else:
-            raise TypeError("invalid type for outfmt: %s" % outfmt)
-
-        if o_err:
-            os.dup2(new_fp.fileno(), o_err.fileno())
-    return
-
 
 def form_module_name(name):
     canon_name = name.replace("-", "_")
@@ -209,13 +38,18 @@ def form_module_name(name):
     return canon_name
 
 
-def fixup_module(mod):
-    freq = getattr(mod, "frequency", None)
-    if not freq:
-        setattr(mod, 'frequency', PER_INSTANCE)
-    handler = getattr(mod, "handle", None)
-    if not handler:
+def fixup_module(mod, def_freq=PER_INSTANCE):
+    if not hasattr(mod, 'frequency'):
+        setattr(mod, 'frequency', def_freq)
+    else:
+        freq = mod.frequency
+        if freq and freq not in FREQUENCIES:
+            LOG.warn("Module %s has an unknown frequency %s", mod, freq)
+    if not hasattr(mod, 'handle'):
         def empty_handle(_name, _cfg, _cloud, _log, _args):
             pass
         setattr(mod, 'handle', empty_handle)
+    # Used only for warning when possibly running on an unchecked distro...
+    if not hasattr(mod, 'distros'):
+        setattr(mod, 'distros', None)
     return mod
diff --git a/cloudinit/transforms/cc_apt_pipelining.py b/cloudinit/transforms/cc_apt_pipelining.py
index 0286a9ae..69027b0c 100644
--- a/cloudinit/transforms/cc_apt_pipelining.py
+++ b/cloudinit/transforms/cc_apt_pipelining.py
@@ -16,10 +16,13 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-from cloudinit.CloudConfig import per_instance
+from cloudinit import util
+from cloudinit.settings import PER_INSTANCE
+
+frequency = PER_INSTANCE
+
+distros = ['ubuntu', 'debian']
 
-frequency = per_instance
 default_file = "/etc/apt/apt.conf.d/90cloud-init-pipelining"
 
 
diff --git a/cloudinit/transforms/cc_apt_update_upgrade.py b/cloudinit/transforms/cc_apt_update_upgrade.py
index a7049bce..c4a543ed 100644
--- a/cloudinit/transforms/cc_apt_update_upgrade.py
+++ b/cloudinit/transforms/cc_apt_update_upgrade.py
@@ -18,12 +18,13 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-import subprocess
-import traceback
-import os
 import glob
-import cloudinit.CloudConfig as cc
+import os
+
+from cloudinit import templater
+from cloudinit import util
+
+distros = ['ubuntu', 'debian']
 
 
 def handle(_name, cfg, cloud, log, _args):
@@ -34,13 +35,13 @@ def handle(_name, cfg, cloud, log, _args):
 
     mirror = find_apt_mirror(cloud, cfg)
 
-    log.debug("selected mirror at: %s" % mirror)
+    log.debug("Selected mirror at: %s", mirror)
 
-    if not util.get_cfg_option_bool(cfg, \
-        'apt_preserve_sources_list', False):
-        generate_sources_list(release, mirror)
-        old_mir = util.get_cfg_option_str(cfg, 'apt_old_mirror', \
-            "archive.ubuntu.com/ubuntu")
+    if not util.get_cfg_option_bool(cfg,
+                                    'apt_preserve_sources_list', False):
+        generate_sources_list(release, mirror, cloud, log)
+        old_mir = util.get_cfg_option_str(cfg, 'apt_old_mirror',
+                                          "archive.ubuntu.com/ubuntu")
         rename_apt_lists(old_mir, mirror)
 
     # set up proxy
@@ -49,19 +50,18 @@ def handle(_name, cfg, cloud, log, _args):
     if proxy:
         try:
             contents = "Acquire::HTTP::Proxy \"%s\";\n"
-            with open(proxy_filename, "w") as fp:
-                fp.write(contents % proxy)
+            util.write_file(proxy_filename, contents % (proxy))
         except Exception as e:
-            log.warn("Failed to write proxy to %s" % proxy_filename)
+            util.logexc(log, "Failed to write proxy to %s", proxy_filename)
     elif os.path.isfile(proxy_filename):
-        os.unlink(proxy_filename)
+        util.del_file(proxy_filename)
 
     # process 'apt_sources'
     if 'apt_sources' in cfg:
         errors = add_sources(cfg['apt_sources'],
                              {'MIRROR': mirror, 'RELEASE': release})
         for e in errors:
-            log.warn("Source Error: %s\n" % ':'.join(e))
+            log.warn("Source Error: %s", ':'.join(e))
 
     dconf_sel = util.get_cfg_option_str(cfg, 'debconf_selections', False)
     if dconf_sel:
@@ -69,41 +69,35 @@ def handle(_name, cfg, cloud, log, _args):
         try:
             util.subp(('debconf-set-selections', '-'), dconf_sel)
         except:
-            log.error("Failed to run debconf-set-selections")
-            log.debug(traceback.format_exc())
+            util.logexc(log, "Failed to run debconf-set-selections")
 
     pkglist = util.get_cfg_option_list_or_str(cfg, 'packages', [])
 
     errors = []
     if update or len(pkglist) or upgrade:
         try:
-            cc.update_package_sources()
-        except subprocess.CalledProcessError as e:
-            log.warn("apt-get update failed")
-            log.debug(traceback.format_exc())
+            cloud.distro.update_package_sources()
+        except Exception as e:
+            util.logexc(log, "Package update failed")
             errors.append(e)
 
     if upgrade:
         try:
-            cc.apt_get("upgrade")
-        except subprocess.CalledProcessError as e:
-            log.warn("apt upgrade failed")
-            log.debug(traceback.format_exc())
+            cloud.distro.package_command("upgrade")
+        except Exception as e:
+            util.logexc(log, "Package upgrade failed")
             errors.append(e)
 
     if len(pkglist):
         try:
-            cc.install_packages(pkglist)
-        except subprocess.CalledProcessError as e:
-            log.warn("Failed to install packages: %s " % pkglist)
-            log.debug(traceback.format_exc())
+            cloud.distro.install_packages(pkglist)
+        except Exception as e:
+            util.logexc(log, "Failed to install packages: %s ", pkglist)
             errors.append(e)
 
     if len(errors):
         raise errors[0]
 
-    return(True)
-
 
 def mirror2lists_fileprefix(mirror):
     string = mirror
@@ -120,37 +114,40 @@ def mirror2lists_fileprefix(mirror):
 def rename_apt_lists(omirror, new_mirror, lists_d="/var/lib/apt/lists"):
     oprefix = "%s/%s" % (lists_d, mirror2lists_fileprefix(omirror))
     nprefix = "%s/%s" % (lists_d, mirror2lists_fileprefix(new_mirror))
-    if(oprefix == nprefix):
+    if oprefix == nprefix:
         return
     olen = len(oprefix)
     for filename in glob.glob("%s_*" % oprefix):
-        os.rename(filename, "%s%s" % (nprefix, filename[olen:]))
+        util.rename(filename, "%s%s" % (nprefix, filename[olen:]))
 
 
 def get_release():
-    stdout, _stderr = subprocess.Popen(['lsb_release', '-cs'],
-                                       stdout=subprocess.PIPE).communicate()
-    return(str(stdout).strip())
+    (stdout, _stderr) = util.subp(['lsb_release', '-cs'])
+    return stdout.strip()
 
 
-def generate_sources_list(codename, mirror):
-    util.render_to_file('sources.list', '/etc/apt/sources.list', \
-        {'mirror': mirror, 'codename': codename})
+def generate_sources_list(codename, mirror, cloud, log):
+    template_fn = cloud.get_template_filename('sources.list')
+    if template_fn:
+        params = {'mirror': mirror, 'codename': codename}
+        templater.render_to_file(template_fn, '/etc/apt/sources.list', params)
+    else:
+        log.warn("No template found, not rendering /etc/apt/sources.list")
 
 
-def add_sources(srclist, searchList=None):
+def add_sources(srclist, template_params=None):
     """
     add entries in /etc/apt/sources.list.d for each abbreviated
     sources.list entry in 'srclist'.  When rendering template, also
     include the values in dictionary searchList
     """
-    if searchList is None:
-        searchList = {}
-    elst = []
+    if template_params is None:
+        template_params = {}
 
+    errorlist = []
     for ent in srclist:
         if 'source' not in ent:
-            elst.append(["", "missing source"])
+            errorlist.append(["", "missing source"])
             continue
 
         source = ent['source']
@@ -158,17 +155,17 @@ def add_sources(srclist, searchList=None):
             try:
                 util.subp(["add-apt-repository", source])
             except:
-                elst.append([source, "add-apt-repository failed"])
+                errorlist.append([source, "add-apt-repository failed"])
             continue
 
-        source = util.render_string(source, searchList)
+        source = templater.render_string(source, template_params)
 
         if 'filename' not in ent:
             ent['filename'] = 'cloud_config_sources.list'
 
         if not ent['filename'].startswith("/"):
-            ent['filename'] = "%s/%s" % \
-                ("/etc/apt/sources.list.d/", ent['filename'])
+            ent['filename'] = os.path.join("/etc/apt/sources.list.d/",
+                                           ent['filename'])
 
         if ('keyid' in ent and 'key' not in ent):
             ks = "keyserver.ubuntu.com"
@@ -177,32 +174,26 @@ def add_sources(srclist, searchList=None):
             try:
                 ent['key'] = util.getkeybyid(ent['keyid'], ks)
             except:
-                elst.append([source, "failed to get key from %s" % ks])
+                errorlist.append([source, "failed to get key from %s" % ks])
                 continue
 
         if 'key' in ent:
             try:
                 util.subp(('apt-key', 'add', '-'), ent['key'])
             except:
-                elst.append([source, "failed add key"])
+                errorlist.append([source, "failed add key"])
 
         try:
             util.write_file(ent['filename'], source + "\n", omode="ab")
         except:
-            elst.append([source, "failed write to file %s" % ent['filename']])
+            errorlist.append([source, "failed write to file %s" % ent['filename']])
 
-    return(elst)
+    return errorlist
 
 
 def find_apt_mirror(cloud, cfg):
     """ find an apt_mirror given the cloud and cfg provided """
 
-    # TODO: distro and defaults should be configurable
-    distro = "ubuntu"
-    defaults = {
-        'ubuntu': "http://archive.ubuntu.com/ubuntu",
-        'debian': "http://archive.debian.org/debian",
-    }
     mirror = None
 
     cfg_mirror = cfg.get("apt_mirror", None)
@@ -211,14 +202,13 @@ def find_apt_mirror(cloud, cfg):
     elif "apt_mirror_search" in cfg:
         mirror = util.search_for_mirror(cfg['apt_mirror_search'])
     else:
-        if cloud:
-            mirror = cloud.get_mirror()
+        mirror = cloud.get_local_mirror()
 
         mydom = ""
 
         doms = []
 
-        if not mirror and cloud:
+        if not mirror:
             # if we have a fqdn, then search its domain portion first
             (_hostname, fqdn) = util.get_hostname_fqdn(cfg, cloud)
             mydom = ".".join(fqdn.split(".")[1:])
@@ -236,6 +226,6 @@ def find_apt_mirror(cloud, cfg):
             mirror = util.search_for_mirror(mirror_list)
 
     if not mirror:
-        mirror = defaults[distro]
+        mirror = cloud.distro.get_package_mirror()
 
     return mirror
diff --git a/cloudinit/transforms/cc_bootcmd.py b/cloudinit/transforms/cc_bootcmd.py
index f584da02..a2efad32 100644
--- a/cloudinit/transforms/cc_bootcmd.py
+++ b/cloudinit/transforms/cc_bootcmd.py
@@ -17,32 +17,36 @@
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-import cloudinit.util as util
-import subprocess
-import tempfile
+
 import os
-from cloudinit.CloudConfig import per_always
-frequency = per_always
+import tempfile
+
+from cloudinit import util
+from cloudinit.settings import PER_ALWAYS
+
+frequency = PER_ALWAYS
 
 
-def handle(_name, cfg, cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
+
     if "bootcmd" not in cfg:
+        log.debug("Skipping module named %s, no 'bootcmd' key in configuration", name)
         return
 
-    try:
-        content = util.shellify(cfg["bootcmd"])
-        tmpf = tempfile.TemporaryFile()
-        tmpf.write(content)
-        tmpf.seek(0)
-    except:
-        log.warn("failed to shellify bootcmd")
-        raise
+    with tempfile.NamedTemporaryFile(suffix=".sh") as tmpf:
+        try:
+            content = util.shellify(cfg["bootcmd"])
+            tmpf.write(content)
+            tmpf.flush()
+        except:
+            log.warn("Failed to shellify bootcmd")
+            raise
 
-    try:
-        env = os.environ.copy()
-        env['INSTANCE_ID'] = cloud.get_instance_id()
-        subprocess.check_call(['/bin/sh'], env=env, stdin=tmpf)
-        tmpf.close()
-    except:
-        log.warn("failed to run commands from bootcmd")
-        raise
+        try:
+            env = os.environ.copy()
+            env['INSTANCE_ID'] = cloud.get_instance_id()
+            cmd = ['/bin/sh', tmpf.name]
+            util.subp(cmd, env=env, capture=False)
+        except:
+            log.warn("Failed to run commands from bootcmd")
+            raise
diff --git a/cloudinit/transforms/cc_byobu.py b/cloudinit/transforms/cc_byobu.py
index e821b261..38586174 100644
--- a/cloudinit/transforms/cc_byobu.py
+++ b/cloudinit/transforms/cc_byobu.py
@@ -18,18 +18,19 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-import subprocess
-import traceback
+from cloudinit import util
+
+distros = ['ubuntu', 'debian']
 
 
-def handle(_name, cfg, _cloud, log, args):
+def handle(name, cfg, _cloud, log, args):
     if len(args) != 0:
         value = args[0]
     else:
         value = util.get_cfg_option_str(cfg, "byobu_by_default", "")
 
     if not value:
+        log.debug("Skipping module named %s, no 'byobu' values found", name)
         return
 
     if value == "user" or value == "system":
@@ -38,7 +39,7 @@ def handle(_name, cfg, _cloud, log, args):
     valid = ("enable-user", "enable-system", "enable",
              "disable-user", "disable-system", "disable")
     if not value in valid:
-        log.warn("Unknown value %s for byobu_by_default" % value)
+        log.warn("Unknown value %s for byobu_by_default", value)
 
     mod_user = value.endswith("-user")
     mod_sys = value.endswith("-system")
@@ -65,13 +66,6 @@ def handle(_name, cfg, _cloud, log, args):
 
     cmd = ["/bin/sh", "-c", "%s %s %s" % ("X=0;", shcmd, "exit $X")]
 
-    log.debug("setting byobu to %s" % value)
+    log.debug("Setting byobu to %s", value)
 
-    try:
-        subprocess.check_call(cmd)
-    except subprocess.CalledProcessError as e:
-        log.debug(traceback.format_exc(e))
-        raise Exception("Cmd returned %s: %s" % (e.returncode, cmd))
-    except OSError as e:
-        log.debug(traceback.format_exc(e))
-        raise Exception("Cmd failed to execute: %s" % (cmd))
+    util.subp(cmd)
diff --git a/cloudinit/transforms/cc_ca_certs.py b/cloudinit/transforms/cc_ca_certs.py
index 3af6238a..8ca9a200 100644
--- a/cloudinit/transforms/cc_ca_certs.py
+++ b/cloudinit/transforms/cc_ca_certs.py
@@ -13,10 +13,10 @@
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
 import os
-from subprocess import check_call
-from cloudinit.util import (write_file, get_cfg_option_list_or_str,
-                            delete_dir_contents, subp)
+
+from cloudinit import util
 
 CA_CERT_PATH = "/usr/share/ca-certificates/"
 CA_CERT_FILENAME = "cloud-init-ca-certs.crt"
@@ -28,7 +28,7 @@ def update_ca_certs():
     """
     Updates the CA certificate cache on the current machine.
     """
-    check_call(["update-ca-certificates"])
+    util.subp(["update-ca-certificates"])
 
 
 def add_ca_certs(certs):
@@ -41,9 +41,9 @@ def add_ca_certs(certs):
     if certs:
         cert_file_contents = "\n".join(certs)
         cert_file_fullpath = os.path.join(CA_CERT_PATH, CA_CERT_FILENAME)
-        write_file(cert_file_fullpath, cert_file_contents, mode=0644)
+        util.write_file(cert_file_fullpath, cert_file_contents, mode=0644)
         # Append cert filename to CA_CERT_CONFIG file.
-        write_file(CA_CERT_CONFIG, "\n%s" % CA_CERT_FILENAME, omode="a")
+        util.write_file(CA_CERT_CONFIG, "\n%s" % CA_CERT_FILENAME, omode="ab")
 
 
 def remove_default_ca_certs():
@@ -51,14 +51,14 @@ def remove_default_ca_certs():
     Removes all default trusted CA certificates from the system. To actually
     apply the change you must also call L{update_ca_certs}.
     """
-    delete_dir_contents(CA_CERT_PATH)
-    delete_dir_contents(CA_CERT_SYSTEM_PATH)
-    write_file(CA_CERT_CONFIG, "", mode=0644)
+    util.delete_dir_contents(CA_CERT_PATH)
+    util.delete_dir_contents(CA_CERT_SYSTEM_PATH)
+    util.write_file(CA_CERT_CONFIG, "", mode=0644)
     debconf_sel = "ca-certificates ca-certificates/trust_new_crts select no"
-    subp(('debconf-set-selections', '-'), debconf_sel)
+    util.subp(('debconf-set-selections', '-'), debconf_sel)
 
 
-def handle(_name, cfg, _cloud, log, _args):
+def handle(name, cfg, _cloud, log, _args):
     """
     Call to handle ca-cert sections in cloud-config file.
 
@@ -70,6 +70,7 @@ def handle(_name, cfg, _cloud, log, _args):
     """
     # If there isn't a ca-certs section in the configuration don't do anything
     if "ca-certs" not in cfg:
+        log.debug("Skipping module named %s, no 'ca-certs' key in configuration", name)
         return
     ca_cert_cfg = cfg['ca-certs']
 
@@ -81,7 +82,7 @@ def handle(_name, cfg, _cloud, log, _args):
 
     # If we are given any new trusted CA certs to add, add them.
     if "trusted" in ca_cert_cfg:
-        trusted_certs = get_cfg_option_list_or_str(ca_cert_cfg, "trusted")
+        trusted_certs = util.get_cfg_option_list_or_str(ca_cert_cfg, "trusted")
         if trusted_certs:
             log.debug("adding %d certificates" % len(trusted_certs))
             add_ca_certs(trusted_certs)
diff --git a/cloudinit/transforms/cc_chef.py b/cloudinit/transforms/cc_chef.py
index 941e04fe..12c2f539 100644
--- a/cloudinit/transforms/cc_chef.py
+++ b/cloudinit/transforms/cc_chef.py
@@ -18,53 +18,59 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import os
-import subprocess
 import json
-import cloudinit.CloudConfig as cc
-import cloudinit.util as util
+import os
+
+from cloudinit import templater
+from cloudinit import util
 
 ruby_version_default = "1.8"
 
 
-def handle(_name, cfg, cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
+
     # If there isn't a chef key in the configuration don't do anything
     if 'chef' not in cfg:
+        log.debug("Skipping module named %s, no 'chef' key in configuration", name)
         return
     chef_cfg = cfg['chef']
 
     # ensure the chef directories we use exist
-    mkdirs(['/etc/chef', '/var/log/chef', '/var/lib/chef',
-            '/var/cache/chef', '/var/backups/chef', '/var/run/chef'])
+    util.ensure_dirs(['/etc/chef', '/var/log/chef', '/var/lib/chef',
+                     '/var/cache/chef', '/var/backups/chef', '/var/run/chef'])
 
     # set the validation key based on the presence of either 'validation_key'
     # or 'validation_cert'. In the case where both exist, 'validation_key'
     # takes precedence
     for key in ('validation_key', 'validation_cert'):
         if key in chef_cfg and chef_cfg[key]:
-            with open('/etc/chef/validation.pem', 'w') as validation_key_fh:
-                validation_key_fh.write(chef_cfg[key])
+            util.write_file('/etc/chef/validation.pem', chef_cfg[key])
             break
 
     # create the chef config from template
-    util.render_to_file('chef_client.rb', '/etc/chef/client.rb',
-        {'server_url': chef_cfg['server_url'],
-         'node_name': util.get_cfg_option_str(chef_cfg, 'node_name',
-                                          cloud.datasource.get_instance_id()),
-         'environment': util.get_cfg_option_str(chef_cfg, 'environment',
-                                                '_default'),
-         'validation_name': chef_cfg['validation_name']})
+    template_fn = cloud.get_template_filename('chef_client.rb')
+    if template_fn:
+        params = {
+            'server_url': chef_cfg['server_url'],
+            'node_name': util.get_cfg_option_str(chef_cfg, 'node_name',
+                                    cloud.datasource.get_instance_id()),
+            'environment': util.get_cfg_option_str(chef_cfg, 'environment',
+                                                   '_default'),
+            'validation_name': chef_cfg['validation_name']
+        }
+        templater.render_to_file(template_fn, '/etc/chef/client.rb', params)
+    else:
+        log.warn("No template found, not rendering to /etc/chef/client.rb")
 
     # set the firstboot json
-    with open('/etc/chef/firstboot.json', 'w') as firstboot_json_fh:
-        initial_json = {}
-        if 'run_list' in chef_cfg:
-            initial_json['run_list'] = chef_cfg['run_list']
-        if 'initial_attributes' in chef_cfg:
-            initial_attributes = chef_cfg['initial_attributes']
-            for k in initial_attributes.keys():
-                initial_json[k] = initial_attributes[k]
-        firstboot_json_fh.write(json.dumps(initial_json))
+    initial_json = {}
+    if 'run_list' in chef_cfg:
+        initial_json['run_list'] = chef_cfg['run_list']
+    if 'initial_attributes' in chef_cfg:
+        initial_attributes = chef_cfg['initial_attributes']
+        for k in initial_attributes.keys():
+            initial_json[k] = initial_attributes[k]
+    util.write_file('/etc/chef/firstboot.json', json.dumps(initial_json))
 
     # If chef is not installed, we install chef based on 'install_type'
     if not os.path.isfile('/usr/bin/chef-client'):
@@ -75,14 +81,15 @@ def handle(_name, cfg, cloud, log, _args):
             chef_version = util.get_cfg_option_str(chef_cfg, 'version', None)
             ruby_version = util.get_cfg_option_str(chef_cfg, 'ruby_version',
                                                    ruby_version_default)
-            install_chef_from_gems(ruby_version, chef_version)
+            install_chef_from_gems(ruby_version, chef_version, cloud.distro)
             # and finally, run chef-client
-            log.debug('running chef-client')
-            subprocess.check_call(['/usr/bin/chef-client', '-d', '-i', '1800',
-                                   '-s', '20'])
-        else:
+            log.debug('Running chef-client')
+            util.subp(['/usr/bin/chef-client', '-d', '-i', '1800', '-s', '20'])
+        elif install_type == 'packages':
             # this will install and run the chef-client from packages
-            cc.install_packages(('chef',))
+            cloud.distro.install_packages(('chef',))
+        else:
+            log.warn("Unknown chef install type %s", install_type)
 
 
 def get_ruby_packages(version):
@@ -90,30 +97,20 @@ def get_ruby_packages(version):
     pkgs = ['ruby%s' % version, 'ruby%s-dev' % version]
     if version == "1.8":
         pkgs.extend(('libopenssl-ruby1.8', 'rubygems1.8'))
-    return(pkgs)
+    return pkgs
 
 
-def install_chef_from_gems(ruby_version, chef_version=None):
-    cc.install_packages(get_ruby_packages(ruby_version))
+def install_chef_from_gems(ruby_version, chef_version, distro):
+    distro.install_packages(get_ruby_packages(ruby_version))
     if not os.path.exists('/usr/bin/gem'):
-        os.symlink('/usr/bin/gem%s' % ruby_version, '/usr/bin/gem')
+        util.sym_link('/usr/bin/gem%s' % ruby_version, '/usr/bin/gem')
     if not os.path.exists('/usr/bin/ruby'):
-        os.symlink('/usr/bin/ruby%s' % ruby_version, '/usr/bin/ruby')
+        util.sym_link('/usr/bin/ruby%s' % ruby_version, '/usr/bin/ruby')
     if chef_version:
-        subprocess.check_call(['/usr/bin/gem', 'install', 'chef',
-                               '-v %s' % chef_version, '--no-ri',
-                               '--no-rdoc', '--bindir', '/usr/bin', '-q'])
+        util.subp(['/usr/bin/gem', 'install', 'chef',
+                  '-v %s' % chef_version, '--no-ri',
+                  '--no-rdoc', '--bindir', '/usr/bin', '-q'])
     else:
-        subprocess.check_call(['/usr/bin/gem', 'install', 'chef',
-                               '--no-ri', '--no-rdoc', '--bindir',
-                               '/usr/bin', '-q'])
-
-
-def ensure_dir(d):
-    if not os.path.exists(d):
-        os.makedirs(d)
-
-
-def mkdirs(dirs):
-    for d in dirs:
-        ensure_dir(d)
+        util.subp(['/usr/bin/gem', 'install', 'chef',
+                  '--no-ri', '--no-rdoc', '--bindir',
+                  '/usr/bin', '-q'])
diff --git a/cloudinit/transforms/cc_disable_ec2_metadata.py b/cloudinit/transforms/cc_disable_ec2_metadata.py
index 6b31ea8e..4d2a7f55 100644
--- a/cloudinit/transforms/cc_disable_ec2_metadata.py
+++ b/cloudinit/transforms/cc_disable_ec2_metadata.py
@@ -17,14 +17,16 @@
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-import cloudinit.util as util
-import subprocess
-from cloudinit.CloudConfig import per_always
 
-frequency = per_always
+from cloudinit import util
+
+from cloudinit.settings import PER_ALWAYS
+
+frequency = PER_ALWAYS
+
+reject_cmd = ['route', 'add', '-host', '169.254.169.254', 'reject']
 
 
 def handle(_name, cfg, _cloud, _log, _args):
     if util.get_cfg_option_bool(cfg, "disable_ec2_metadata", False):
-        fwall = "route add -host 169.254.169.254 reject"
-        subprocess.call(fwall.split(' '))
+        util.subp(reject_cmd)
diff --git a/cloudinit/transforms/cc_final_message.py b/cloudinit/transforms/cc_final_message.py
index abb4ca32..dc4ae34c 100644
--- a/cloudinit/transforms/cc_final_message.py
+++ b/cloudinit/transforms/cc_final_message.py
@@ -18,41 +18,54 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-from cloudinit.CloudConfig import per_always
 import sys
-from cloudinit import util, boot_finished
-import time
 
-frequency = per_always
+from cloudinit import templater
+from cloudinit import util
+from cloudinit import version
 
-final_message = "cloud-init boot finished at $TIMESTAMP. Up $UPTIME seconds"
+from cloudinit.settings import PER_ALWAYS
+
+frequency = PER_ALWAYS
+
+final_message_def = ("Cloud-init v. {{version}} finished at {{timestamp}}."
+                     " Up {{uptime}} seconds.")
 
 
-def handle(_name, cfg, _cloud, log, args):
+def handle(name, cfg, cloud, log, args):
+
+    msg_in = None
     if len(args) != 0:
         msg_in = args[0]
     else:
-        msg_in = util.get_cfg_option_str(cfg, "final_message", final_message)
+        msg_in = util.get_cfg_option_str(cfg, "final_message")
+    
+    if not msg_in:
+        template_fn = cloud.get_template_filename('final_message')
+        if template_fn:
+            msg_in = util.load_file(template_fn)
 
-    try:
-        uptimef = open("/proc/uptime")
-        uptime = uptimef.read().split(" ")[0]
-        uptimef.close()
-    except IOError as e:
-        log.warn("unable to open /proc/uptime\n")
-        uptime = "na"
+    if not msg_in:
+        msg_in = final_message_def
 
+    uptime = util.uptime()
+    ts = util.time_rfc2822()
+    cver = version.version_string()
     try:
-        ts = time.strftime("%a, %d %b %Y %H:%M:%S %z", time.gmtime())
-    except:
-        ts = "na"
-
-    try:
-        subs = {'UPTIME': uptime, 'TIMESTAMP': ts}
-        sys.stdout.write("%s\n" % util.render_string(msg_in, subs))
+        subs = {
+            'uptime': uptime, 
+            'timestamp': ts,
+            'version': cver,
+        }
+        # Use stdout, stderr or the logger??
+        content = templater.render_string(msg_in, subs)
+        sys.stderr.write("%s\n" % (content))
     except Exception as e:
-        log.warn("failed to render string to stdout: %s" % e)
+        util.logexc(log, "Failed to render final message template")
 
-    fp = open(boot_finished, "wb")
-    fp.write(uptime + "\n")
-    fp.close()
+    boot_fin_fn = cloud.paths.boot_finished
+    try:
+        contents = "%s - %s - v. %s\n" % (uptime, ts, cver)
+        util.write_file(boot_fin_fn, contents)
+    except:
+        util.logexc(log, "Failed to write boot finished file %s", boot_fin_fn)
diff --git a/cloudinit/transforms/cc_foo.py b/cloudinit/transforms/cc_foo.py
index 35ec3fa7..8007f981 100644
--- a/cloudinit/transforms/cc_foo.py
+++ b/cloudinit/transforms/cc_foo.py
@@ -18,12 +18,35 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-#import cloudinit
-#import cloudinit.util as util
-from cloudinit.CloudConfig import per_instance
+from cloudinit.settings import PER_INSTANCE
 
-frequency = per_instance
+# Modules are expected to have the following attributes.
+# 1. A required 'handle' method which takes the following params.
+#    a) The name, which will not be this file's name, but instead
+#    the name specified in configuration (which is the name
+#    which will be used to find this module).
+#    b) A configuration object that is the result of the merging
+#    of the cloud config's configuration with legacy configuration
+#    as well as any datasource provided configuration.
+#    c) A cloud object that can be used to access various
+#    datasource and paths for the given distro and data provided
+#    by the various datasource instance types.
+#    d) A logger object that the module can write messages to.
+#    e) An argument list, which may be empty. Typically the arguments
+#    come from module configuration where the module is defined with
+#    extra configuration that is translated from yaml into arguments.
+# 2. An optional 'frequency' that defines how often this module should be run.
+#    Typically one of PER_INSTANCE, PER_ALWAYS, PER_ONCE. If not
+#    provided PER_INSTANCE will be assumed.
+#    See settings.py for these constants.
+# 3. An optional 'distros' array/set/tuple that defines the known distros
+#    this module will work with (if not all of them). This is used to write
+#    a warning out if a module is being run on an untested distribution for
+#    informational purposes. If non existent all distros are assumed and
+#    no warning occurs.
+
+frequency = PER_INSTANCE
 
 
-def handle(_name, _cfg, _cloud, _log, _args):
-    print "hi"
+def handle(name, _cfg, _cloud, _log, _args):
+    print("Hi from %s" % (name))
diff --git a/cloudinit/transforms/cc_grub_dpkg.py b/cloudinit/transforms/cc_grub_dpkg.py
index 9f3a7eaf..c048d5cc 100644
--- a/cloudinit/transforms/cc_grub_dpkg.py
+++ b/cloudinit/transforms/cc_grub_dpkg.py
@@ -18,10 +18,12 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-import traceback
 import os
 
+from cloudinit import util
+
+distros = ['ubuntu', 'debian']
+
 
 def handle(_name, cfg, _cloud, log, _args):
     idevs = None
@@ -52,13 +54,14 @@ def handle(_name, cfg, _cloud, log, _args):
     # now idevs and idevs_empty are set to determined values
     # or, those set by user
 
-    dconf_sel = "grub-pc grub-pc/install_devices string %s\n" % idevs + \
-        "grub-pc grub-pc/install_devices_empty boolean %s\n" % idevs_empty
-    log.debug("setting grub debconf-set-selections with '%s','%s'" %
+    dconf_sel = (("grub-pc grub-pc/install_devices string %s\n"
+                  "grub-pc grub-pc/install_devices_empty boolean %s\n") %
+                 (idevs, idevs_empty))
+
+    log.debug("Setting grub debconf-set-selections with '%s','%s'" %
         (idevs, idevs_empty))
 
     try:
-        util.subp(('debconf-set-selections'), dconf_sel)
+        util.subp(['debconf-set-selections'], dconf_sel)
     except:
-        log.error("Failed to run debconf-set-selections for grub-dpkg")
-        log.debug(traceback.format_exc())
+        util.logexc(log, "Failed to run debconf-set-selections for grub-dpkg")
diff --git a/cloudinit/transforms/cc_keys_to_console.py b/cloudinit/transforms/cc_keys_to_console.py
index 73a477c0..2f2a5297 100644
--- a/cloudinit/transforms/cc_keys_to_console.py
+++ b/cloudinit/transforms/cc_keys_to_console.py
@@ -18,11 +18,10 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-from cloudinit.CloudConfig import per_instance
-import cloudinit.util as util
-import subprocess
+from cloudinit.settings import PER_INSTANCE
+from cloudinit import util
 
-frequency = per_instance
+frequency = PER_INSTANCE
 
 
 def handle(_name, cfg, _cloud, log, _args):
@@ -32,11 +31,10 @@ def handle(_name, cfg, _cloud, log, _args):
     key_blacklist = util.get_cfg_option_list_or_str(cfg,
         "ssh_key_console_blacklist", ["ssh-dss"])
     try:
-        confp = open('/dev/console', "wb")
         cmd.append(','.join(fp_blacklist))
         cmd.append(','.join(key_blacklist))
-        subprocess.call(cmd, stdout=confp)
-        confp.close()
+        (stdout, stderr) = util.subp(cmd)
+        util.write_file('/dev/console', stdout)
     except:
-        log.warn("writing keys to console value")
+        log.warn("Writing keys to console failed!")
         raise
diff --git a/cloudinit/transforms/cc_landscape.py b/cloudinit/transforms/cc_landscape.py
index a4113cbe..48491992 100644
--- a/cloudinit/transforms/cc_landscape.py
+++ b/cloudinit/transforms/cc_landscape.py
@@ -19,14 +19,24 @@
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
 import os
-import os.path
-from cloudinit.CloudConfig import per_instance
-from configobj import ConfigObj
 
-frequency = per_instance
+from StringIO import StringIO
+
+try:
+    from configobj import ConfigObj
+except ImportError:
+    ConfigObj = None
+
+from cloudinit import util
+
+from cloudinit.settings import PER_INSTANCE
+
+frequency = PER_INSTANCE
 
 lsc_client_cfg_file = "/etc/landscape/client.conf"
 
+distros = ['ubuntu']
+
 # defaults taken from stock client.conf in landscape-client 11.07.1.1-0ubuntu2
 lsc_builtincfg = {
   'client': {
@@ -38,36 +48,43 @@ lsc_builtincfg = {
 }
 
 
-def handle(_name, cfg, _cloud, log, _args):
+def handle(name, cfg, _cloud, log, _args):
     """
     Basically turn a top level 'landscape' entry with a 'client' dict
     and render it to ConfigObj format under '[client]' section in
     /etc/landscape/client.conf
     """
+    if not ConfigObj:
+        log.warn("'ConfigObj' support not enabled, running %s disabled", name)
+        return
 
     ls_cloudcfg = cfg.get("landscape", {})
 
     if not isinstance(ls_cloudcfg, dict):
-        raise(Exception("'landscape' existed in config, but not a dict"))
+        raise Exception(("'landscape' key existed in config,"
+                         " but not a dictionary type,"
+                         " is a %s instead") % util.obj_name(ls_cloudcfg))
 
-    merged = mergeTogether([lsc_builtincfg, lsc_client_cfg_file, ls_cloudcfg])
+    merged = merge_together([lsc_builtincfg, lsc_client_cfg_file, ls_cloudcfg])
 
     if not os.path.isdir(os.path.dirname(lsc_client_cfg_file)):
-        os.makedirs(os.path.dirname(lsc_client_cfg_file))
+        util.ensure_dir(os.path.dirname(lsc_client_cfg_file))
 
-    with open(lsc_client_cfg_file, "w") as fp:
-        merged.write(fp)
-
-    log.debug("updated %s" % lsc_client_cfg_file)
+    contents = StringIO()
+    merged.write(contents)
+    util.write_file(lsc_client_cfg_file, contents.getvalue())
+    log.debug("Wrote landscape config file to %s", lsc_client_cfg_file)
 
 
-def mergeTogether(objs):
+def merge_together(objs):
     """
     merge together ConfigObj objects or things that ConfigObj() will take in
     later entries override earlier
     """
     cfg = ConfigObj({})
     for obj in objs:
+        if not obj:
+            continue
         if isinstance(obj, ConfigObj):
             cfg.merge(obj)
         else:
diff --git a/cloudinit/transforms/cc_locale.py b/cloudinit/transforms/cc_locale.py
index 2bb22fdb..3fb4c5d9 100644
--- a/cloudinit/transforms/cc_locale.py
+++ b/cloudinit/transforms/cc_locale.py
@@ -18,22 +18,28 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-import os.path
-import subprocess
-import traceback
+import os
+
+from cloudinit import templater
+from cloudinit import util
 
 
-def apply_locale(locale, cfgfile):
+def apply_locale(locale, cfgfile, cloud, log):
+    # TODO this command might not work on RH...
     if os.path.exists('/usr/sbin/locale-gen'):
-        subprocess.Popen(['locale-gen', locale]).communicate()
+        util.subp(['locale-gen', locale], capture=False)
     if os.path.exists('/usr/sbin/update-locale'):
-        subprocess.Popen(['update-locale', locale]).communicate()
-
-    util.render_to_file('default-locale', cfgfile, {'locale': locale})
+        util.subp(['update-locale', locale], capture=False)
+    if not cfgfile:
+        return
+    template_fn = cloud.get_template_filename('default-locale')
+    if not template_fn:
+        log.warn("No template filename found to write to %s", cfgfile)
+    else:
+        templater.render_to_file(template_fn, cfgfile, {'locale': locale})
 
 
-def handle(_name, cfg, cloud, log, args):
+def handle(name, cfg, cloud, log, args):
     if len(args) != 0:
         locale = args[0]
     else:
@@ -43,12 +49,10 @@ def handle(_name, cfg, cloud, log, args):
                                              "/etc/default/locale")
 
     if not locale:
+        log.debug(("Skipping module named %s, "
+                   "no 'locale' configuration found"), name)
         return
 
-    log.debug("setting locale to %s" % locale)
+    log.debug("Setting locale to %s", locale)
 
-    try:
-        apply_locale(locale, locale_cfgfile)
-    except Exception as e:
-        log.debug(traceback.format_exc(e))
-        raise Exception("failed to apply locale %s" % locale)
+    apply_locale(locale, locale_cfgfile, cloud, log)
diff --git a/cloudinit/transforms/cc_mcollective.py b/cloudinit/transforms/cc_mcollective.py
index a2a6230c..aeeda9d2 100644
--- a/cloudinit/transforms/cc_mcollective.py
+++ b/cloudinit/transforms/cc_mcollective.py
@@ -19,50 +19,53 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+from ConfigParser import ConfigParser
+from StringIO import StringIO
+
 import os
-import subprocess
-import StringIO
-import ConfigParser
-import cloudinit.CloudConfig as cc
-import cloudinit.util as util
+
+from cloudinit import util
+from cloudinit import cfg as config
 
 pubcert_file = "/etc/mcollective/ssl/server-public.pem"
 pricert_file = "/etc/mcollective/ssl/server-private.pem"
 
 
-# Our fake header section
-class FakeSecHead(object):
-    def __init__(self, fp):
-        self.fp = fp
-        self.sechead = '[nullsection]\n'
+def handle(name, cfg, cloud, log, _args):
 
-    def readline(self):
-        if self.sechead:
-            try:
-                return self.sechead
-            finally:
-                self.sechead = None
-        else:
-            return self.fp.readline()
-
-
-def handle(_name, cfg, _cloud, _log, _args):
     # If there isn't a mcollective key in the configuration don't do anything
     if 'mcollective' not in cfg:
+        log.debug(("Skipping module named %s, "
+                   "no 'mcollective' key in configuration"), name)
         return
+
     mcollective_cfg = cfg['mcollective']
+
     # Start by installing the mcollective package ...
-    cc.install_packages(("mcollective",))
+    cloud.distro.install_packages(("mcollective",))
 
     # ... and then update the mcollective configuration
     if 'conf' in mcollective_cfg:
         # Create object for reading server.cfg values
-        mcollective_config = ConfigParser.ConfigParser()
+        mcollective_config = config.DefaultingConfigParser()
         # Read server.cfg values from original file in order to be able to mix
         # the rest up
-        mcollective_config.readfp(FakeSecHead(open('/etc/mcollective/'
-                                                   'server.cfg')))
-        for cfg_name, cfg in mcollective_cfg['conf'].iteritems():
+        old_contents = util.load_file('/etc/mcollective/server.cfg')
+        # It doesn't contain any sections so just add one temporarily
+        # Use a hash id based off the contents,
+        # just incase of conflicts... (try to not have any...)
+        # This is so that an error won't occur when reading (and no 
+        # sections exist in the file)
+        section_tpl = "[nullsection_%s]"
+        attempts = 0
+        section_head = section_tpl % (attempts)
+        while old_contents.find(section_head) != -1:
+            attempts += 1
+            section_head = section_tpl % (attempts)
+        sectioned_contents = "%s\n%s" % (section_head, old_contents)
+        mcollective_config.readfp(StringIO(sectioned_contents),
+                                  filename='/etc/mcollective/server.cfg')
+        for (cfg_name, cfg) in mcollective_cfg['conf'].iteritems():
             if cfg_name == 'public-cert':
                 util.write_file(pubcert_file, cfg, mode=0644)
                 mcollective_config.set(cfg_name,
@@ -76,24 +79,19 @@ def handle(_name, cfg, _cloud, _log, _args):
             else:
                 # Iterate throug the config items, we'll use ConfigParser.set
                 # to overwrite or create new items as needed
-                for o, v in cfg.iteritems():
+                for (o, v) in cfg.iteritems():
                     mcollective_config.set(cfg_name, o, v)
         # We got all our config as wanted we'll rename
         # the previous server.cfg and create our new one
-        os.rename('/etc/mcollective/server.cfg',
-                  '/etc/mcollective/server.cfg.old')
-        outputfile = StringIO.StringIO()
-        mcollective_config.write(outputfile)
-        # Now we got the whole file, write to disk except first line
+        util.rename('/etc/mcollective/server.cfg',
+                    '/etc/mcollective/server.cfg.old')
+        # Now we got the whole file, write to disk except the section 
+        # we added so that config parser won't error out when trying to read.
         # Note below, that we've just used ConfigParser because it generally
-        # works.  Below, we remove the initial 'nullsection' header
-        # and then change 'key = value' to 'key: value'.  The global
-        # search and replace of '=' with ':' could be problematic though.
-        # this most likely needs fixing.
-        util.write_file('/etc/mcollective/server.cfg',
-            outputfile.getvalue().replace('[nullsection]\n', '').replace(' =',
-                                                                         ':'),
-            mode=0644)
+        # works.  Below, we remove the initial 'nullsection' header.
+        contents = mcollective_config.stringify()
+        contents = contents.replace("%s\n" % (section_head), "")
+        util.write_file('/etc/mcollective/server.cfg', contents, mode=0644)
 
     # Start mcollective
-    subprocess.check_call(['service', 'mcollective', 'start'])
+    util.subp(['service', 'mcollective', 'start'], capture=False)
diff --git a/cloudinit/transforms/cc_mounts.py b/cloudinit/transforms/cc_mounts.py
index 6cdd74e8..babcbda1 100644
--- a/cloudinit/transforms/cc_mounts.py
+++ b/cloudinit/transforms/cc_mounts.py
@@ -18,10 +18,17 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
+from string import whitespace  # pylint: disable=W0402
+
 import os
 import re
-from string import whitespace  # pylint: disable=W0402
+
+from cloudinit import util
+
+# shortname matches 'sda', 'sda1', 'xvda', 'hda', 'sdb', xvdb, vda, vdd1
+shortname_filter = r"^[x]{0,1}[shv]d[a-z][0-9]*$"
+shortname = re.compile(shortname_filter)
+ws = re.compile("[%s]+" % whitespace)
 
 
 def is_mdname(name):
@@ -49,38 +56,46 @@ def handle(_name, cfg, cloud, log, _args):
     if "mounts" in cfg:
         cfgmnt = cfg["mounts"]
 
-    # shortname matches 'sda', 'sda1', 'xvda', 'hda', 'sdb', xvdb, vda, vdd1
-    shortname_filter = r"^[x]{0,1}[shv]d[a-z][0-9]*$"
-    shortname = re.compile(shortname_filter)
-
+    
     for i in range(len(cfgmnt)):
         # skip something that wasn't a list
         if not isinstance(cfgmnt[i], list):
+            log.warn("Mount option %s not a list, got a %s instead",
+                     (i + 1), util.obj_name(cfgmnt[i]))
             continue
 
+        startname = str(cfgmnt[i][0])
+        log.debug("Attempting to determine the real name of %s", startname)
+
         # workaround, allow user to specify 'ephemeral'
         # rather than more ec2 correct 'ephemeral0'
-        if cfgmnt[i][0] == "ephemeral":
+        if startname == "ephemeral":
             cfgmnt[i][0] = "ephemeral0"
+            log.debug("Adjusted mount option %s name from ephemeral to ephemeral0", (i + 1))
 
-        if is_mdname(cfgmnt[i][0]):
-            newname = cloud.device_name_to_device(cfgmnt[i][0])
+        if is_mdname(startname):
+            newname = cloud.device_name_to_device(startname)
             if not newname:
-                log.debug("ignoring nonexistant named mount %s" % cfgmnt[i][0])
+                log.debug("Ignoring nonexistant named mount %s", startname)
                 cfgmnt[i][1] = None
             else:
-                if newname.startswith("/"):
-                    cfgmnt[i][0] = newname
-                else:
-                    cfgmnt[i][0] = "/dev/%s" % newname
+                renamed = newname
+                if not newname.startswith("/"):
+                    renamed = "/dev/%s" % newname
+                cfgmnt[i][0] = renamed
+                log.debug("Mapped metadata name %s to %s", startname, renamed)
         else:
-            if shortname.match(cfgmnt[i][0]):
-                cfgmnt[i][0] = "/dev/%s" % cfgmnt[i][0]
+            if shortname.match(startname):
+                renamed = "/dev/%s" % startname
+                log.debug("Mapped shortname name %s to %s", startname, renamed)
+                cfgmnt[i][0] = renamed
 
         # in case the user did not quote a field (likely fs-freq, fs_passno)
         # but do not convert None to 'None' (LP: #898365)
         for j in range(len(cfgmnt[i])):
-            if isinstance(cfgmnt[i][j], int):
+            if cfgmnt[i][j] is None:
+                continue
+            else:
                 cfgmnt[i][j] = str(cfgmnt[i][j])
 
     for i in range(len(cfgmnt)):
@@ -102,14 +117,18 @@ def handle(_name, cfg, cloud, log, _args):
     # for each of the "default" mounts, add them only if no other
     # entry has the same device name
     for defmnt in defmnts:
-        devname = cloud.device_name_to_device(defmnt[0])
+        startname = defmnt[0]
+        devname = cloud.device_name_to_device(startname)
         if devname is None:
+            log.debug("Ignoring nonexistant named default mount %s", startname)
             continue
         if devname.startswith("/"):
             defmnt[0] = devname
         else:
             defmnt[0] = "/dev/%s" % devname
 
+        log.debug("Mapped default device %s to %s", startname, defmnt[0])
+
         cfgmnt_has = False
         for cfgm in cfgmnt:
             if cfgm[0] == defmnt[0]:
@@ -117,14 +136,21 @@ def handle(_name, cfg, cloud, log, _args):
                 break
 
         if cfgmnt_has:
+            log.debug("Not including %s, already previously included", startname)
             continue
         cfgmnt.append(defmnt)
 
     # now, each entry in the cfgmnt list has all fstab values
     # if the second field is None (not the string, the value) we skip it
-    actlist = [x for x in cfgmnt if x[1] is not None]
+    actlist = []
+    for x in cfgmnt:
+        if x[1] is None:
+            log.debug("Skipping non-existent device named %s", x[0])
+        else:
+            actlist.append(x)
 
     if len(actlist) == 0:
+        log.debug("No modifications to fstab needed.")
         return
 
     comment = "comment=cloudconfig"
@@ -141,8 +167,7 @@ def handle(_name, cfg, cloud, log, _args):
         cc_lines.append('\t'.join(line))
 
     fstab_lines = []
-    fstab = open("/etc/fstab", "r+")
-    ws = re.compile("[%s]+" % whitespace)
-    for line in fstab.read().splitlines():
+    fstab = util.load_file("/etc/fstab")
+    for line in fstab.splitlines():
         try:
             toks = ws.split(line)
@@ -153,27 +178,22 @@ def handle(_name, cfg, cloud, log, _args):
         fstab_lines.append(line)
 
     fstab_lines.extend(cc_lines)
-
-    fstab.seek(0)
-    fstab.write("%s\n" % '\n'.join(fstab_lines))
-    fstab.truncate()
-    fstab.close()
+    contents = "%s\n" % ('\n'.join(fstab_lines))
+    util.write_file("/etc/fstab", contents)
 
     if needswap:
         try:
             util.subp(("swapon", "-a"))
         except:
-            log.warn("Failed to enable swap")
+            util.logexc(log, "Activating swap via 'swapon -a' failed")
 
     for d in dirs:
-        if os.path.exists(d):
-            continue
         try:
-            os.makedirs(d)
+            util.ensure_dir(d)
         except:
-            log.warn("Failed to make '%s' config-mount\n", d)
+            util.logexc(log, "Failed to make '%s' config-mount", d)
 
     try:
         util.subp(("mount", "-a"))
     except:
-        log.warn("'mount -a' failed")
+        util.logexc(log, "Activating mounts via 'mount -a' failed")
diff --git a/cloudinit/transforms/cc_phone_home.py b/cloudinit/transforms/cc_phone_home.py
index a7ff74e1..36af6dfa 100644
--- a/cloudinit/transforms/cc_phone_home.py
+++ b/cloudinit/transforms/cc_phone_home.py
@@ -17,13 +17,18 @@
 #
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-from cloudinit.CloudConfig import per_instance
-import cloudinit.util as util
+
+from cloudinit import templater
+from cloudinit import url_helper as uhelp
+from cloudinit import util
+
+from cloudinit.settings import PER_INSTANCE
+
 from time import sleep
 
-frequency = per_instance
-post_list_all = ['pub_key_dsa', 'pub_key_rsa', 'pub_key_ecdsa', 'instance_id',
-                 'hostname']
+frequency = PER_INSTANCE
+post_list_all = ['pub_key_dsa', 'pub_key_rsa', 'pub_key_ecdsa',
+                 'instance_id', 'hostname']
 
 
 # phone_home:
@@ -35,7 +40,7 @@ post_list_all = ['pub_key_dsa', 'pub_key_rsa', 'pub_key_ecdsa', 'instance_id',
 #  url: http://my.foo.bar/$INSTANCE_ID/
 #  post: [ pub_key_dsa, pub_key_rsa, pub_key_ecdsa, instance_id
 #
-def handle(_name, cfg, cloud, log, args):
+def handle(name, cfg, cloud, log, args):
     if len(args) != 0:
         ph_cfg = util.read_conf(args[0])
     else:
@@ -44,7 +49,8 @@ def handle(_name, cfg, cloud, log, args):
         ph_cfg = cfg['phone_home']
 
     if 'url' not in ph_cfg:
-        log.warn("no 'url' token in phone_home")
+        log.warn(("Skipping module named %s, "
+                  "no 'url' found in 'phone_home' configuration"), name)
         return
 
     url = ph_cfg['url']
@@ -53,8 +59,8 @@ def handle(_name, cfg, cloud, log, args):
     try:
         tries = int(tries)
     except:
-        log.warn("tries is not an integer. using 10")
         tries = 10
+        util.logexc(log, "Configuration entry 'tries' is not an integer, using %s", tries)
 
     if post_list == "all":
         post_list = post_list_all
@@ -71,11 +77,9 @@ def handle(_name, cfg, cloud, log, args):
 
     for n, path in pubkeys.iteritems():
         try:
-            fp = open(path, "rb")
-            all_keys[n] = fp.read()
-            fp.close()
+            all_keys[n] = util.load_file(path)
         except:
-            log.warn("%s: failed to open in phone_home" % path)
+            util.logexc(log, "%s: failed to open, can not phone home that data", path)
 
     submit_keys = {}
     for k in post_list:
@@ -83,24 +87,11 @@ def handle(_name, cfg, cloud, log, args):
             submit_keys[k] = all_keys[k]
         else:
             submit_keys[k] = "N/A"
-            log.warn("requested key %s from 'post' list not available")
+            log.warn("Requested key %s from 'post' configuration list not available", k)
 
-    url = util.render_string(url, {'INSTANCE_ID': all_keys['instance_id']})
+    url = templater.render_string(url, {'INSTANCE_ID': all_keys['instance_id']})
 
-    null_exc = object()
-    last_e = null_exc
-    for i in range(0, tries):
-        try:
-            util.readurl(url, submit_keys)
-            log.debug("succeeded submit to %s on try %i" % (url, i + 1))
-            return
-        except Exception as e:
-            log.debug("failed to post to %s on try %i" % (url, i + 1))
-            last_e = e
-        sleep(3)
-
-    log.warn("failed to post to %s in %i tries" % (url, tries))
-    if last_e is not null_exc:
-        raise(last_e)
-
-    return
+    try:
+        uhelp.readurl(url, data=submit_keys, retries=tries, sec_between=3)
+    except:
+        util.logexc(log, "Failed to post phone home data to %s in %s tries", url, tries)
diff --git a/cloudinit/transforms/cc_puppet.py b/cloudinit/transforms/cc_puppet.py
index 6fc475f6..0a21a929 100644
--- a/cloudinit/transforms/cc_puppet.py
+++ b/cloudinit/transforms/cc_puppet.py
@@ -18,91 +18,85 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+from StringIO import StringIO
+
 import os
-import os.path
 import pwd
 import socket
-import subprocess
-import StringIO
-import ConfigParser
-import cloudinit.CloudConfig as cc
-import cloudinit.util as util
+
+from cloudinit import util
+from cloudinit import cfg as config
 
 
-def handle(_name, cfg, cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
     # If there isn't a puppet key in the configuration don't do anything
     if 'puppet' not in cfg:
+        log.debug(("Skipping module named %s,"
+                   " no 'puppet' configuration found"), name)
         return
+
     puppet_cfg = cfg['puppet']
+
     # Start by installing the puppet package ...
-    cc.install_packages(("puppet",))
+    cloud.distro.install_packages(("puppet",))
 
     # ... and then update the puppet configuration
     if 'conf' in puppet_cfg:
         # Add all sections from the conf object to puppet.conf
-        puppet_conf_fh = open('/etc/puppet/puppet.conf', 'r')
+        contents = util.load_file('/etc/puppet/puppet.conf')
         # Create object for reading puppet.conf values
-        puppet_config = ConfigParser.ConfigParser()
+        puppet_config = config.DefaultingConfigParser()
         # Read puppet.conf values from original file in order to be able to
-        # mix the rest up
-        puppet_config.readfp(StringIO.StringIO(''.join(i.lstrip() for i in
-                                               puppet_conf_fh.readlines())))
-        # Close original file, no longer needed
-        puppet_conf_fh.close()
-        for cfg_name, cfg in puppet_cfg['conf'].iteritems():
+        # mix the rest up. First clean them up (TODO is this really needed??)
+        cleaned_contents = '\n'.join([i.lstrip() for i in contents.splitlines()])
+        puppet_config.readfp(StringIO(cleaned_contents),
+                             filename='/etc/puppet/puppet.conf')
+        for (cfg_name, cfg) in puppet_cfg['conf'].iteritems():
             # ca_cert configuration is a special case
             # Dump the puppetmaster ca certificate in the correct place
             if cfg_name == 'ca_cert':
                 # Puppet ssl sub-directory isn't created yet
                 # Create it with the proper permissions and ownership
-                os.makedirs('/var/lib/puppet/ssl')
-                os.chmod('/var/lib/puppet/ssl', 0771)
-                os.chown('/var/lib/puppet/ssl',
-                         pwd.getpwnam('puppet').pw_uid, 0)
-                os.makedirs('/var/lib/puppet/ssl/certs/')
-                os.chown('/var/lib/puppet/ssl/certs/',
-                         pwd.getpwnam('puppet').pw_uid, 0)
-                ca_fh = open('/var/lib/puppet/ssl/certs/ca.pem', 'w')
-                ca_fh.write(cfg)
-                ca_fh.close()
-                os.chown('/var/lib/puppet/ssl/certs/ca.pem',
-                         pwd.getpwnam('puppet').pw_uid, 0)
-                util.restorecon_if_possible('/var/lib/puppet', recursive=True)
+                util.ensure_dir('/var/lib/puppet/ssl', 0771)
+                util.chownbyid('/var/lib/puppet/ssl',
+                               pwd.getpwnam('puppet').pw_uid, 0)
+                util.ensure_dir('/var/lib/puppet/ssl/certs/')
+                util.chownbyid('/var/lib/puppet/ssl/certs/',
+                               pwd.getpwnam('puppet').pw_uid, 0)
+                util.write_file('/var/lib/puppet/ssl/certs/ca.pem', cfg)
+                util.chownbyid('/var/lib/puppet/ssl/certs/ca.pem',
+                               pwd.getpwnam('puppet').pw_uid, 0)
             else:
-                #puppet_conf_fh.write("\n[%s]\n" % (cfg_name))
-                # If puppet.conf already has this section we don't want to
-                # write it again
-                if puppet_config.has_section(cfg_name) == False:
-                    puppet_config.add_section(cfg_name)
                 # Iterate throug the config items, we'll use ConfigParser.set
                 # to overwrite or create new items as needed
-                for o, v in cfg.iteritems():
+                for (o, v) in cfg.iteritems():
                     if o == 'certname':
                         # Expand %f as the fqdn
+                        # TODO should this use the cloud fqdn??
                         v = v.replace("%f", socket.getfqdn())
                         # Expand %i as the instance id
-                        v = v.replace("%i",
-                              cloud.datasource.get_instance_id())
-                        # certname needs to be downcase
+                        v = v.replace("%i", cloud.get_instance_id())
+                        # certname needs to be downcased
                         v = v.lower()
                     puppet_config.set(cfg_name, o, v)
-                    #puppet_conf_fh.write("%s=%s\n" % (o, v))
             # We got all our config as wanted we'll rename
             # the previous puppet.conf and create our new one
-            os.rename('/etc/puppet/puppet.conf', '/etc/puppet/puppet.conf.old')
-            with open('/etc/puppet/puppet.conf', 'wb') as configfile:
-                puppet_config.write(configfile)
-            util.restorecon_if_possible('/etc/puppet/puppet.conf')
+            util.rename('/etc/puppet/puppet.conf', '/etc/puppet/puppet.conf.old')
+            contents = puppet_config.stringify()
+            util.write_file('/etc/puppet/puppet.conf', contents)
+
     # Set puppet to automatically start
     if os.path.exists('/etc/default/puppet'):
-        subprocess.check_call(['sed', '-i',
-                               '-e', 's/^START=.*/START=yes/',
-                               '/etc/default/puppet'])
+        util.subp(['sed', '-i',
+                  '-e', 's/^START=.*/START=yes/',
+                  '/etc/default/puppet'], capture=False)
     elif os.path.exists('/bin/systemctl'):
-        subprocess.check_call(['/bin/systemctl', 'enable', 'puppet.service'])
+        util.subp(['/bin/systemctl', 'enable', 'puppet.service'], capture=False)
     elif os.path.exists('/sbin/chkconfig'):
-        subprocess.check_call(['/sbin/chkconfig', 'puppet', 'on'])
+        util.subp(['/sbin/chkconfig', 'puppet', 'on'], capture=False)
     else:
-        log.warn("Do not know how to enable puppet service on this system")
+        log.warn(("Sorry we do not know how to enable"
+                  " puppet services on this system"))
+
     # Start puppetd
-    subprocess.check_call(['service', 'puppet', 'start'])
+    util.subp(['service', 'puppet', 'start'], capture=False)
diff --git a/cloudinit/transforms/cc_resizefs.py b/cloudinit/transforms/cc_resizefs.py
index 2dc66def..daaf4da9 100644
--- a/cloudinit/transforms/cc_resizefs.py
+++ b/cloudinit/transforms/cc_resizefs.py
@@ -18,91 +18,117 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-import subprocess
+import errno
 import os
 import stat
 import sys
-import time
 import tempfile
-from cloudinit.CloudConfig import per_always
+import time
 
-frequency = per_always
+from cloudinit import util
+from cloudinit.settings import PER_ALWAYS
+
+frequency = PER_ALWAYS
+
+resize_fs_prefixes_cmds = [
+    ('ext', 'resize2fs'),
+    ('xfs', 'xfs_growfs'),
+]
 
 
-def handle(_name, cfg, _cloud, log, args):
+def nodeify_path(devpth, where, log):
+    try:
+        st_dev = os.stat(where).st_dev
+        dev = os.makedev(os.major(st_dev), os.minor(st_dev))
+        os.mknod(devpth, 0400 | stat.S_IFBLK, dev)
+        return st_dev
+    except:
+        if util.is_container():
+            log.debug("Inside container, ignoring mknod failure in resizefs")
+            return
+        log.warn("Failed to make device node to resize %s at %s", where, devpth)
+        raise
+
+
+def get_fs_type(st_dev, path, log):
+    try:
+        fs_type = util.find_devs_with(tag='TYPE', oformat='value',
+                                         no_cache=True, path=path)
+        return fs_type
+    except util.ProcessExecutionError:
+        util.logexc(log, ("Failed to get filesystem type"
+                          " of maj=%s, min=%s for path %s"),
+                    os.major(st_dev), os.minor(st_dev), path)
+        raise
+
+
+def handle(name, cfg, _cloud, log, args):
     if len(args) != 0:
-        resize_root = False
-        if str(args[0]).lower() in ['true', '1', 'on', 'yes']:
-            resize_root = True
+        resize_root = args[0]
     else:
         resize_root = util.get_cfg_option_str(cfg, "resize_rootfs", True)
 
-    if str(resize_root).lower() in ['false', '0']:
+    if not util.translate_bool(resize_root):
+        log.debug("Skipping module named %s,  resizing disabled", name)
         return
 
-    # we use mktemp rather than mkstemp because early in boot nothing
-    # else should be able to race us for this, and we need to mknod.
-    devpth = tempfile.mktemp(prefix="cloudinit.resizefs.", dir="/run")
+    # TODO is the directory ok to be used??
+    resize_root_d = util.get_cfg_option_str(cfg, "resize_rootfs_tmp", "/run")
+    util.ensure_dir(resize_root_d)
+    with util.SilentTemporaryFile(prefix="cloudinit.resizefs.",
+                                  dir=resize_root_d, delete=True) as tfh:
+        devpth = tfh.name
 
-    try:
-        st_dev = os.stat("/").st_dev
-        dev = os.makedev(os.major(st_dev), os.minor(st_dev))
-        os.mknod(devpth, 0400 | stat.S_IFBLK, dev)
-    except:
-        if util.is_container():
-            log.debug("inside container, ignoring mknod failure in resizefs")
+        # Delete the file so that mknod will work
+        # but don't change the file handle to know that its
+        # removed so that when a later call that recreates
+        # occurs this temporary file will still benefit from
+        # auto deletion
+        tfh.unlink_now()
+    
+        # TODO: allow what is to be resized to
+        # be configurable??
+        st_dev = nodeify_path(devpth, "/", log)
+        fs_type = get_fs_type(st_dev, devpth, log)
+
+        resizer = None
+        fstype_lc = fs_type.lower()
+        for (pfix, root_cmd) in resize_fs_prefixes_cmds:
+            if fstype_lc.startswith(pfix):
+                resizer = root_cmd
+                break
+
+        if not resizer:
+            log.warn("Not resizing unknown filesystem type %s", fs_type)
             return
-        log.warn("Failed to make device node to resize /")
-        raise
 
-    cmd = ['blkid', '-c', '/dev/null', '-sTYPE', '-ovalue', devpth]
-    try:
-        (fstype, _err) = util.subp(cmd)
-    except subprocess.CalledProcessError as e:
-        log.warn("Failed to get filesystem type of maj=%s, min=%s via: %s" %
-            (os.major(st_dev), os.minor(st_dev), cmd))
-        log.warn("output=%s\nerror=%s\n", e.output[0], e.output[1])
-        os.unlink(devpth)
-        raise
+        log.debug("Resizing using %s", resizer)
+        resize_cmd = [resizer, devpth]
 
-    if str(fstype).startswith("ext"):
-        resize_cmd = ['resize2fs', devpth]
-    elif fstype == "xfs":
-        resize_cmd = ['xfs_growfs', devpth]
-    else:
-        os.unlink(devpth)
-        log.debug("not resizing unknown filesystem %s" % fstype)
-        return
+        if resize_root == "noblock":
+            # Fork to a child that will run 
+            # the resize command
+            util.fork_cb(do_resize, resize_cmd, log)
+            # Don't delete the file now in the parent
+            tfh.delete = False
+        else:
+            do_resize(resize_cmd, log)
 
+    action = 'Resized'
     if resize_root == "noblock":
-        fid = os.fork()
-        if fid == 0:
-            try:
-                do_resize(resize_cmd, devpth, log)
-                os._exit(0)  # pylint: disable=W0212
-            except Exception as exc:
-                sys.stderr.write("Failed: %s" % exc)
-                os._exit(1)  # pylint: disable=W0212
-    else:
-        do_resize(resize_cmd, devpth, log)
-
-    log.debug("resizing root filesystem (type=%s, maj=%i, min=%i, val=%s)" %
-        (str(fstype).rstrip("\n"), os.major(st_dev), os.minor(st_dev),
-         resize_root))
-
-    return
+        action = 'Resizing (via forking)'
+    log.debug("%s root filesystem (type=%s, maj=%i, min=%i, val=%s)",
+              action, fs_type, os.major(st_dev), os.minor(st_dev), resize_root)
 
 
-def do_resize(resize_cmd, devpth, log):
+def do_resize(resize_cmd, log):
+    start = time.time()
     try:
-        start = time.time()
         util.subp(resize_cmd)
-    except subprocess.CalledProcessError as e:
-        log.warn("Failed to resize filesystem (%s)" % resize_cmd)
-        log.warn("output=%s\nerror=%s\n", e.output[0], e.output[1])
-        os.unlink(devpth)
+    except util.ProcessExecutionError as e:
+        util.logexc(log, "Failed to resize filesystem (using %s)", resize_cmd)
         raise
-
-    os.unlink(devpth)
-    log.debug("resize took %s seconds" % (time.time() - start))
+    tot_time = int(time.time() - start)
+    log.debug("Resizing took %s seconds", tot_time)
+    # TODO: Should we add a fsck check after this to make
+    # sure we didn't corrupt anything?
diff --git a/cloudinit/transforms/cc_rightscale_userdata.py b/cloudinit/transforms/cc_rightscale_userdata.py
index 5ed0848f..cde11b54 100644
--- a/cloudinit/transforms/cc_rightscale_userdata.py
+++ b/cloudinit/transforms/cc_rightscale_userdata.py
@@ -35,44 +35,64 @@
 ##
 ##
 
-import cloudinit.util as util
-from cloudinit.CloudConfig import per_instance
-from cloudinit import get_ipath_cur
+import os
+
+from cloudinit import url_helper as uhelp
+from cloudinit import util
+from cloudinit.settings import PER_INSTANCE
+
 from urlparse import parse_qs
 
-frequency = per_instance
+frequency = PER_INSTANCE
+
 my_name = "cc_rightscale_userdata"
 my_hookname = 'CLOUD_INIT_REMOTE_HOOK'
 
 
-def handle(_name, _cfg, cloud, log, _args):
+def handle(name, _cfg, cloud, log, _args):
     try:
         ud = cloud.get_userdata_raw()
     except:
-        log.warn("failed to get raw userdata in %s" % my_name)
+        log.warn("Failed to get raw userdata in module %s", name)
         return
 
     try:
         mdict = parse_qs(ud)
-        if not my_hookname in mdict:
+        if not mdict or not my_hookname in mdict:
+            log.debug("Skipping module %s, did not find %s in parsed raw userdata", name, my_hookname)
             return
     except:
-        log.warn("failed to urlparse.parse_qa(userdata_raw())")
+        log.warn("Failed to parse query string %s into a dictionary", ud)
         raise
 
-    scripts_d = get_ipath_cur('scripts')
-    i = 0
-    first_e = None
-    for url in mdict[my_hookname]:
-        fname = "%s/rightscale-%02i" % (scripts_d, i)
-        i = i + 1
-        try:
-            content = util.readurl(url)
-            util.write_file(fname, content, mode=0700)
-        except Exception as e:
-            if not first_e:
-                first_e = None
-            log.warn("%s failed to read %s: %s" % (my_name, url, e))
+    wrote_fns = []
+    captured_excps = []
+
+    # These will eventually be then ran by the cc_scripts_user
+    # TODO: maybe this should just be a new user data handler??
+    # Instead of a late transform that acts like a user data handler?
+    scripts_d = cloud.get_ipath_cur('scripts')
+    urls = mdict[my_hookname]
+    for (i, url) in enumerate(urls):
+        fname = os.path.join(scripts_d, "rightscale-%02i" % (i))
+        try:
+            (content, st) = uhelp.readurl(url)
+            # Ensure its a valid http response (and something gotten)
+            if uhelp.ok_http_code(st) and content:
+                util.write_file(fname, content, mode=0700)
+                wrote_fns.append(fname)
+        except Exception as e:
+            captured_excps.append(e)
+            util.logexc(log, "%s failed to read %s and write %s", my_name, url, fname)
+
+    if wrote_fns:
+        log.debug("Wrote out rightscale userdata to %s files", len(wrote_fns))
+
+    if len(wrote_fns) != len(urls):
+        skipped = len(urls) - len(wrote_fns)
+        log.debug("%s urls were skipped or failed", skipped)
+
+    if captured_excps:
+        log.warn("%s failed with exceptions, re-raising the last one", len(captured_excps))
+        raise captured_excps[-1]
 
-    if first_e:
-        raise(e)
diff --git a/cloudinit/transforms/cc_rsyslog.py b/cloudinit/transforms/cc_rsyslog.py
index ac7f2c74..ccbe68ff 100644
--- a/cloudinit/transforms/cc_rsyslog.py
+++ b/cloudinit/transforms/cc_rsyslog.py
@@ -18,16 +18,15 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit
-import logging
-import cloudinit.util as util
-import traceback
+import os
+
+from cloudinit import util
 
 DEF_FILENAME = "20-cloud-config.conf"
 DEF_DIR = "/etc/rsyslog.d"
 
 
-def handle(_name, cfg, _cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
     # rsyslog:
     #  - "*.* @@192.158.1.1"
     #  - content: "*.*   @@192.0.2.1:10514"
@@ -37,17 +36,17 @@ def handle(_name, cfg, _cloud, log, _args):
 
     # process 'rsyslog'
     if not 'rsyslog' in cfg:
+        log.debug("Skipping module named %s, no 'rsyslog' key in configuration", name)
         return
 
     def_dir = cfg.get('rsyslog_dir', DEF_DIR)
     def_fname = cfg.get('rsyslog_filename', DEF_FILENAME)
 
     files = []
-    elst = []
-    for ent in cfg['rsyslog']:
+    for i, ent in enumerate(cfg['rsyslog']):
         if isinstance(ent, dict):
             if not "content" in ent:
-                elst.append((ent, "no 'content' entry"))
+                log.warn("No 'content' entry in config entry %s", i + 1)
                 continue
             content = ent['content']
             filename = ent.get("filename", def_fname)
@@ -55,8 +54,13 @@ def handle(_name, cfg, _cloud, log, _args):
             content = ent
             filename = def_fname
 
+        filename = filename.strip()
+        if not filename:
+            log.warn("Entry %s has an empty filename", i + 1)
+            continue
+
         if not filename.startswith("/"):
-            filename = "%s/%s" % (def_dir, filename)
+            filename = os.path.join(def_dir, filename)
 
         omode = "ab"
         # truncate filename first time you see it
@@ -67,35 +71,29 @@ def handle(_name, cfg, _cloud, log, _args):
         try:
             util.write_file(filename, content + "\n", omode=omode)
         except Exception as e:
-            log.debug(traceback.format_exc(e))
-            elst.append((content, "failed to write to %s" % filename))
+            util.logexc(log, "Failed to write to %s", filename)
 
-    # need to restart syslogd
+    # Attempt to restart syslogd
     restarted = False
     try:
-        # if this config module is running at cloud-init time
+        # If this config module is running at cloud-init time
         # (before rsyslog is running) we don't actually have to
         # restart syslog.
         #
-        # upstart actually does what we want here, in that it doesn't
+        # Upstart actually does what we want here, in that it doesn't
         # start a service that wasn't running already on 'restart'
         # it will also return failure on the attempt, so 'restarted'
-        # won't get set
-        log.debug("restarting rsyslog")
+        # won't get set.
+        log.debug("Restarting rsyslog")
         util.subp(['service', 'rsyslog', 'restart'])
         restarted = True
-
     except Exception as e:
-        elst.append(("restart", str(e)))
+        util.logexc(log, "Failed restarting rsyslog")
 
     if restarted:
-        # this only needs to run if we *actually* restarted
+        # This only needs to run if we *actually* restarted
         # syslog above.
-        cloudinit.logging_set_from_cfg_file()
-        log = logging.getLogger()
-        log.debug("rsyslog configured %s" % files)
-
-    for e in elst:
-        log.warn("rsyslog error: %s\n" % ':'.join(e))
-
-    return
+        cloud.cycle_logging()
+        # This should now use rsyslog if
+        # the logging was setup to use it...
+        log.debug("%s configured %s files", name, files)
diff --git a/cloudinit/transforms/cc_runcmd.py b/cloudinit/transforms/cc_runcmd.py
index f7e8c671..19c0e721 100644
--- a/cloudinit/transforms/cc_runcmd.py
+++ b/cloudinit/transforms/cc_runcmd.py
@@ -18,15 +18,20 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
+import os
+
+from cloudinit import util
 
 
-def handle(_name, cfg, cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
     if "runcmd" not in cfg:
+        log.debug("Skipping module named %s, no 'runcmd' key in configuration", name)
         return
-    outfile = "%s/runcmd" % cloud.get_ipath('scripts')
+
+    outfile = os.path.join(cloud.get_ipath('scripts'), "runcmd")
+    cmd = cfg["runcmd"]
     try:
-        content = util.shellify(cfg["runcmd"])
+        content = util.shellify(cmd)
         util.write_file(outfile, content, 0700)
     except:
-        log.warn("failed to open %s for runcmd" % outfile)
+        util.logexc(log, "Failed to shellify %s into file %s", cmd, outfile)
diff --git a/cloudinit/transforms/cc_salt_minion.py b/cloudinit/transforms/cc_salt_minion.py
index 1a3b5039..47cbc194 100644
--- a/cloudinit/transforms/cc_salt_minion.py
+++ b/cloudinit/transforms/cc_salt_minion.py
@@ -15,42 +15,43 @@
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
 import os
-import os.path
-import subprocess
-import cloudinit.CloudConfig as cc
-import yaml
+
+from cloudinit import util
+
+# Note: see http://saltstack.org/topics/installation/
 
 
-def handle(_name, cfg, _cloud, _log, _args):
+def handle(name, cfg, cloud, log, _args):
     # If there isn't a salt key in the configuration don't do anything
     if 'salt_minion' not in cfg:
+        log.debug("Skipping module named %s, no 'salt_minion' key in configuration", name)
         return
+
     salt_cfg = cfg['salt_minion']
+
     # Start by installing the salt package ...
-    cc.install_packages(("salt",))
-    config_dir = '/etc/salt'
-    if not os.path.isdir(config_dir):
-        os.makedirs(config_dir)
+    cloud.distro.install_packages(("salt",))
+    
+    # Ensure we can configure files at the right dir
+    config_dir = salt_cfg.get("config_dir", '/etc/salt')
+    util.ensure_dir(config_dir)
+
     # ... and then update the salt configuration
     if 'conf' in salt_cfg:
         # Add all sections from the conf object to /etc/salt/minion
         minion_config = os.path.join(config_dir, 'minion')
-        yaml.dump(salt_cfg['conf'],
-                  file(minion_config, 'w'),
-                  default_flow_style=False)
+        minion_data = util.yaml_dumps(salt_cfg.get('conf'))
+        util.write_file(minion_config, minion_data)
+
     # ... copy the key pair if specified
     if 'public_key' in salt_cfg and 'private_key' in salt_cfg:
-        pki_dir = '/etc/salt/pki'
-        cumask = os.umask(077)
-        if not os.path.isdir(pki_dir):
-            os.makedirs(pki_dir)
-        pub_name = os.path.join(pki_dir, 'minion.pub')
-        pem_name = os.path.join(pki_dir, 'minion.pem')
-        with open(pub_name, 'w') as f:
-            f.write(salt_cfg['public_key'])
-        with open(pem_name, 'w') as f:
-            f.write(salt_cfg['private_key'])
-        os.umask(cumask)
+        pki_dir = salt_cfg.get('pki_dir', '/etc/salt/pki')
+        with util.umask(077):
+            util.ensure_dir(pki_dir)
+            pub_name = os.path.join(pki_dir, 'minion.pub')
+            pem_name = os.path.join(pki_dir, 'minion.pem')
+            util.write_file(pub_name, salt_cfg['public_key'])
+            util.write_file(pem_name, salt_cfg['private_key'])
 
     # Start salt-minion
-    subprocess.check_call(['service', 'salt-minion', 'start'])
+    util.subp(['service', 'salt-minion', 'start'], capture=False)
diff --git a/cloudinit/transforms/cc_scripts_per_boot.py b/cloudinit/transforms/cc_scripts_per_boot.py
index 41a74754..bcdf4400 100644
--- a/cloudinit/transforms/cc_scripts_per_boot.py
+++ b/cloudinit/transforms/cc_scripts_per_boot.py
@@ -18,17 +18,23 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-from cloudinit.CloudConfig import per_always
-from cloudinit import get_cpath
+import os
 
-frequency = per_always
-runparts_path = "%s/%s" % (get_cpath(), "scripts/per-boot")
+from cloudinit import util
+
+from cloudinit.settings import PER_ALWAYS
+
+frequency = PER_ALWAYS
+
+script_subdir = 'per-boot'
 
 
-def handle(_name, _cfg, _cloud, log, _args):
+def handle(_name, _cfg, cloud, log, _args):
+    # Comes from the following:
+    # https://forums.aws.amazon.com/thread.jspa?threadID=96918
+    runparts_path = os.path.join(cloud.get_cpath(), 'scripts', script_subdir)
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("failed to run-parts in %s" % runparts_path)
+        log.warn("Failed to run-parts(%s) in %s", script_subdir, runparts_path)
         raise
diff --git a/cloudinit/transforms/cc_scripts_per_instance.py b/cloudinit/transforms/cc_scripts_per_instance.py
index a2981eab..8d6609a1 100644
--- a/cloudinit/transforms/cc_scripts_per_instance.py
+++ b/cloudinit/transforms/cc_scripts_per_instance.py
@@ -18,17 +18,23 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-from cloudinit.CloudConfig import per_instance
-from cloudinit import get_cpath
+import os
 
-frequency = per_instance
-runparts_path = "%s/%s" % (get_cpath(), "scripts/per-instance")
+from cloudinit import util
+
+from cloudinit.settings import PER_INSTANCE
+
+frequency = PER_INSTANCE
+
+script_subdir = 'per-instance'
 
 
-def handle(_name, _cfg, _cloud, log, _args):
+def handle(_name, _cfg, cloud, log, _args):
+    # Comes from the following:
+    # https://forums.aws.amazon.com/thread.jspa?threadID=96918
+    runparts_path = os.path.join(cloud.get_cpath(), 'scripts', script_subdir)
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("failed to run-parts in %s" % runparts_path)
+        log.warn("Failed to run-parts(%s) in %s", script_subdir, runparts_path)
         raise
diff --git a/cloudinit/transforms/cc_scripts_per_once.py b/cloudinit/transforms/cc_scripts_per_once.py
index a69151da..dbcec05d 100644
--- a/cloudinit/transforms/cc_scripts_per_once.py
+++ b/cloudinit/transforms/cc_scripts_per_once.py
@@ -18,17 +18,23 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-from cloudinit.CloudConfig import per_once
-from cloudinit import get_cpath
+import os
 
-frequency = per_once
-runparts_path = "%s/%s" % (get_cpath(), "scripts/per-once")
+from cloudinit import util
+
+from cloudinit.settings import PER_ONCE
+
+frequency = PER_ONCE
+
+script_subdir = 'per-once'
 
 
-def handle(_name, _cfg, _cloud, log, _args):
+def handle(_name, _cfg, cloud, log, _args):
+    # Comes from the following:
+    # https://forums.aws.amazon.com/thread.jspa?threadID=96918
+    runparts_path = os.path.join(cloud.get_cpath(), 'scripts', script_subdir)
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("failed to run-parts in %s" % runparts_path)
+        log.warn("Failed to run-parts(%s) in %s", script_subdir, runparts_path)
         raise
diff --git a/cloudinit/transforms/cc_scripts_user.py b/cloudinit/transforms/cc_scripts_user.py
index 933aa4e0..1e438ee6 100644
--- a/cloudinit/transforms/cc_scripts_user.py
+++ b/cloudinit/transforms/cc_scripts_user.py
@@ -18,17 +18,22 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-from cloudinit.CloudConfig import per_instance
-from cloudinit import get_ipath_cur
+import os
 
-frequency = per_instance
-runparts_path = "%s/%s" % (get_ipath_cur(), "scripts")
+from cloudinit import util
+
+from cloudinit.settings import PER_INSTANCE
+
+frequency = PER_INSTANCE
 
 
-def handle(_name, _cfg, _cloud, log, _args):
+def handle(_name, _cfg, cloud, log, _args):
+    # This is written to by the user data handlers
+    # Ie, any custom shell scripts that come down
+    # go here...
+    runparts_path = os.path.join(cloud.get_ipath_cur(), "scripts")
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("failed to run-parts in %s" % runparts_path)
+        log.warn("Failed to run-parts(%s) in %s", "user-data", runparts_path)
         raise
diff --git a/cloudinit/transforms/cc_set_hostname.py b/cloudinit/transforms/cc_set_hostname.py
index acea74d9..fa2b59c2 100644
--- a/cloudinit/transforms/cc_set_hostname.py
+++ b/cloudinit/transforms/cc_set_hostname.py
@@ -18,25 +18,18 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
+from cloudinit import util
 
 
-def handle(_name, cfg, cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
     if util.get_cfg_option_bool(cfg, "preserve_hostname", False):
-        log.debug("preserve_hostname is set. not setting hostname")
-        return(True)
+        log.debug(("Configuration option 'preserve_hostname' is set,"
+                    " not setting the hostname in %s"), name)
+        return
 
     (hostname, _fqdn) = util.get_hostname_fqdn(cfg, cloud)
     try:
-        set_hostname(hostname, log)
+        log.debug("Setting hostname to %s", hostname)
+        cloud.distro.set_hostname(hostname)
     except Exception:
-        util.logexc(log)
-        log.warn("failed to set hostname to %s\n", hostname)
-
-    return(True)
-
-
-def set_hostname(hostname, log):
-    util.subp(['hostname', hostname])
-    util.write_file("/etc/hostname", "%s\n" % hostname, 0644)
-    log.debug("populated /etc/hostname with %s on first boot", hostname)
+        util.logexc(log, "Failed to set hostname to %s", hostname)
diff --git a/cloudinit/transforms/cc_set_passwords.py b/cloudinit/transforms/cc_set_passwords.py
index 9d0bbdb8..4f2cdb97 100644
--- a/cloudinit/transforms/cc_set_passwords.py
+++ b/cloudinit/transforms/cc_set_passwords.py
@@ -18,13 +18,18 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
 import sys
-import random
-from string import letters, digits  # pylint: disable=W0402
+
+from cloudinit import util
+
+from string import letters, digits
+
+# We are removing certain 'painful' letters/numbers
+pw_set = (letters.translate(None, 'loLOI') +
+          digits.translate(None, '01'))
 
 
-def handle(_name, cfg, _cloud, log, args):
+def handle(_name, cfg, cloud, log, args):
     if len(args) != 0:
         # if run from command line, and give args, wipe the chpasswd['list']
         password = args[0]
@@ -62,68 +67,83 @@ def handle(_name, cfg, _cloud, log, args):
 
         ch_in = '\n'.join(plist_in)
         try:
+            log.debug("Changing password for %s:", users)
             util.subp(['chpasswd'], ch_in)
-            log.debug("changed password for %s:" % users)
         except Exception as e:
             errors.append(e)
-            log.warn("failed to set passwords with chpasswd: %s" % e)
+            util.logexc(log, "Failed to set passwords with chpasswd for %s", users)
 
         if len(randlist):
-            sys.stdout.write("%s\n%s\n" % ("Set the following passwords\n",
+            sys.stderr.write("%s\n%s\n" % ("Set the following 'random' passwords\n",
                 '\n'.join(randlist)))
 
         if expire:
-            enum = len(errors)
+            expired_users = []
             for u in users:
                 try:
                     util.subp(['passwd', '--expire', u])
+                    expired_users.append(u)
                 except Exception as e:
                     errors.append(e)
-                    log.warn("failed to expire account for %s" % u)
-            if enum == len(errors):
-                log.debug("expired passwords for: %s" % u)
+                    util.logexc(log, "Failed to set 'expire' for %s", u)
+            if expired_users:
+                log.debug("Expired passwords for: %s users", expired_users)
 
+    change_pwauth = False
+    pw_auth = None
     if 'ssh_pwauth' in cfg:
-        val = str(cfg['ssh_pwauth']).lower()
-        if val in ("true", "1", "yes"):
-            pw_auth = "yes"
-            change_pwauth = True
-        elif val in ("false", "0", "no"):
-            pw_auth = "no"
-            change_pwauth = True
-        else:
-            change_pwauth = False
+        if util.is_true_str(cfg['ssh_pwauth']):
+            pw_auth = 'yes'
+        if util.is_false_str(cfg['ssh_pwauth']):
+            pw_auth = 'no'
+        change_pwauth = pw_auth is not None
 
     if change_pwauth:
-        pa_s = "\(#*\)\(PasswordAuthentication[[:space:]]\+\)\(yes\|no\)"
-        msg = "set PasswordAuthentication to '%s'" % pw_auth
-        try:
-            cmd = ['sed', '-i', 's,%s,\\2%s,' % (pa_s, pw_auth),
-                   '/etc/ssh/sshd_config']
-            util.subp(cmd)
-            log.debug(msg)
-        except Exception as e:
-            log.warn("failed %s" % msg)
-            errors.append(e)
+        new_lines = []
+        replaced_auth = False
+        replacement = "PasswordAuthentication %s" % (pw_auth)
+
+        # See http://linux.die.net/man/5/sshd_config
+        old_lines = util.load_file('/etc/ssh/sshd_config').splitlines()
+        for i, line in enumerate(old_lines):
+            if not line.strip() or line.startswith("#"):
+                new_lines.append(line)
+                continue
+            splitup = line.split(None, 1)
+            if len(splitup) <= 1:
+                new_lines.append(line)
+                continue
+            (cmd, args) = splitup
+            # Keywords are case-insensitive and arguments are case-sensitive
+            cmd = cmd.lower().strip()
+            if cmd == 'passwordauthentication':
+                log.debug("Replacing auth line %s with %s", i + 1, replacement)
+                replaced_auth = True
+                new_lines.append(replacement)
+            else:
+                new_lines.append(line)
+
+        if not replaced_auth:
+            log.debug("Adding new auth line %s", replacement)
+            replaced_auth = True
+            new_lines.append(replacement)
+
+        new_contents = "\n".join(new_lines)
+        util.write_file('/etc/ssh/sshd_config', new_contents)
 
         try:
-            p = util.subp(['service', cfg.get('ssh_svcname', 'ssh'),
-                           'restart'])
-            log.debug("restarted sshd")
+            cmd = ['service']
+            cmd.append(cloud.distro.get_option('ssh_svcname', 'ssh'))
+            cmd.append('restart')
+            util.subp(cmd)
+            log.debug("Restarted the ssh daemon")
         except:
-            log.warn("restart of ssh failed")
+            util.logexc(log, "Restarting of the ssh daemon failed")
 
     if len(errors):
-        raise(errors[0])
-
-    return
-
-
-def rand_str(strlen=32, select_from=letters + digits):
-    return("".join([random.choice(select_from) for _x in range(0, strlen)]))
+        log.debug("%s errors occured, re-raising the last one", len(errors))
+        raise errors[-1]
 
 
 def rand_user_password(pwlen=9):
-    selfrom = (letters.translate(None, 'loLOI') +
-               digits.translate(None, '01'))
-    return(rand_str(pwlen, select_from=selfrom))
+    return util.rand_str(pwlen, select_from=pw_set)
diff --git a/cloudinit/transforms/cc_ssh.py b/cloudinit/transforms/cc_ssh.py
index 48eb58bc..db6848d9 100644
--- a/cloudinit/transforms/cc_ssh.py
+++ b/cloudinit/transforms/cc_ssh.py
@@ -18,15 +18,34 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-import cloudinit.SshUtil as sshutil
 import os
 import glob
-import subprocess
 
-DISABLE_ROOT_OPTS = "no-port-forwarding,no-agent-forwarding," \
-"no-X11-forwarding,command=\"echo \'Please login as the user \\\"$USER\\\" " \
-"rather than the user \\\"root\\\".\';echo;sleep 10\""
+from cloudinit import util
+from cloudinit import ssh_util
+
+DISABLE_ROOT_OPTS = ( "no-port-forwarding,no-agent-forwarding," 
+"no-X11-forwarding,command=\"echo \'Please login as the user \\\"$USER\\\" " 
+"rather than the user \\\"root\\\".\';echo;sleep 10\"")
+
+key2file = {
+    "rsa_private": ("/etc/ssh/ssh_host_rsa_key", 0600),
+    "rsa_public": ("/etc/ssh/ssh_host_rsa_key.pub", 0644),
+    "dsa_private": ("/etc/ssh/ssh_host_dsa_key", 0600),
+    "dsa_public": ("/etc/ssh/ssh_host_dsa_key.pub", 0644),
+    "ecdsa_private": ("/etc/ssh/ssh_host_ecdsa_key", 0600),
+    "ecdsa_public": ("/etc/ssh/ssh_host_ecdsa_key.pub", 0644),
+}
+
+priv2pub = {
+    'rsa_private': 'rsa_public', 
+    'dsa_private': 'dsa_public',
+    'ecdsa_private': 'ecdsa_public',
+}
+
+key_gen_tpl = 'o=$(ssh-keygen -yf "%s") && echo "$o" root@localhost > "%s"'
+
+generate_keys = ['rsa', 'dsa', 'ecdsa']
 
 
 def handle(_name, cfg, cloud, log, _args):
@@ -35,72 +54,70 @@ def handle(_name, cfg, cloud, log, _args):
     if cfg.get("ssh_deletekeys", True):
         for f in glob.glob("/etc/ssh/ssh_host_*key*"):
             try:
-                os.unlink(f)
+                util.del_file(f)
             except:
-                pass
-
+                util.logexc(log, "Failed deleting key file %s", f)
+    
     if "ssh_keys" in cfg:
         # if there are keys in cloud-config, use them
-        key2file = {
-            "rsa_private": ("/etc/ssh/ssh_host_rsa_key", 0600),
-            "rsa_public": ("/etc/ssh/ssh_host_rsa_key.pub", 0644),
-            "dsa_private": ("/etc/ssh/ssh_host_dsa_key", 0600),
-            "dsa_public": ("/etc/ssh/ssh_host_dsa_key.pub", 0644),
-            "ecdsa_private": ("/etc/ssh/ssh_host_ecdsa_key", 0600),
-            "ecdsa_public": ("/etc/ssh/ssh_host_ecdsa_key.pub", 0644),
-        }
-
-        for key, val in cfg["ssh_keys"].items():
+        for (key, val) in cfg["ssh_keys"].iteritems():
             if key in key2file:
-                util.write_file(key2file[key][0], val, key2file[key][1])
-
-        priv2pub = {'rsa_private': 'rsa_public', 'dsa_private': 'dsa_public',
-                    'ecdsa_private': 'ecdsa_public', }
-
+                tgt_fn = key2file[key][0]
+                tgt_perms = key2file[key][1]
+                util.write_file(tgt_fn, val, tgt_perms)
+    
         cmd = 'o=$(ssh-keygen -yf "%s") && echo "$o" root@localhost > "%s"'
         for priv, pub in priv2pub.iteritems():
             if pub in cfg['ssh_keys'] or not priv in cfg['ssh_keys']:
                 continue
             pair = (key2file[priv][0], key2file[pub][0])
-            subprocess.call(('sh', '-xc', cmd % pair))
-            log.debug("generated %s from %s" % pair)
+            cmd = ['sh', '-xc', key_gen_tpl % pair]
+            try:
+                # TODO: Is this guard needed?
+                with util.SeLinuxGuard("/etc/ssh", recursive=True):
+                    util.subp(cmd, capture=False)
+                log.debug("Generated a key for %s from %s", pair[0], pair[1])
+            except:
+                util.logexc(log, "Failed generated a key for %s from %s", pair[0], pair[1])
     else:
         # if not, generate them
-        for keytype in util.get_cfg_option_list_or_str(cfg, 'ssh_genkeytypes',
-                                                      ['rsa', 'dsa', 'ecdsa']):
+        for keytype in util.get_cfg_option_list_or_str(cfg, 'ssh_genkeytypes', generate_keys):
             keyfile = '/etc/ssh/ssh_host_%s_key' % keytype
             if not os.path.exists(keyfile):
-                subprocess.call(['ssh-keygen', '-t', keytype, '-N', '',
-                                 '-f', keyfile])
-
-    util.restorecon_if_possible('/etc/ssh', recursive=True)
+                cmd = ['ssh-keygen', '-t', keytype, '-N', '', '-f', keyfile]
+                try:
+                    # TODO: Is this guard needed?
+                    with util.SeLinuxGuard("/etc/ssh", recursive=True):
+                        util.subp(cmd, capture=False)
+                except:
+                    util.logexc(log, "Failed generating key type %s to file %s", keytype, keyfile)
 
     try:
         user = util.get_cfg_option_str(cfg, 'user')
         disable_root = util.get_cfg_option_bool(cfg, "disable_root", True)
         disable_root_opts = util.get_cfg_option_str(cfg, "disable_root_opts",
             DISABLE_ROOT_OPTS)
-        keys = cloud.get_public_ssh_keys()
 
+        keys = cloud.get_public_ssh_keys() or []
         if "ssh_authorized_keys" in cfg:
             cfgkeys = cfg["ssh_authorized_keys"]
             keys.extend(cfgkeys)
 
         apply_credentials(keys, user, disable_root, disable_root_opts, log)
     except:
-        util.logexc(log)
-        log.warn("applying credentials failed!\n")
+        util.logexc(log, "Applying ssh credentials failed!")
 
 
 def apply_credentials(keys, user, disable_root,
                       disable_root_opts=DISABLE_ROOT_OPTS, log=None):
+
     keys = set(keys)
     if user:
-        sshutil.setup_user_keys(keys, user, '', log)
+        ssh_util.setup_user_keys(keys, user, '')
 
-    if disable_root:
+    if disable_root and user:
         key_prefix = disable_root_opts.replace('$USER', user)
     else:
         key_prefix = ''
 
-    sshutil.setup_user_keys(keys, 'root', key_prefix, log)
+    ssh_util.setup_user_keys(keys, 'root', key_prefix)
diff --git a/cloudinit/transforms/cc_ssh_import_id.py b/cloudinit/transforms/cc_ssh_import_id.py
index bbf5bd83..019413d4 100644
--- a/cloudinit/transforms/cc_ssh_import_id.py
+++ b/cloudinit/transforms/cc_ssh_import_id.py
@@ -18,12 +18,14 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-import subprocess
-import traceback
+from cloudinit import util
+
+# The ssh-import-id only seems to exist on ubuntu (for now)
+# https://launchpad.net/ssh-import-id
+distros = ['ubuntu']
 
 
-def handle(_name, cfg, _cloud, log, args):
+def handle(name, cfg, _cloud, log, args):
     if len(args) != 0:
         user = args[0]
         ids = []
@@ -34,17 +36,14 @@ def handle(_name, cfg, _cloud, log, args):
         ids = util.get_cfg_option_list_or_str(cfg, "ssh_import_id", [])
 
     if len(ids) == 0:
+        log.debug("Skipping module named %s, no ids found to import", name)
         return
 
     cmd = ["sudo", "-Hu", user, "ssh-import-id"] + ids
-
-    log.debug("importing ssh ids. cmd = %s" % cmd)
+    log.debug("Importing ssh ids for user %s.", user)
 
     try:
-        subprocess.check_call(cmd)
-    except subprocess.CalledProcessError as e:
-        log.debug(traceback.format_exc(e))
-        raise Exception("Cmd returned %s: %s" % (e.returncode, cmd))
-    except OSError as e:
-        log.debug(traceback.format_exc(e))
-        raise Exception("Cmd failed to execute: %s" % (cmd))
+        util.subp(cmd, capture=False)
+    except util.ProcessExecutionError as e:
+        util.logexc(log, "Failed to run command to import %s ssh ids", user)
+        raise e
diff --git a/cloudinit/transforms/cc_timezone.py b/cloudinit/transforms/cc_timezone.py
index e5c9901b..6fb5edc0 100644
--- a/cloudinit/transforms/cc_timezone.py
+++ b/cloudinit/transforms/cc_timezone.py
@@ -18,50 +18,20 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-from cloudinit.CloudConfig import per_instance
 from cloudinit import util
-import os.path
-import shutil
+from cloudinit.settings import PER_INSTANCE
 
-frequency = per_instance
-tz_base = "/usr/share/zoneinfo"
+frequency = PER_INSTANCE
 
 
-def handle(_name, cfg, _cloud, log, args):
+def handle(name, cfg, cloud, log, args):
     if len(args) != 0:
         timezone = args[0]
     else:
         timezone = util.get_cfg_option_str(cfg, "timezone", False)
 
     if not timezone:
+        log.debug("Skipping module named %s, no 'timezone' specified", name)
         return
 
-    tz_file = "%s/%s" % (tz_base, timezone)
-
-    if not os.path.isfile(tz_file):
-        log.debug("Invalid timezone %s" % tz_file)
-        raise Exception("Invalid timezone %s" % tz_file)
-
-    try:
-        fp = open("/etc/timezone", "wb")
-        fp.write("%s\n" % timezone)
-        fp.close()
-    except:
-        log.debug("failed to write to /etc/timezone")
-        raise
-    if os.path.exists("/etc/sysconfig/clock"):
-        try:
-            with open("/etc/sysconfig/clock", "w") as fp:
-                fp.write('ZONE="%s"\n' % timezone)
-        except:
-            log.debug("failed to write to /etc/sysconfig/clock")
-            raise
-
-    try:
-        shutil.copy(tz_file, "/etc/localtime")
-    except:
-        log.debug("failed to copy %s to /etc/localtime" % tz_file)
-        raise
-
-    log.debug("set timezone to %s" % timezone)
-    return
+    cloud.distro.set_timezone(timezone)
diff --git a/cloudinit/transforms/cc_update_etc_hosts.py b/cloudinit/transforms/cc_update_etc_hosts.py
index 6ad2fca8..361097a6 100644
--- a/cloudinit/transforms/cc_update_etc_hosts.py
+++ b/cloudinit/transforms/cc_update_etc_hosts.py
@@ -18,70 +18,34 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-from cloudinit.CloudConfig import per_always
-import StringIO
+from cloudinit import util
+from cloudinit import templater
 
-frequency = per_always
+from cloudinit.settings import PER_ALWAYS
+
+frequency = PER_ALWAYS
 
 
-def handle(_name, cfg, cloud, log, _args):
-    (hostname, fqdn) = util.get_hostname_fqdn(cfg, cloud)
-
+def handle(name, cfg, cloud, log, _args):
     manage_hosts = util.get_cfg_option_str(cfg, "manage_etc_hosts", False)
-    if manage_hosts in ("True", "true", True, "template"):
-        # render from template file
-        try:
-            if not hostname:
-                log.info("manage_etc_hosts was set, but no hostname found")
-                return
-
-            util.render_to_file('hosts', '/etc/hosts',
+    if util.translate_bool(manage_hosts, addons=['template']):
+        (hostname, fqdn) = util.get_hostname_fqdn(cfg, cloud)
+        # Render from template file
+        if not hostname:
+            log.warn("Option 'manage_etc_hosts' was set, but no hostname was found")
+            return
+        tpl_fn_name = cloud.get_template_filename("hosts.%s" % (cloud.distro.name()))
+        if not tpl_fn_name:
+            raise Exception("No hosts template could be found for distro %s" % (cloud.distro.name()))
+        templater.render_to_file(tpl_fn_name, '/etc/hosts',
                                 {'hostname': hostname, 'fqdn': fqdn})
-        except Exception:
-            log.warn("failed to update /etc/hosts")
-            raise
     elif manage_hosts == "localhost":
-        log.debug("managing 127.0.1.1 in /etc/hosts")
-        update_etc_hosts(hostname, fqdn, log)
-        return
+        log.debug("Managing localhost in /etc/hosts")
+        (hostname, fqdn) = util.get_hostname_fqdn(cfg, cloud)
+        if not hostname:
+            log.warn("Option 'manage_etc_hosts' was set, but no hostname was found")
+            return
+        cloud.distro.update_etc_hosts(hostname, fqdn)
     else:
-        if manage_hosts not in ("False", False):
-            log.warn("Unknown value for manage_etc_hosts.  Assuming False")
-        else:
-            log.debug("not managing /etc/hosts")
-
-
-def update_etc_hosts(hostname, fqdn, _log):
-    with open('/etc/hosts', 'r') as etchosts:
-        header = "# Added by cloud-init\n"
-        hosts_line = "127.0.1.1\t%s %s\n" % (fqdn, hostname)
-        need_write = False
-        need_change = True
-        new_etchosts = StringIO.StringIO()
-        for line in etchosts:
-            split_line = [s.strip() for s in line.split()]
-            if len(split_line) < 2:
-                new_etchosts.write(line)
-                continue
-            if line == header:
-                continue
-            ip, hosts = split_line[0], split_line[1:]
-            if ip == "127.0.1.1":
-                if sorted([hostname, fqdn]) == sorted(hosts):
-                    need_change = False
-                if need_change == True:
-                    line = "%s%s" % (header, hosts_line)
-                    need_change = False
-                    need_write = True
-            new_etchosts.write(line)
-        etchosts.close()
-        if need_change == True:
-            new_etchosts.write("%s%s" % (header, hosts_line))
-            need_write = True
-        if need_write == True:
-            new_etcfile = open('/etc/hosts', 'wb')
-            new_etcfile.write(new_etchosts.getvalue())
-            new_etcfile.close()
-        new_etchosts.close()
-    return
+        log.debug(("Configuration option 'manage_etc_hosts' is not set,"
+                    " not managing /etc/hosts in %s"), name)
diff --git a/cloudinit/transforms/cc_update_hostname.py b/cloudinit/transforms/cc_update_hostname.py
index b9d1919a..439bdcb3 100644
--- a/cloudinit/transforms/cc_update_hostname.py
+++ b/cloudinit/transforms/cc_update_hostname.py
@@ -18,84 +18,22 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import cloudinit.util as util
-import subprocess
-import errno
-from cloudinit.CloudConfig import per_always
+from cloudinit import util
+from cloudinit.settings import PER_ALWAYS
 
-frequency = per_always
+frequency = PER_ALWAYS
 
 
-def handle(_name, cfg, cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
     if util.get_cfg_option_bool(cfg, "preserve_hostname", False):
-        log.debug("preserve_hostname is set. not updating hostname")
+        log.debug(("Configuration option 'preserve_hostname' is set,"
+                    " not updating the hostname in %s"), name)
         return
 
     (hostname, _fqdn) = util.get_hostname_fqdn(cfg, cloud)
     try:
-        prev = "%s/%s" % (cloud.get_cpath('data'), "previous-hostname")
-        update_hostname(hostname, prev, log)
+        prev_fn = os.path.join(cloud.get_cpath('data'), "previous-hostname")
+        cloud.distro.update_hostname(hostname, prev_fn)
     except Exception:
-        log.warn("failed to set hostname\n")
+        util.logexc(log, "Failed to set the hostname to %s", hostname)
         raise
-
-
-# read hostname from a 'hostname' file
-# allow for comments and stripping line endings.
-# if file doesn't exist, or no contents, return default
-def read_hostname(filename, default=None):
-    try:
-        fp = open(filename, "r")
-        lines = fp.readlines()
-        fp.close()
-        for line in lines:
-            hpos = line.find("#")
-            if hpos != -1:
-                line = line[0:hpos]
-            line = line.rstrip()
-            if line:
-                return line
-    except IOError as e:
-        if e.errno != errno.ENOENT:
-            raise
-    return default
-
-
-def update_hostname(hostname, prev_file, log):
-    etc_file = "/etc/hostname"
-
-    hostname_prev = None
-    hostname_in_etc = None
-
-    try:
-        hostname_prev = read_hostname(prev_file)
-    except Exception as e:
-        log.warn("Failed to open %s: %s" % (prev_file, e))
-
-    try:
-        hostname_in_etc = read_hostname(etc_file)
-    except:
-        log.warn("Failed to open %s" % etc_file)
-
-    update_files = []
-    if not hostname_prev or hostname_prev != hostname:
-        update_files.append(prev_file)
-
-    if (not hostname_in_etc or
-        (hostname_in_etc == hostname_prev and hostname_in_etc != hostname)):
-        update_files.append(etc_file)
-
-    try:
-        for fname in update_files:
-            util.write_file(fname, "%s\n" % hostname, 0644)
-            log.debug("wrote %s to %s" % (hostname, fname))
-    except:
-        log.warn("failed to write hostname to %s" % fname)
-
-    if hostname_in_etc and hostname_prev and hostname_in_etc != hostname_prev:
-        log.debug("%s differs from %s. assuming user maintained" %
-                  (prev_file, etc_file))
-
-    if etc_file in update_files:
-        log.debug("setting hostname to %s" % hostname)
-        subprocess.Popen(['hostname', hostname]).communicate()

From df9a110911eac485910d5e1d8de34ae10999dd7c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 18:24:04 -0700
Subject: [PATCH 110/434] Ensure when an exception is captured that we use the
 util.logexc helper.

---
 cloudinit/ssh_util.py | 20 ++++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index c97b3819..f6941a29 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -144,13 +144,13 @@ class AuthKeyEntry(object):
             return ' '.join(toks)
 
 
-def _update_authorized_keys(fname, keys):
+def update_authorized_keys(fname, keys):
     lines = []
     try:
         if os.path.isfile(fname):
             lines = util.load_file(fname).splitlines()
     except (IOError, OSError):
-        LOG.exception("Error reading lines from %s", fname)
+        util.logexc(LOG, "Error reading lines from %s", fname)
         lines = []
 
     to_add = list(keys)
@@ -199,7 +199,7 @@ def setup_user_keys(keys, user, key_prefix, sshd_config_fn=None):
             # The following tokens are defined: %% is replaced by a literal
             # '%', %h is replaced by the home directory of the user being
             # authenticated and %u is replaced by the username of that user.
-            ssh_cfg = _parse_ssh_config(sshd_config_fn)
+            ssh_cfg = parse_ssh_config(sshd_config_fn)
             akeys = ssh_cfg.get("authorizedkeysfile", '')
             akeys = akeys.strip()
             if not akeys:
@@ -212,19 +212,19 @@ def setup_user_keys(keys, user, key_prefix, sshd_config_fn=None):
             authorized_keys = akeys
         except (IOError, OSError):
             authorized_keys = os.path.join(ssh_dir, 'authorized_keys')
-            LOG.exception(("Failed extracting 'AuthorizedKeysFile'"
-                            " in ssh config"
-                            " from %s, using 'AuthorizedKeysFile' file"
-                            " %s instead"),
-                           sshd_config_fn, authorized_keys)
+            util.logexc(LOG, ("Failed extracting 'AuthorizedKeysFile'"
+                              " in ssh config"
+                              " from %s, using 'AuthorizedKeysFile' file"
+                              " %s instead"),
+                        sshd_config_fn, authorized_keys)
 
-        content = _update_authorized_keys(authorized_keys, key_entries)
+        content = update_authorized_keys(authorized_keys, key_entries)
         util.ensure_dir(os.path.dirname(authorized_keys), mode=0700)
         util.write_file(authorized_keys, content, mode=0600)
         util.chownbyid(authorized_keys, pwent.pw_uid, pwent.pw_gid)
 
 
-def _parse_ssh_config(fname):
+def parse_ssh_config(fname):
     # The file contains keyword-argument pairs, one per line.
     # Lines starting with '#' and empty lines are interpreted as comments.
     # Note: key-words are case-insensitive and arguments are case-sensitive

From c9d43b8d348136b016b4acc69d35b8b63d8b925b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 18:24:40 -0700
Subject: [PATCH 111/434] 1. Modify the check http code function to allow or
 disallow redirect statuses as valid codes. 2. Log how long we will
 sleep for. 3. If no headers are provided, add a set which will have a cloud
 init user agent + version

---
 cloudinit/url_helper.py | 23 +++++++++++++++--------
 1 file changed, 15 insertions(+), 8 deletions(-)

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 1bf24c4f..7ae0226a 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -29,12 +29,16 @@ import urllib
 import urllib2
 
 from cloudinit import log as logging
+from cloudinit import version
 
 LOG = logging.getLogger(__name__)
 
 
-def ok_http_code(st):
-    return st in xrange(200, 400)
+def ok_http_code(st, redirects_ok=False):
+    if redirects_ok:
+        return st in xrange(200, 400)
+    else:
+        return st in xrange(200, 300)
 
 
 def readurl(url, data=None, timeout=None,
@@ -44,8 +48,13 @@ def readurl(url, data=None, timeout=None,
     req_args['url'] = url
     if data is not None:
         req_args['data'] = urllib.urlencode(data)
-    if headers is not None:
-        req_args['headers'] = dict(headers)
+
+    if not headers:
+        headers = {
+            'User-Agent': 'Cloud-Init/%s' % (version.version_string()),
+        }
+
+    req_args['headers'] = headers
     req = urllib2.Request(**req_args)
 
     retries = max(retries, 0)
@@ -70,19 +79,17 @@ def readurl(url, data=None, timeout=None,
                 return (content, status)
         except urllib2.HTTPError as e:
             last_excp = e
-            LOG.exception("Failed at reading from %s.", url)
         except urllib2.URLError as e:
             # This can be a message string or
             # another exception instance 
             # (socket.error for remote URLs, OSError for local URLs).
-            if (isinstance(e.reason, OSError) and
+            if (isinstance(e.reason, (OSError)) and
                 e.reason.errno == errno.ENOENT):
                 last_excp = e.reason
             else:
                 last_excp = e
-            LOG.exception("Failed at reading from %s", url)
         if i + 1 < attempts:
-            LOG.info("Please wait %s seconds while we wait to try again",
+            LOG.debug("Please wait %s seconds while we wait to try again",
                      sec_between)
             time.sleep(sec_between)
 

From 195a7172a832d2675143951757d52c7c372f4cc1 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 18:26:34 -0700
Subject: [PATCH 112/434] Inclusion of more utility functions, including:

1. Adjustments to using more selinux guards around directory creation, chmod...
2. Adding util functions to check if values are false or true (used internally and externally)
3. Move find_devs_with to util.py and allow it to serve multiple use cases
4. Add fork_cb which will fork a process and then call a certain callback (used right now by the resize nonblocking mode)
5. Move functions that performed time_rfc2822 time fetching and uptime fetching to here.
6. Allow the subp util function to act in shell mode
7. Increase logging usefulness in shellify function
---
 cloudinit/util.py | 282 ++++++++++++++++++++++++++++++++++++----------
 1 file changed, 221 insertions(+), 61 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 7d5932c1..7259d933 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -28,14 +28,18 @@ import errno
 import glob
 import grp
 import gzip
+import hashlib
 import os
 import platform
 import pwd
+import random
 import shutil
 import socket
+import string
 import subprocess
 import sys
 import tempfile
+import time
 import traceback
 import types
 import urlparse
@@ -68,8 +72,11 @@ CONTAINER_TESTS = ['running-in-container', 'lxc-is-container']
 
 class ProcessExecutionError(IOError):
 
-    MESSAGE_TMPL = ('%(description)s\nCommand: %(cmd)s\n'
-                    'Exit code: %(exit_code)s\nStdout: %(stdout)r\n'
+    MESSAGE_TMPL = ('%(description)s\n'
+                    'Command: %(cmd)s\n'
+                    'Exit code: %(exit_code)s\n'
+                    'Reason: %(reason)s\n'
+                    'Stdout: %(stdout)r\n'
                     'Stderr: %(stderr)r')
 
     def __init__(self, stdout=None, stderr=None,
@@ -100,31 +107,37 @@ class ProcessExecutionError(IOError):
         else:
             self.stdout = stdout
 
+        if reason:
+            self.reason = reason
+        else:
+            self.reason = '-'
+
         message = self.MESSAGE_TMPL % {
             'description': self.description,
             'cmd': self.cmd,
             'exit_code': self.exit_code,
             'stdout': self.stdout,
             'stderr': self.stderr,
+            'reason': self.reason,
         }
         IOError.__init__(self, message)
-        self.reason = reason
 
 
 class SeLinuxGuard(object):
     def __init__(self, path, recursive=False):
         self.path = path
         self.recursive = recursive
-        self.engaged = False
+        self.enabled = False
         if HAVE_LIBSELINUX and selinux.is_selinux_enabled():
-            self.engaged = True
+            self.enabled = True
 
     def __enter__(self):
-        return self.engaged
+        # TODO: Should we try to engage selinux here??
+        return None
 
     def __exit__(self, excp_type, excp_value, excp_traceback):
-        if self.engaged:
-            LOG.debug("Disengaging selinux mode for %s: %s",
+        if self.enabled:
+            LOG.debug("Restoring selinux mode for %s (recursive=%s)",
                       self.path, self.recursive)
             selinux.restorecon(self.path, recursive=self.recursive)
 
@@ -133,16 +146,74 @@ class MountFailedError(Exception):
     pass
 
 
-def translate_bool(val):
-    if not val:
-        return False
-    if val is isinstance(val, bool):
-        return val
-    if str(val).lower().strip() in ['true', '1', 'on', 'yes']:
+def SilentTemporaryFile(**kwargs):
+    fh = tempfile.NamedTemporaryFile(**kwargs)
+    # Replace its unlink with a quiet version
+    # that does not raise errors when the
+    # file to unlink has been unlinked elsewhere..
+    LOG.debug("Created temporary file %s", fh.name)
+    fh.unlink = del_file
+    # Add a new method that will unlink 
+    # right 'now' but still lets the exit
+    # method attempt to remove it (which will
+    # not throw due to our del file being quiet
+    # about files that are not there)
+    def unlink_now():
+        fh.unlink(fh.name)
+    setattr(fh, 'unlink_now', unlink_now)
+    return fh
+
+
+def fork_cb(child_cb, *args):
+    fid = os.fork()
+    if fid == 0:
+        try:
+            child_cb(*args)
+            os._exit(0)  # pylint: disable=W0212
+        except:
+            logexc(LOG, "Failed forking and calling callback %s", obj_name(child_cb))
+            os._exit(1)  # pylint: disable=W0212
+    else:
+        LOG.debug("Forked child %s who will run callback %s",
+                  fid, obj_name(child_cb))
+
+
+def is_true_str(val, addons=None):
+    check_set = ['true', '1', 'on', 'yes']
+    if addons:
+        check_set = check_set + addons
+    if str(val).lower().strip() in check_set:
         return True
     return False
 
 
+def is_false_str(val, addons=None):
+    check_set = ['off', '0', 'no', 'false']
+    if addons:
+        check_set = check_set + addons
+    if str(val).lower().strip() in check_set:
+        return True
+    return False
+
+
+def translate_bool(val, addons=None):
+    if not val:
+        # This handles empty lists and false and 
+        # other things that python believes are false
+        return False
+    # If its already a boolean skip
+    if isinstance(val, (bool)):
+        return val
+    return is_true_str(val, addons)
+
+
+def rand_str(strlen=32, select_from=None):
+    if not select_from:
+        select_from = string.letters + string.digits
+    return "".join([random.choice(select_from) for _x in range(0, strlen)])
+
+
+
 def read_conf(fname):
     try:
         return load_yaml(load_file(fname), default={})
@@ -221,7 +292,10 @@ def get_cfg_option_bool(yobj, key, default=False):
 def get_cfg_option_str(yobj, key, default=None):
     if key not in yobj:
         return default
-    return yobj[key]
+    val = yobj[key]
+    if not isinstance(val, (str, basestring)):
+        val = str(val)
+    return val
 
 
 def system_info():
@@ -233,7 +307,7 @@ def system_info():
     }
 
 
-def get_cfg_option_list_or_str(yobj, key, default=None):
+def get_cfg_option_list(yobj, key, default=None):
     """
     Gets the C{key} config option from C{yobj} as a list of strings. If the
     key is present as a single string it will be returned as a list with one
@@ -249,9 +323,14 @@ def get_cfg_option_list_or_str(yobj, key, default=None):
         return default
     if yobj[key] is None:
         return []
-    if isinstance(yobj[key], (list)):
-        return yobj[key]
-    return [yobj[key]]
+    val = yobj[key]
+    if isinstance(val, (list)):
+        # Should we ensure they are all strings??
+        cval = [str(v) for v in val]
+        return cval
+    if not isinstance(val, (str, basestring)):
+        val = str(val)
+    return [val]
 
 
 # get a cfg entry by its path array
@@ -419,21 +498,21 @@ def runparts(dirp, skip_no_exist=True):
     if skip_no_exist and not os.path.isdir(dirp):
         return
 
-    failed = 0
-    attempted = 0
+    failed = []
+    attempted = []
     for exe_name in sorted(os.listdir(dirp)):
         exe_path = os.path.join(dirp, exe_name)
         if os.path.isfile(exe_path) and os.access(exe_path, os.X_OK):
-            attempted += 1
+            attempted.append(exe_path)
             try:
                 subp([exe_path])
             except ProcessExecutionError as e:
                 logexc(LOG, "Failed running %s [%s]", exe_path, e.exit_code)
-                failed += 1
+                failed.append(e)
 
     if failed and attempted:
         raise RuntimeError('Runparts: %s failures in %s attempted commands'
-                           % (failed, attempted))
+                           % (len(failed), len(attempted)))
 
 
 # read_optional_seed
@@ -470,7 +549,7 @@ def load_yaml(blob, default=None, allowed=(dict,)):
         converted = yaml.load(blob)
         if not isinstance(converted, allowed):
             # Yes this will just be caught, but thats ok for now...
-            raise TypeError("Yaml load allows %s types, but got %s instead" %
+            raise TypeError("Yaml load allows %s root types, but got %s instead" %
                             (allowed, obj_name(converted)))
         loaded = converted
     except (yaml.YAMLError, TypeError, ValueError) as exc:
@@ -718,7 +797,8 @@ def close_stdin():
         os.dup2(fp.fileno(), sys.stdin.fileno())
 
 
-def find_devs_with(criteria=None):
+def find_devs_with(criteria=None, oformat='device', 
+                    tag=None, no_cache=False, path=None):
     """
     find devices matching given criteria (via blkid)
     criteria can be *one* of:
@@ -726,38 +806,58 @@ def find_devs_with(criteria=None):
       LABEL=<label>
       UUID=<uuid>
     """
-    try:
-        blk_id_cmd = ['blkid']
-        if criteria:
-            # Search for block devices with tokens named NAME that 
-            # have the value 'value' and display any devices which are found.
-            # Common values for NAME include  TYPE, LABEL, and UUID.
-            # If there are no devices specified on the command line,
-            # all block devices will be searched; otherwise, 
-            # only search the devices specified by the user.
-            blk_id_cmd.append("-t%s" % (criteria))
-        # Only print the device name
-        blk_id_cmd.append('-odevice')
-        (out, _err) = subp(blk_id_cmd)
+    blk_id_cmd = ['blkid']
+    options = []
+    if criteria:
+        # Search for block devices with tokens named NAME that 
+        # have the value 'value' and display any devices which are found.
+        # Common values for NAME include  TYPE, LABEL, and UUID.
+        # If there are no devices specified on the command line,
+        # all block devices will be searched; otherwise, 
+        # only search the devices specified by the user.
+        options.append("-t%s" % (criteria))
+    if tag:
+        # For each (specified) device, show only the tags that match tag.
+        options.append("-s%s" % (tag))
+    if no_cache:
+        # If you want to start with a clean cache 
+        # (i.e. don't report devices previously scanned 
+        # but not necessarily available at this time), specify /dev/null.
+        options.extend(["-c", "/dev/null"])
+    if oformat:
+        # Display blkid's output using the specified format. 
+        # The format parameter may be:
+        # full, value, list, device, udev, export
+        options.append('-o%s' % (oformat))
+    if path:
+        options.append(path)
+    cmd = blk_id_cmd + options
+    (out, _err) = subp(cmd)
+    if path:
+        return out.strip()
+    else:
         entries = []
         for line in out.splitlines():
             line = line.strip()
             if line:
                 entries.append(line)
         return entries
-    except ProcessExecutionError:
-        return []
 
 
-def load_file(fname, read_cb=None):
-    LOG.debug("Reading from %s", fname)
-    with open(fname, 'rb') as ifh:
-        ofh = StringIO()
-        pipe_in_out(ifh, ofh, chunk_cb=read_cb)
-        ofh.flush()
-        contents = ofh.getvalue()
-        LOG.debug("Read %s bytes from %s", len(contents), fname)
-        return contents
+def load_file(fname, read_cb=None, quiet=False):
+    LOG.debug("Reading from %s (quiet=%s)", fname, quiet)
+    ofh = StringIO()
+    try:
+        with open(fname, 'rb') as ifh:
+            pipe_in_out(ifh, ofh, chunk_cb=read_cb)
+    except IOError as e:
+        if not quiet:
+            raise
+        if e.errno != errno.ENOENT:
+            raise
+    contents = ofh.getvalue()
+    LOG.debug("Read %s bytes from %s", len(contents), fname)
+    return contents
 
 
 def get_cmdline():
@@ -872,7 +972,7 @@ def get_output_cfg(cfg, mode="init"):
     return ret
 
 
-def logexc(log, msg='', *args):
+def logexc(log, msg, *args):
     # Setting this here allows this to change
     # levels easily (not always error level)
     # or even desirable to have that much junk
@@ -883,16 +983,46 @@ def logexc(log, msg='', *args):
     log.debug(msg, exc_info=1, *args)
 
 
+def hash_blob(blob, routine, mlen=None):
+    hasher = hashlib.new(routine)
+    hasher.update(blob)
+    digest = hasher.hexdigest()
+    # Don't get to long now
+    if mlen is not None:
+        return digest[0:mlen]
+    else:
+        return digest
+
+
+def rename(src, dest):
+    LOG.debug("Renaming %s to %s", src, dest)
+    # TODO use a se guard here??
+    os.rename(src, dest)
+
+
 def ensure_dirs(dirlist, mode=0755):
     for d in dirlist:
         ensure_dir(d, mode)
 
 
+def yaml_dumps(obj):
+    formatted = yaml.dump(obj,
+                    line_break="\n",
+                    indent=4,
+                    explicit_start=True,
+                    explicit_end=True,
+                    default_flow_style=False,
+                    )
+    return formatted
+
+
 def ensure_dir(path, mode=None):
     if not os.path.isdir(path):
         # Make the dir and adjust the mode
         LOG.debug("Ensuring directory exists at path %s", path)
-        os.makedirs(path)
+        # TODO: check if guard needed??
+        with SeLinuxGuard(path=os.path.dirname(path)):
+            os.makedirs(path)
         chmod(path, mode)
     else:
         # Just adjust the mode
@@ -996,6 +1126,32 @@ def del_file(path):
             raise e
 
 
+def copy(src, dest):
+    LOG.debug("Copying %s to %s", src, dest)
+    shutil.copy(src, dest)
+
+
+def time_rfc2822():
+    try:
+        ts = time.strftime("%a, %d %b %Y %H:%M:%S %z", time.gmtime())
+    except:
+        ts = "??"
+    return ts
+
+
+def uptime():
+    try:
+        uptimef = load_file("/proc/uptime").strip()
+        if not uptimef:
+            uptime = 'na'
+        else:
+            uptime = uptimef.split()[0]
+    except:
+        logexc(LOG, "Unable to read uptime from /proc/uptime")
+        uptime = '??'
+    return uptime
+
+
 def ensure_file(path):
     write_file(path, content='', omode="ab")
 
@@ -1009,7 +1165,9 @@ def chmod(path, mode):
     if path and real_mode:
         LOG.debug("Adjusting the permissions of %s (perms=%o)",
                  path, real_mode)
-        os.chmod(path, real_mode)
+        # TODO: check if guard needed??
+        with SeLinuxGuard(path=path):
+            os.chmod(path, real_mode)
 
 
 def write_file(filename, content, mode=0644, omode="wb"):
@@ -1024,11 +1182,12 @@ def write_file(filename, content, mode=0644, omode="wb"):
     """
     ensure_dir(os.path.dirname(filename))
     LOG.debug("Writing to %s - %s, %s bytes", filename, omode, len(content))
-    with open(filename, omode) as fh:
-        with SeLinuxGuard(filename):
+    # TODO: check if guard needed??
+    with SeLinuxGuard(path=filename):
+        with open(filename, omode) as fh:
             fh.write(content)
             fh.flush()
-            chmod(filename, mode)
+    chmod(filename, mode)
 
 
 def delete_dir_contents(dirname):
@@ -1057,9 +1216,6 @@ def subp(args, data=None, rcs=None, env=None, capture=True, shell=False):
         else:
             stdout = subprocess.PIPE
             stderr = subprocess.PIPE
-        # Always pipe stdin (for now)
-        # harlowja: I don't see why anyone would want to pipe stdin
-        # since cloud-init shuts it down (via the method close stdin)
         stdin = subprocess.PIPE
         sp = subprocess.Popen(args, stdout=stdout,
                         stderr=stderr, stdin=stdin,
@@ -1099,10 +1255,14 @@ def shellify(cmdlist, add_header=True):
         if isinstance(args, list):
             fixed = []
             for f in args:
-                fixed.append("'%s'" % str(f).replace("'", escaped))
+                fixed.append("'%s'" % (str(f).replace("'", escaped)))
             content = "%s%s\n" % (content, ' '.join(fixed))
+        elif isinstance(args, (str, basestring)):
+            content = "%s%s\n" % (content, args)
         else:
-            content = "%s%s\n" % (content, str(args))
+            raise RuntimeError(("Unable to shellify type %s"
+                                " which is not a list or string") % (obj_name(args)))
+    LOG.debug("Shellified %s to %s", cmdlist, content)
     return content
 
 

From b9af5cde303c003ae88355a06c8581e0efc99de7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 18:29:49 -0700
Subject: [PATCH 113/434] Update comment about distro handling its timezone

---
 cloudinit/transforms/cc_timezone.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/transforms/cc_timezone.py b/cloudinit/transforms/cc_timezone.py
index 6fb5edc0..02cbf2dc 100644
--- a/cloudinit/transforms/cc_timezone.py
+++ b/cloudinit/transforms/cc_timezone.py
@@ -32,5 +32,6 @@ def handle(_name, cfg, cloud, log, args):
     if not timezone:
         log.debug("Skipping module named %s, no 'timezone' specified", name)
         return
-
+    
+    # Let the distro handle settings its timezone
     cloud.distro.set_timezone(timezone)

From 4aa05f644714303f60fad396d78be66d332b8cb8 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 18:31:52 -0700
Subject: [PATCH 114/434] Cleanup and renaming that should mostly complete this
 new module.

1. Renamed config to modules, then renamed to transforms
2. Enabled checking of transform frequencies before usage (warning the user that something is bad)
3. Adjusting how the cloud object is formed to comply with its new api.
---
 cloudinit/stages.py | 209 ++++++++++++++++++++++++++------------------
 1 file changed, 126 insertions(+), 83 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 2cb9d0ec..2615d59f 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -31,12 +31,12 @@ try:
 except ImportError:
     ConfigObj = None
 
-from cloudinit.settings import (PER_INSTANCE)
+from cloudinit.settings import (PER_INSTANCE, FREQUENCIES)
 from cloudinit.settings import (OLD_CLOUD_CONFIG)
 
 from cloudinit import cloud
 from cloudinit import distros
-from cloudinit import handlers
+from cloudinit import modules
 from cloudinit import helpers
 from cloudinit import importer
 from cloudinit import log as logging
@@ -50,15 +50,16 @@ LOG = logging.getLogger(__name__)
 
 class Init(object):
     def __init__(self, ds_deps=None):
-        self.datasource = None
         if ds_deps:
             self.ds_deps = ds_deps
         else:
             self.ds_deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
         # Created on first use
-        self.cached_cfg = None
-        self.cached_distro = None
-        self.cached_paths = None
+        self._cfg = None
+        self._paths = None
+        self._distro = None
+        # Created only when a fetch occurs
+        self.datasource = None
 
     def _read_cfg_old(self):
         # Support reading the old ConfigObj format file and merging
@@ -68,23 +69,40 @@ class Init(object):
         old_cfg = ConfigObj(OLD_CLOUD_CONFIG)
         return dict(old_cfg)
 
+    @property
+    def distro(self):
+        if not self._distro:
+            d_cfg = util.get_cfg_by_path(self.cfg, ('system_info'), {})
+            # Ensure not modified indirectly
+            d_cfg = copy.deepcopy(d_cfg)
+            d_cfg.pop('paths', None)
+            distro_cls = distros.fetch(sys_cfg.pop('distro', 'ubuntu'))
+            LOG.debug("Using distro class %s", distro_cls)
+            distro = distro_cls(d_cfg, helpers.Runners(self.paths))
+            self._distro = distro
+        return self._distro
+
     @property
     def cfg(self):
-        if self.cached_cfg is None:
-            self.cached_cfg = self._read_cfg()
-        return self.cached_cfg
+        # None check so that we don't keep on re-loading if empty
+        if self._cfg is None:
+            self._cfg = self._read_cfg()
+            LOG.debug("Loading init config %s", self._cfg)
+        return self._cfg
 
     @property
     def paths(self):
-        if not self.cached_paths:
-            sys_info = self.cfg.get('system_info', {})
-            self.cached_paths = helpers.Paths(copy.deepcopy(sys_info),
-                                          self.datasource)
-        return self.cached_paths
+        if not self._paths:
+            path_info = util.get_cfg_by_path(self.cfg, ('system_info', 'paths'), {})
+            # Ensure not modified indirectly
+            path_info = copy.deepcopy(path_info)
+            self._paths = helpers.Paths(path_info, self.datasource)
+        return self._paths
 
     def _initial_subdirs(self):
         c_dir = self.paths.cloud_dir
         initial_dirs = [
+            c_dir,
             os.path.join(c_dir, 'scripts'),
             os.path.join(c_dir, 'scripts', 'per-instance'),
             os.path.join(c_dir, 'scripts', 'per-once'),
@@ -139,8 +157,8 @@ class Init(object):
             # the file wont exist
             return pickle.loads(util.load_file(pickled_fn))
         except Exception as e:
-            LOG.exception(("Failed loading pickled datasource from"
-                           " %s due to: %s"), pickled_fn, e)
+            util.logexc(LOG, "Failed loading pickled datasource from %s",
+                        pickled_fn)
             return None
 
     def _write_to_cache(self):
@@ -149,8 +167,7 @@ class Init(object):
             contents = pickle.dumps(self.datasource)
             util.write_file(pickled_fn, contents, mode=0400)
         except Exception as e:
-            LOG.exception(("Failed pickling datasource to"
-                          " %s due to: %s"), pickled_fn, e)
+            util.logexc(LOG, "Failed pickling datasource to %s", pickled_fn)
             return False
 
     def _get_datasources(self):
@@ -171,19 +188,17 @@ class Init(object):
             LOG.debug("Restored from cache datasource: %s" % ds)
         else:
             (cfg_list, pkg_list) = self._get_datasources()
-            # Deep copy so that handlers can not modify (which will
-            # affect handlers down the line...)
+            # Deep copy so that user-data handlers can not modify
+            # (which will affect user-data handlers down the line...)
             sys_cfg = copy.deepcopy(self.cfg)
             ds_deps = copy.deepcopy(self.ds_deps)
-            distro = distros.fetch(sys_cfg,
-                                   cloud.Cloud(self.datasource,
-                                               self.paths, sys_cfg))
-            (ds, dsname) = sources.find_source(sys_cfg, distro, self.paths,
+            (ds, dsname) = sources.find_source(sys_cfg, self.distro, self.paths,
                                                ds_deps, cfg_list, pkg_list)
             LOG.debug("Loaded datasource %s - %s", dsname, ds)
         self.datasource = ds
-        if self.cached_paths:
-            self.cached_paths.datasource = ds
+        # Ensure we adjust our path members datasource
+        # now that we have one (thus allowing ipath to be used)
+        self.paths.datasource = ds
         return ds
 
     def _reflect_cur_instance(self):
@@ -231,12 +246,19 @@ class Init(object):
             previous_iid = iid
         util.write_file(c_iid_fn, "%s\n" % iid)
         util.write_file(p_iid_fn, "%s\n" % previous_iid)
+        return iid
 
     def fetch(self):
         return self._get_data_source()
 
     def instancify(self):
-        self._reflect_cur_instance()
+        return self._reflect_cur_instance()
+
+    def cloudify(self):
+        # Form the needed options to cloudify our members
+        return cloud.Cloud(self.datasource, 
+                           self.paths, self.cfg,
+                           self.distro, helpers.Runners(self.paths))
 
     def update(self):
         self._write_to_cache()
@@ -266,24 +288,24 @@ class Init(object):
             try:
                 mod = ud.fixup_module(importer.import_module(modname))
                 types = c_handlers.register(mod)
-                LOG.debug("Added handler for [%s] from %s", types, fname)
+                LOG.debug("Added handler for %s from %s", types, fname)
             except:
-                LOG.exception("Failed to register handler from %s", fname)
+                util.logexc(LOG, "Failed to register handler from %s", fname)
 
         def_handlers = c_handlers.register_defaults()
         if def_handlers:
-            LOG.debug("Registered default handlers for [%s]", def_handlers)
+            LOG.debug("Registered default handlers for %s", def_handlers)
 
-        # Form our cloud proxy
-        data = cloud.Cloud(self.datasource,
-                           self.paths, copy.deepcopy(self.cfg))
 
-        # Ensure userdata fetched before activation
-        ud_obj = data.get_userdata()
+        # Ensure userdata fetched before activation (just incase)
+        ud_obj = self.datasource.get_userdata()
+
+        # Form our cloud interface
+        data = self.cloudify()
 
         # Init the handlers first
         called = []
-        for (_mtype, mod) in c_handlers.iteritems():
+        for (_ctype, mod) in c_handlers.iteritems():
             if mod in called:
                 continue
             ud.call_begin(mod, data, frequency)
@@ -304,26 +326,28 @@ class Init(object):
 
         # Give callbacks opportunity to finalize
         called = []
-        for (_mtype, mod) in c_handlers.iteritems():
+        for (_ctype, mod) in c_handlers.iteritems():
             if mod in called:
                 continue
             ud.call_end(mod, data, frequency)
             called.append(mod)
 
 
-class Handlers(object):
-    def __init__(self, datasource, h_cloud, cfgfile=None, basecfg=None):
-        self.datasource = datasource
+class Transforms(object):
+    def __init__(self, cloudobj, cfgfile=None):
+        self.datasource = cloudobj.datasource
         self.cfgfile = cfgfile
-        self.basecfg = basecfg
-        self.h_cloud = h_cloud
-        self.cachedcfg = None
+        self.basecfg = copy.deepcopy(cloudobj.cfg)
+        self.cloudobj = cloudobj
+        # Created on first use
+        self._cachedcfg = None
 
     @property
     def cfg(self):
-        if self.cachedcfg is None:
-            self.cachedcfg = self._get_config(self.cfgfile)
-        return self.cachedcfg
+        if self._cachedcfg is None:
+            self._cachedcfg = self._get_config(self.cfgfile)
+            LOG.debug("Loading module config %s", self._cachedcfg)
+        return self._cachedcfg
 
     def _get_config(self, cfgfile):
         mcfg = None
@@ -332,8 +356,8 @@ class Handlers(object):
             try:
                 mcfg = util.read_conf(cfgfile)
             except:
-                LOG.exception(("Failed loading of cloud config '%s'. "
-                              "Continuing with an empty config."), cfgfile)
+                util.logexc(LOG, ("Failed loading of cloud config '%s'. "
+                                  "Continuing with an empty config."), cfgfile)
         if not mcfg:
             mcfg = {}
 
@@ -341,7 +365,7 @@ class Handlers(object):
         try:
             ds_cfg = self.datasource.get_config_obj()
         except:
-            LOG.exception("Failed loading of datasource config.")
+            util.logexc(LOG, "Failed loading of datasource config object.")
         if not ds_cfg:
             ds_cfg = {}
 
@@ -352,64 +376,83 @@ class Handlers(object):
             return mcfg
 
 
-    def _read_modules(self, name):
+    def _read_transforms(self, name):
         module_list = []
         if name not in self.cfg:
             return module_list
         cfg_mods = self.cfg[name]
-        # Create 'module_list', an array of arrays
-        # Where array[0] = module name
-        #       array[1] = frequency
-        #       array[2:] = arguments
+        # Create 'module_list', an array of hashes
+        # Where hash['mod'] = module name
+        #       hash['freq'] = frequency
+        #       hash['args'] = arguments
         for item in cfg_mods:
             if not item:
                 continue
-            if isinstance(item, str):
-                module_list.append([item])
-            elif isinstance(item, list):
-                module_list.append(item)
+            if isinstance(item, (str, basestring)):
+                module_list.append({
+                    'mod': item.strip(),
+                })
+            elif isinstance(item, (list)):
+                contents = {}
+                # Meant to fall through...
+                if len(item) >= 1:
+                    contents['mod'] = item[0].strip()
+                if len(item) >= 2:
+                    contents['freq'] = item[1].strip()
+                if len(item) >= 3:
+                    contents['args'] = item[2:]
+                if contents:
+                    module_list.append(contents)
             else:
-                raise TypeError("Failed to read '%s' item in config")
+                raise TypeError(("Failed to read '%s' item in config,"
+                                 " unknown type %s") %
+                                 (item, util.obj_name(item)))
         return module_list
 
-    def _form_modules(self, raw_mods):
+    def _transforms_modules(self, raw_mods):
         mostly_mods = []
         for raw_mod in raw_mods:
-            raw_name = raw_mod[0]
-            freq = None
-            run_args = None
-            if len(raw_mod) > 1:
-                freq = raw_mod[1]
-            if len(raw_mod) > 2:
-                run_args = raw_mod[2:]
-            if not run_args:
-                run_args = []
-            mod_name = handlers.form_module_name(raw_name)
+            raw_name = raw_mod['mod']
+            freq = raw_mod.get('freq')
+            run_args = raw_mod.get('args') or []
+            mod_name = modules.form_module_name(raw_name)
             if not mod_name:
                 continue
-            mod = handlers.fixup_module(importer.import_module(mod_name))
+            if freq and freq not in FREQUENCIES:
+                LOG.warn("Config specified module %s has an unknown frequency %s", raw_name, freq)
+                # Reset it so when ran it will get set to a known value
+                freq = None
+            mod = modules.fixup_module(importer.import_module(mod_name))
             mostly_mods.append([mod, raw_name, freq, run_args])
         return mostly_mods
 
-    def _run_modules(self, mostly_mods):
+    def _run_transforms(self, mostly_mods):
         failures = []
         for (mod, name, freq, args) in mostly_mods:
             try:
+                # Try the modules frequency, otherwise fallback to a known one
                 if not freq:
                     freq = mod.frequency
-                if not freq:
+                if not freq in FREQUENCIES:
                     freq = PER_INSTANCE
+                worked_distros = mod.distros
+                if worked_distros and self.cloud.distro.name() not in worked_distros:
+                    LOG.warn(("Module %s is verified on %s distros"
+                              " but not on %s distro. It may or may not work"
+                              " correctly."), name, worked_distros,
+                              self.cloud.distro.name())
+                # Deep copy the config so that modules can't alter it
                 func_args = [name, copy.deepcopy(self.cfg),
-                             self.h_cloud, LOG,
-                             args]
-                run_name = "config-" + name        
-                self.h_cloud.run(run_name, mod.handle, func_args, freq=freq)
-            except:
-                LOG.exception("Running %s failed", mod)
-                failures.append(name)
+                             self.cloudobj, LOG, args]
+                # This name will affect the semphapore name created
+                run_name = "config-%s" % (name)
+                self.cloudobj.run(run_name, mod.handle, func_args, freq=freq)
+            except Exception as e:
+                util.logexc(LOG, "Running %s failed", mod)
+                failures.append((name, e))
         return failures
 
     def run(self, name):
-        raw_mods = self._read_modules(name)
-        mostly_mods = self._form_modules(raw_mods)
-        return self._run_modules(mostly_mods)
+        raw_mods = self._read_transforms(name)
+        mostly_mods = self._transforms_modules(raw_mods)
+        return self._run_transforms(mostly_mods)

From 6b2dd9a9c743dc3da06644f09dad78946a4eea0c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 18:37:05 -0700
Subject: [PATCH 115/434] Variable name mismatch

---
 cloudinit/distros/ubuntu.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index b8aff03c..e68f3064 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -53,8 +53,7 @@ class Distro(distros.Distro):
         util.subp(['hostname', hostname])
 
     def update_hostname(self, hostname, prev_file):
-        hostname_prev = None 
-        prev_name = self._read_hostname(prev_file)
+        hostname_prev = self._read_hostname(prev_file)
         hostname_in_etc = self._read_hostname("/etc/hostname")
         update_files = []
         if not hostname_prev or hostname_prev != hostname:

From 303f07ba43d8c78f4914ea47e9a6272428132f64 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 18:38:10 -0700
Subject: [PATCH 116/434] Self variable missing

---
 cloudinit/distros/ubuntu.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index e68f3064..6b0aff47 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -73,7 +73,7 @@ class Distro(distros.Distro):
             LOG.debug("Setting hostname to %s", hostname)
             util.subp(['hostname', hostname])
 
-    def _read_hostname(filename, default=None):
+    def _read_hostname(self, filename, default=None):
         contents = util.load_file(filename, quiet=True)
         for line in contents.splitlines():
             hpos = line.find("#")

From 830131b1fdf3b0db2e0e157dd6a47e8895a27486 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 19:03:28 -0700
Subject: [PATCH 117/434] Ensure that this directory is treated as a module.

---
 cloudinit/handlers/__init__.py | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100644 cloudinit/handlers/__init__.py

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
new file mode 100644
index 00000000..09163abb
--- /dev/null
+++ b/cloudinit/handlers/__init__.py
@@ -0,0 +1,22 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+

From 29e0ccd4ed0f5f2ba7c118edb3b24b428699f190 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 15 Jun 2012 21:33:55 -0700
Subject: [PATCH 118/434] Fixups to ensure that pylint does not find anything
 major wrong.

---
 cloudinit/cloud.py                            |  2 -
 cloudinit/distros/__init__.py                 | 21 ++--
 cloudinit/distros/ubuntu.py                   | 23 ++---
 cloudinit/handlers/boot_hook.py               | 14 +--
 cloudinit/handlers/cloud_config.py            |  4 +-
 cloudinit/handlers/shell_script.py            |  5 +-
 cloudinit/handlers/upstart_job.py             |  7 +-
 cloudinit/helpers.py                          | 41 ++------
 cloudinit/log.py                              |  2 +-
 cloudinit/sources/DataSourceCloudStack.py     |  2 +-
 cloudinit/sources/DataSourceConfigDrive.py    |  4 +-
 cloudinit/sources/DataSourceMAAS.py           | 14 +--
 cloudinit/sources/DataSourceNoCloud.py        |  3 +-
 cloudinit/sources/DataSourceOVF.py            | 12 ++-
 cloudinit/sources/__init__.py                 | 23 ++---
 cloudinit/stages.py                           | 98 ++++++++++++-------
 cloudinit/transforms/__init__.py              |  2 +-
 cloudinit/transforms/cc_apt_update_upgrade.py | 12 ++-
 cloudinit/transforms/cc_bootcmd.py            |  8 +-
 cloudinit/transforms/cc_byobu.py              |  2 +-
 cloudinit/transforms/cc_ca_certs.py           | 13 ++-
 cloudinit/transforms/cc_chef.py               |  3 +-
 .../transforms/cc_disable_ec2_metadata.py     |  3 +-
 cloudinit/transforms/cc_final_message.py      |  4 +-
 cloudinit/transforms/cc_foo.py                |  6 +-
 cloudinit/transforms/cc_grub_dpkg.py          |  4 +-
 cloudinit/transforms/cc_keys_to_console.py    | 23 +++--
 cloudinit/transforms/cc_landscape.py          |  3 +-
 cloudinit/transforms/cc_locale.py             |  2 +-
 cloudinit/transforms/cc_mcollective.py        |  9 +-
 cloudinit/transforms/cc_mounts.py             | 15 +--
 cloudinit/transforms/cc_phone_home.py         | 36 ++++---
 cloudinit/transforms/cc_puppet.py             | 17 ++--
 cloudinit/transforms/cc_resizefs.py           | 38 ++++---
 .../transforms/cc_rightscale_userdata.py      | 16 +--
 cloudinit/transforms/cc_rsyslog.py            | 14 +--
 cloudinit/transforms/cc_runcmd.py             |  9 +-
 cloudinit/transforms/cc_salt_minion.py        |  7 +-
 cloudinit/transforms/cc_scripts_per_boot.py   |  5 +-
 .../transforms/cc_scripts_per_instance.py     |  5 +-
 cloudinit/transforms/cc_scripts_per_once.py   |  5 +-
 cloudinit/transforms/cc_scripts_user.py       |  9 +-
 cloudinit/transforms/cc_set_hostname.py       |  2 +-
 cloudinit/transforms/cc_set_passwords.py      | 10 +-
 cloudinit/transforms/cc_ssh.py                | 22 +++--
 cloudinit/transforms/cc_ssh_import_id.py      |  8 +-
 cloudinit/transforms/cc_timezone.py           |  8 +-
 cloudinit/transforms/cc_update_etc_hosts.py   | 22 +++--
 cloudinit/transforms/cc_update_hostname.py    |  4 +-
 cloudinit/transforms/cc_welcome.py            |  6 +-
 cloudinit/user_data.py                        | 13 +--
 cloudinit/util.py                             | 48 +++++----
 52 files changed, 388 insertions(+), 300 deletions(-)

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index b2dfc749..8372d123 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -23,8 +23,6 @@
 import copy
 import os
 
-from cloudinit import distros
-from cloudinit import helpers
 from cloudinit import log as logging
 
 LOG = logging.getLogger(__name__)
diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index 90607668..fd4c70c1 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -20,29 +20,32 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+from StringIO import StringIO
+
 import abc
 import copy
 
 from cloudinit import importer
+from cloudinit import log as logging
 from cloudinit import util
 
-from StringIO import StringIO
-
 # TODO: Make this via config??
 IFACE_ACTIONS = {
     'up': ['ifup', '--all'],
     'down': ['ifdown', '--all'],
 }
 
+LOG = logging.getLogger(__name__)
+
 
 class Distro(object):
 
     __metaclass__ = abc.ABCMeta
 
-    def __init__(self, cfg, runner):
+    def __init__(self, name, cfg, runner):
         self._runner = runner
-        self._cfg = util.get_cfg_by_path(cfg, ('system_info', ), {})
-        self.name = self._cfg.pop("distro", 'generic')
+        self._cfg = cfg
+        self.name = name
 
     @abc.abstractmethod
     def install_packages(self, pkglist):
@@ -135,10 +138,9 @@ class Distro(object):
                      action, cmd)
             (_out, err) = util.subp(cmd)
             if len(err):
-                LOG.warn("Running %s resulted in stderr output: %s",
-                         IF_UP_CMD, err)
+                LOG.warn("Running %s resulted in stderr output: %s", cmd, err)
             return True
-        except util.ProcessExecutionError as exc:
+        except util.ProcessExecutionError:
             util.logexc(LOG, "Running %s failed", cmd)
             return False
 
@@ -152,7 +154,8 @@ def fetch(distro_name, mods=(__name__, )):
         except RuntimeError:
             pass
     if not mod:
-        raise RuntimeError("No distribution found for distro %s" % (distro_name))
+        raise RuntimeError("No distribution found for distro %s"
+                           % (distro_name))
     distro_cls = getattr(mod, 'Distro')
     return distro_cls
     
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index 6b0aff47..9252a1c4 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -20,17 +20,13 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-from StringIO import StringIO
-
 import os
-import socket
 
 from cloudinit import distros
 from cloudinit import log as logging
-from cloudinit import templater
 from cloudinit import util
 
-from cloudinit.settings import (PER_INSTANCE)
+from cloudinit.settings import PER_INSTANCE
 
 LOG = logging.getLogger(__name__)
 
@@ -65,9 +61,11 @@ class Distro(distros.Distro):
             try:
                 util.write_file(fn, "%s\n" % hostname, 0644)
             except:
-                util.logexc(LOG, "Failed to write hostname %s to %s", hostname, fn)
-        if hostname_in_etc and hostname_prev and hostname_in_etc != hostname_prev:
-             LOG.debug(("%s differs from /etc/hostname."
+                util.logexc(LOG, "Failed to write hostname %s to %s",
+                            hostname, fn)
+        if (hostname_in_etc and hostname_prev and
+            hostname_in_etc != hostname_prev):
+            LOG.debug(("%s differs from /etc/hostname."
                         " Assuming user maintained hostname."), prev_file)
         if "/etc/hostname" in update_files:
             LOG.debug("Setting hostname to %s", hostname)
@@ -91,7 +89,8 @@ class Distro(distros.Distro):
     def set_timezone(self, tz):
         tz_file = os.path.join("/usr/share/zoneinfo", tz)
         if not os.path.isfile(tz_file):
-            raise Exception("Invalid timezone %s, no file found at %s" % (tz, tz_file))
+            raise Exception(("Invalid timezone %s,"
+                             " no file found at %s") % (tz, tz_file))
         tz_contents = "%s\n" % tz
         util.write_file("/etc/timezone", tz_contents)
         # TODO, this should be in a rhel distro subclass??
@@ -101,9 +100,6 @@ class Distro(distros.Distro):
         # This ensures that the correct tz will be used for the system
         util.copy(tz_file, "/etc/localtime")
 
-    def name(self):
-        return "ubuntu"
-
     # apt_get top level command (install, update...), and args to pass it
     def _apt_get(self, tlc, args=None):
         e = os.environ.copy()
@@ -116,4 +112,5 @@ class Distro(distros.Distro):
         util.subp(cmd, env=e, capture=False)
 
     def _update_package_sources(self):
-        self.runner.run("update-sources", self._apt_get, ["update"], freq=PER_INSTANCE)
\ No newline at end of file
+        self._runner.run("update-sources", self._apt_get,
+                         ["update"], freq=PER_INSTANCE)
\ No newline at end of file
diff --git a/cloudinit/handlers/boot_hook.py b/cloudinit/handlers/boot_hook.py
index c75aeb72..b3aab366 100644
--- a/cloudinit/handlers/boot_hook.py
+++ b/cloudinit/handlers/boot_hook.py
@@ -32,9 +32,9 @@ LOG = logging.getLogger(__name__)
 
 
 class BootHookPartHandler(ud.PartHandler):
-    def __init__(self, boothook_dir, instance_id):
+    def __init__(self, paths, instance_id, **_kwargs):
         ud.PartHandler.__init__(self, PER_ALWAYS)
-        self.boothook_dir = boothook_dir
+        self.boothook_dir = paths.get_ipath("boothooks")
         self.instance_id = instance_id
 
     def list_types(self):
@@ -54,13 +54,15 @@ class BootHookPartHandler(ud.PartHandler):
             start = len(prefix) + 1
 
         filepath = os.path.join(self.boothook_dir, filename)
-        util.write_file(filepath, payload[start:], 0700)
+        contents = payload[start:]
+        util.write_file(filepath, contents, 0700)
         try:
             env = os.environ.copy()
-            env['INSTANCE_ID'] = str(self.instance_id)
+            if self.instance_id:
+                env['INSTANCE_ID'] = str(self.instance_id)
             util.subp([filepath], env=env)
-        except util.ProcessExecutionError as e:
+        except util.ProcessExecutionError:
             util.logexc(LOG, "Boothooks script %s execution error", filepath)
-        except Exception as e:
+        except Exception:
             util.logexc(LOG, ("Boothooks unknown "
                               "error when running %s"), filepath)
diff --git a/cloudinit/handlers/cloud_config.py b/cloudinit/handlers/cloud_config.py
index f0e88eeb..12d1bd96 100644
--- a/cloudinit/handlers/cloud_config.py
+++ b/cloudinit/handlers/cloud_config.py
@@ -30,10 +30,10 @@ LOG = logging.getLogger(__name__)
 
 
 class CloudConfigPartHandler(ud.PartHandler):
-    def __init__(self, cloud_fn):
+    def __init__(self, paths, **_kwargs):
         ud.PartHandler.__init__(self, PER_ALWAYS)
         self.cloud_buf = []
-        self.cloud_fn = cloud_fn
+        self.cloud_fn = paths.get_ipath("cloud_config")
 
     def list_types(self):
         return [
diff --git a/cloudinit/handlers/shell_script.py b/cloudinit/handlers/shell_script.py
index 564e4623..f6e2ef16 100644
--- a/cloudinit/handlers/shell_script.py
+++ b/cloudinit/handlers/shell_script.py
@@ -32,10 +32,9 @@ LOG = logging.getLogger(__name__)
 
 
 class ShellScriptPartHandler(ud.PartHandler):
-
-    def __init__(self, script_dir):
+    def __init__(self, paths, **_kwargs):
         ud.PartHandler.__init__(self, PER_ALWAYS)
-        self.script_dir = script_dir
+        self.script_dir = paths.get_ipath_cur('scripts')
 
     def list_types(self):
         return [
diff --git a/cloudinit/handlers/upstart_job.py b/cloudinit/handlers/upstart_job.py
index 568a644a..059a4851 100644
--- a/cloudinit/handlers/upstart_job.py
+++ b/cloudinit/handlers/upstart_job.py
@@ -33,9 +33,9 @@ LOG = logging.getLogger(__name__)
 
 
 class UpstartJobPartHandler(ud.PartHandler):
-    def __init__(self, upstart_dir):
+    def __init__(self, paths, **_kwargs):
         ud.PartHandler.__init__(self, PER_INSTANCE)
-        self.upstart_dir = upstart_dir
+        self.upstart_dir = paths.upstart_conf_d
 
     def list_types(self):
         return [
@@ -46,6 +46,9 @@ class UpstartJobPartHandler(ud.PartHandler):
         if ctype in ud.CONTENT_SIGNALS:
             return
 
+        if not self.upstart_dir:
+            return
+
         filename = util.clean_filename(filename)
         (_name, ext) = os.path.splitext(filename)
         if not ext:
diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 2ecda3e9..c276a54c 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -30,11 +30,6 @@ from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS, PER_ONCE)
 from cloudinit import log as logging
 from cloudinit import util
 
-from cloudinit.user_data import boot_hook as bh_part
-from cloudinit.user_data import cloud_config as cc_part
-from cloudinit.user_data import shell_script as ss_part
-from cloudinit.user_data import upstart_job as up_part
-
 LOG = logging.getLogger(__name__)
 
 
@@ -77,7 +72,7 @@ class FileSemaphores(object):
         sem_file = self._get_path(name, freq)
         try:
             util.del_file(sem_file)
-        except (IOError, OSError) as e:
+        except (IOError, OSError):
             util.logexc(LOG, "Failed deleting semaphore %s", sem_file)
             return False
         return True
@@ -99,7 +94,7 @@ class FileSemaphores(object):
         contents = "%s: %s\n" % (os.getpid(), time())
         try:
             util.write_file(sem_file, contents)
-        except (IOError, OSError) as e:
+        except (IOError, OSError):
             util.logexc(LOG, "Failed writing semaphore file %s", sem_file)
             return None
         return sem_file
@@ -162,9 +157,10 @@ class Runners(object):
 
 class ContentHandlers(object):
 
-    def __init__(self, paths):
+    def __init__(self, paths, iid=None):
         self.paths = paths
         self.registered = {}
+        self.iid = iid
 
     def __contains__(self, item):
         return self.is_registered(item)
@@ -191,34 +187,9 @@ class ContentHandlers(object):
     def iteritems(self):
         return self.registered.iteritems()
 
-    def _get_default_handlers(self):
-        def_handlers = []
-
-        cc_path = self.paths.get_ipath("cloud_config")
-        if cc_path:
-            cc_h = cc_part.CloudConfigPartHandler(cc_path)
-            def_handlers.append(cc_h)
-
-        sc_path = self.paths.get_ipath_cur('scripts')
-        if sc_path:
-            ss_h = ss_part.ShellScriptPartHandler(sc_path)
-            def_handlers.append(ss_h)
-
-        bh_path = self.paths.get_ipath("boothooks")
-        if bh_path:
-            bh_h = bh_part.BootHookPartHandler(bh_path)
-            def_handlers.append(bh_h)
-
-        upstart_pth = self.paths.upstart_conf_d
-        if upstart_pth:
-            up_h = up_part.UpstartJobPartHandler(upstart_pth)
-            def_handlers.append(up_h)
-
-        return def_handlers
-
-    def register_defaults(self):
+    def register_defaults(self, defs):
         registered = set()
-        for mod in self._get_default_handlers():
+        for mod in defs:
             for t in mod.list_types():
                 if not self.is_registered(t):
                     self.registered[t] = mod
diff --git a/cloudinit/log.py b/cloudinit/log.py
index c247eb9e..5fcb77ef 100644
--- a/cloudinit/log.py
+++ b/cloudinit/log.py
@@ -56,7 +56,7 @@ def setupBasicLogging():
         cfile = logging.FileHandler('/var/log/cloud-init.log')
         cfile.setFormatter(logging.Formatter(DEF_CON_FORMAT))
         cfile.setLevel(DEBUG)
-        root.addHandle(cfile)
+        root.addHandler(cfile)
     except (IOError, OSError):
         # Likely that u can't write to that file...
         # Make console now have DEBUG??
diff --git a/cloudinit/sources/DataSourceCloudStack.py b/cloudinit/sources/DataSourceCloudStack.py
index 791df68f..27217e65 100644
--- a/cloudinit/sources/DataSourceCloudStack.py
+++ b/cloudinit/sources/DataSourceCloudStack.py
@@ -79,7 +79,7 @@ class DataSourceCloudStack(sources.DataSource):
             tot_time = (time.time() - start)
             LOG.debug("Crawl of metadata service took %s", int(tot_time))
             return True
-        except Exception as e:
+        except Exception:
             util.logexc(LOG, ('Failed fetching from metadata '
                               'service %s'), self.metadata_address)
             return False
diff --git a/cloudinit/sources/DataSourceConfigDrive.py b/cloudinit/sources/DataSourceConfigDrive.py
index 176b62b0..7450572f 100644
--- a/cloudinit/sources/DataSourceConfigDrive.py
+++ b/cloudinit/sources/DataSourceConfigDrive.py
@@ -51,8 +51,8 @@ class DataSourceConfigDrive(sources.DataSource):
         self.seed_dir = os.path.join(paths.seed_dir, 'config_drive')
 
     def __str__(self):
-        mstr = "%s[%s]" % (util.obj_name(self), self.dsmode)
-        mstr += " [seed=%s]" % (self.seed)
+        mstr = "%s [%s]" % (util.obj_name(self), self.dsmode)
+        mstr += "[seed=%s]" % (self.seed)
         return mstr
 
     def get_data(self):
diff --git a/cloudinit/sources/DataSourceMAAS.py b/cloudinit/sources/DataSourceMAAS.py
index 27196265..9e639649 100644
--- a/cloudinit/sources/DataSourceMAAS.py
+++ b/cloudinit/sources/DataSourceMAAS.py
@@ -18,9 +18,9 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import os
 import errno
 import oauth.oauth as oauth
+import os
 import time
 import urllib2
 
@@ -48,7 +48,7 @@ class DataSourceMAAS(sources.DataSource):
         self.seed_dir = os.path.join(paths.seed_dir, 'maas')
 
     def __str__(self):
-        return "%s[%s]" % (util.obj_name(self), self.base_url)
+        return "%s [%s]" % (util.obj_name(self), self.base_url)
 
     def get_data(self):
         mcfg = self.ds_cfg
@@ -122,9 +122,10 @@ class DataSourceMAAS(sources.DataSource):
 
         starttime = time.time()
         check_url = "%s/%s/meta-data/instance-id" % (url, MD_VERSION)
-        url = util.wait_for_url(urls=[check_url], max_wait=max_wait,
-                                timeout=timeout, status_cb=LOG.warn,
-                                headers_cb=self.md_headers)
+        urls = [check_url]
+        url = uhelp.wait_for_url(urls=urls, max_wait=max_wait,
+                                 timeout=timeout, status_cb=LOG.warn,
+                                 headers_cb=self.md_headers)
 
         if url:
             LOG.info("Using metadata source: '%s'", url)
@@ -185,7 +186,8 @@ def read_maas_seed_url(seed_url, header_cb=None, timeout=None,
             headers = {}
         try:
             (resp, sc) = uhelp.readurl(url, headers=headers, timeout=timeout)
-            md[name] = resp
+            if uhelp.ok_http_code(sc):
+                md[name] = resp
         except urllib2.HTTPError as e:
             if e.code != 404:
                 raise
diff --git a/cloudinit/sources/DataSourceNoCloud.py b/cloudinit/sources/DataSourceNoCloud.py
index 84d0f99d..2b016d1c 100644
--- a/cloudinit/sources/DataSourceNoCloud.py
+++ b/cloudinit/sources/DataSourceNoCloud.py
@@ -106,7 +106,8 @@ class DataSourceNoCloud(sources.DataSource):
                 if e.errno != errno.ENOENT:
                     raise
             except util.MountFailedError:
-                util.logexc(LOG, "Failed to mount %s when looking for seed", dev)
+                util.logexc(LOG, ("Failed to mount %s"
+                                  " when looking for data"), dev)
 
         # There was no indication on kernel cmdline or data
         # in the seeddir suggesting this handler should be used.
diff --git a/cloudinit/sources/DataSourceOVF.py b/cloudinit/sources/DataSourceOVF.py
index bb0f46c2..258d8d03 100644
--- a/cloudinit/sources/DataSourceOVF.py
+++ b/cloudinit/sources/DataSourceOVF.py
@@ -21,10 +21,10 @@
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
 from xml.dom import minidom
+
 import base64
 import os
 import re
-import tempfile
 
 from cloudinit import log as logging
 from cloudinit import sources
@@ -51,7 +51,7 @@ class DataSourceOVF(sources.DataSource):
         ud = ""
 
         defaults = {
-            "instance-id": "iid-dsovf"
+            "instance-id": "iid-dsovf",
         }
 
         (seedfile, contents) = get_ovf_env(self.paths.seed_dir)
@@ -198,7 +198,7 @@ def transport_iso9660(require_iso=True):
     for dev in devs:
         fullp = os.path.join("/dev/", dev)
 
-        if (fullp in mounted or
+        if (fullp in mounts or
             not cdmatch.match(dev) or os.path.isdir(fullp)):
             continue
 
@@ -210,7 +210,8 @@ def transport_iso9660(require_iso=True):
             continue
 
         try:
-            (fname, contents) = utils.mount_cb(fullp, get_ovf_env, mtype="iso9660")
+            (fname, contents) = util.mount_cb(fullp,
+                                               get_ovf_env, mtype="iso9660")
         except util.MountFailedError:
             util.logexc(LOG, "Failed mounting %s", fullp)
             continue
@@ -265,7 +266,8 @@ def get_properties(contents):
         raise XmlError("No 'PropertySection's")
 
     props = {}
-    propElems = find_child(propSections[0], lambda n: n.localName == "Property")
+    propElems = find_child(propSections[0],
+                            (lambda n: n.localName == "Property"))
 
     for elem in propElems:
         key = elem.attributes.getNamedItemNS(envNsURI, "key").value
diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 08669f5d..beb0f3d7 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -22,10 +22,9 @@
 
 from cloudinit import importer
 from cloudinit import log as logging
+from cloudinit import user_data as ud
 from cloudinit import util
 
-from cloudinit.user_data import processor as ud_proc
-
 DEP_FILESYSTEM = "FILESYSTEM"
 DEP_NETWORK = "NETWORK"
 DS_PREFIX = 'DataSource'
@@ -42,7 +41,6 @@ class DataSource(object):
         self.sys_cfg = sys_cfg
         self.distro = distro
         self.paths = paths
-        self.userdata_proc = ud_proc.UserDataProcessor(paths)
         self.userdata = None
         self.metadata = None
         self.userdata_raw = None
@@ -55,7 +53,7 @@ class DataSource(object):
     def get_userdata(self):
         if self.userdata is None:
             raw_data = self.get_userdata_raw()
-            self.userdata = self.userdata_proc.process(raw_data)
+            self.userdata = ud.UserDataProcessor(self.paths).process(raw_data)
         return self.userdata
 
     def get_userdata_raw(self):
@@ -73,7 +71,7 @@ class DataSource(object):
         if not self.metadata or 'public-keys' not in self.metadata:
             return keys
 
-        if isinstance(self.metadata['public-keys'], (str)):
+        if isinstance(self.metadata['public-keys'], (basestring, str)):
             return str(self.metadata['public-keys']).splitlines()
 
         if isinstance(self.metadata['public-keys'], (list, set)):
@@ -84,11 +82,12 @@ class DataSource(object):
                 # lp:506332 uec metadata service responds with
                 # data that makes boto populate a string for 'klist' rather
                 # than a list.
-                if isinstance(klist, (str)):
+                if isinstance(klist, (str, basestring)):
                     klist = [klist]
                 if isinstance(klist, (list, set)):
                     for pkey in klist:
-                        # there is an empty string at the end of the keylist, trim it
+                        # There is an empty string at
+                        # the end of the keylist, trim it
                         if pkey:
                             keys.append(pkey)
 
@@ -159,13 +158,14 @@ def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
     ds_list = list_sources(cfg_list, ds_deps, pkg_list)
     ds_names = [util.obj_name(f) for f in ds_list]
     LOG.info("Searching for data source in: %s", ds_names)
+
     for cls in ds_list:
         ds = util.obj_name(cls)
         try:
             s = cls(distro, sys_cfg, paths)
             if s.get_data():
                 return (s, ds)
-        except Exception as e:
+        except Exception:
             util.logexc(LOG, "Getting data from %s failed", ds)
 
     msg = "Did not find any data source, searched classes: %s" % (ds_names)
@@ -178,7 +178,8 @@ def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
 # return an ordered list of classes that match
 def list_sources(cfg_list, depends, pkg_list):
     src_list = []
-    LOG.info("Looking for for data source in: %s, %s that match %s", cfg_list, pkg_list, depends)
+    LOG.info(("Looking for for data source in: %s,"
+              " %s that matches %s"), cfg_list, pkg_list, depends)
     for ds_coll in cfg_list:
         ds_name = str(ds_coll)
         if not ds_name.startswith(DS_PREFIX):
@@ -201,8 +202,8 @@ def list_sources(cfg_list, depends, pkg_list):
             if not cls_matches:
                 continue
             src_list.extend(cls_matches)
-            LOG.debug("Found a match for data source %s in %s with matches %s", 
-                        ds_name, mod, cls_matches)
+            LOG.debug(("Found a match for data source %s"
+                       " in %s with matches %s"), ds_name, mod, cls_matches)
             break
     return src_list
 
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 2615d59f..b9076881 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -31,19 +31,23 @@ try:
 except ImportError:
     ConfigObj = None
 
-from cloudinit.settings import (PER_INSTANCE, FREQUENCIES)
 from cloudinit.settings import (OLD_CLOUD_CONFIG)
+from cloudinit.settings import (PER_INSTANCE, FREQUENCIES)
+
+from cloudinit.handlers import boot_hook as bh_part
+from cloudinit.handlers import cloud_config as cc_part
+from cloudinit.handlers import shell_script as ss_part
+from cloudinit.handlers import upstart_job as up_part
 
 from cloudinit import cloud
 from cloudinit import distros
-from cloudinit import modules
 from cloudinit import helpers
 from cloudinit import importer
 from cloudinit import log as logging
 from cloudinit import sources
-from cloudinit import util
-
+from cloudinit import transforms
 from cloudinit import user_data as ud
+from cloudinit import util
 
 LOG = logging.getLogger(__name__)
 
@@ -73,12 +77,19 @@ class Init(object):
     def distro(self):
         if not self._distro:
             d_cfg = util.get_cfg_by_path(self.cfg, ('system_info'), {})
+            # Ensure its a dictionary
+            if not isinstance(d_cfg, (dict)):
+                d_cfg = {}
             # Ensure not modified indirectly
             d_cfg = copy.deepcopy(d_cfg)
+            # Remove this since its path config, not distro config
             d_cfg.pop('paths', None)
-            distro_cls = distros.fetch(sys_cfg.pop('distro', 'ubuntu'))
+            # Try to find the right class to use
+            distro_name = d_cfg.pop('distro', 'ubuntu')
+            distro_cls = distros.fetch(distro_name)
             LOG.debug("Using distro class %s", distro_cls)
-            distro = distro_cls(d_cfg, helpers.Runners(self.paths))
+            distro = distro_cls(distro_name, d_cfg,
+                                helpers.Runners(self.paths))
             self._distro = distro
         return self._distro
 
@@ -93,7 +104,8 @@ class Init(object):
     @property
     def paths(self):
         if not self._paths:
-            path_info = util.get_cfg_by_path(self.cfg, ('system_info', 'paths'), {})
+            path_info = util.get_cfg_by_path(self.cfg,
+                                            ('system_info', 'paths'), {})
             # Ensure not modified indirectly
             path_info = copy.deepcopy(path_info)
             self._paths = helpers.Paths(path_info, self.datasource)
@@ -156,7 +168,7 @@ class Init(object):
             # by using the instance link, if purge_cache was called
             # the file wont exist
             return pickle.loads(util.load_file(pickled_fn))
-        except Exception as e:
+        except Exception:
             util.logexc(LOG, "Failed loading pickled datasource from %s",
                         pickled_fn)
             return None
@@ -166,7 +178,7 @@ class Init(object):
         try:
             contents = pickle.dumps(self.datasource)
             util.write_file(pickled_fn, contents, mode=0400)
-        except Exception as e:
+        except Exception:
             util.logexc(LOG, "Failed pickling datasource to %s", pickled_fn)
             return False
 
@@ -192,7 +204,8 @@ class Init(object):
             # (which will affect user-data handlers down the line...)
             sys_cfg = copy.deepcopy(self.cfg)
             ds_deps = copy.deepcopy(self.ds_deps)
-            (ds, dsname) = sources.find_source(sys_cfg, self.distro, self.paths,
+            (ds, dsname) = sources.find_source(sys_cfg, self.distro,
+                                               self.paths,
                                                ds_deps, cfg_list, pkg_list)
             LOG.debug("Loaded datasource %s - %s", dsname, ds)
         self.datasource = ds
@@ -270,6 +283,20 @@ class Init(object):
         processed_ud = "%s" % (self.datasource.get_userdata())
         util.write_file(self.paths.get_ipath('userdata'), processed_ud, 0600)
 
+    def _default_userdata_handlers(self):
+        opts = {
+            'paths': self.paths,
+            'instance_id': self.datasource.get_instance_id(),
+        }
+        # TODO Hmmm, should we dynamically import these??
+        def_handlers = [
+            cc_part.CloudConfigPartHandler(**opts),
+            ss_part.ShellScriptPartHandler(**opts),
+            bh_part.BootHookPartHandler(**opts),
+            up_part.UpstartJobPartHandler(**opts),
+        ]
+        return def_handlers
+
     def consume(self, frequency=PER_INSTANCE):
         cdir = self.paths.get_cpath("handlers")
         idir = self.paths.get_ipath("handlers")
@@ -279,8 +306,11 @@ class Init(object):
         sys.path.insert(0, cdir)
         sys.path.insert(0, idir)
 
+        # Ensure datasource fetched before activation (just incase)
+        ud_obj = self.datasource.get_userdata()
+
         # This keeps track of all the active handlers
-        c_handlers = helpers.ContentHandlers(self.paths)
+        c_handlers = helpers.ContentHandlers(paths=self.paths)
 
         # Add handlers in cdir
         potential_handlers = util.find_modules(cdir)
@@ -292,13 +322,10 @@ class Init(object):
             except:
                 util.logexc(LOG, "Failed to register handler from %s", fname)
 
-        def_handlers = c_handlers.register_defaults()
-        if def_handlers:
-            LOG.debug("Registered default handlers for %s", def_handlers)
-
-
-        # Ensure userdata fetched before activation (just incase)
-        ud_obj = self.datasource.get_userdata()
+        def_handlers = self._default_userdata_handlers()
+        applied_def_handlers = c_handlers.register_defaults(def_handlers)
+        if applied_def_handlers:
+            LOG.debug("Registered default handlers: %s", applied_def_handlers)
 
         # Form our cloud interface
         data = self.cloudify()
@@ -334,11 +361,11 @@ class Init(object):
 
 
 class Transforms(object):
-    def __init__(self, cloudobj, cfgfile=None):
-        self.datasource = cloudobj.datasource
+    def __init__(self, init, cfgfile=None):
+        self.datasource = init.fetch()
         self.cfgfile = cfgfile
-        self.basecfg = copy.deepcopy(cloudobj.cfg)
-        self.cloudobj = cloudobj
+        self.basecfg = copy.deepcopy(init.cfg)
+        self.init = init
         # Created on first use
         self._cachedcfg = None
 
@@ -409,25 +436,28 @@ class Transforms(object):
                                  (item, util.obj_name(item)))
         return module_list
 
-    def _transforms_modules(self, raw_mods):
+    def _fixup_transforms(self, raw_mods):
         mostly_mods = []
         for raw_mod in raw_mods:
             raw_name = raw_mod['mod']
             freq = raw_mod.get('freq')
             run_args = raw_mod.get('args') or []
-            mod_name = modules.form_module_name(raw_name)
+            mod_name = transforms.form_module_name(raw_name)
             if not mod_name:
                 continue
             if freq and freq not in FREQUENCIES:
-                LOG.warn("Config specified module %s has an unknown frequency %s", raw_name, freq)
+                LOG.warn(("Config specified transform %s"
+                          " has an unknown frequency %s"), raw_name, freq)
                 # Reset it so when ran it will get set to a known value
                 freq = None
-            mod = modules.fixup_module(importer.import_module(mod_name))
+            mod = transforms.fixup_module(importer.import_module(mod_name))
             mostly_mods.append([mod, raw_name, freq, run_args])
         return mostly_mods
 
     def _run_transforms(self, mostly_mods):
         failures = []
+        d_name = self.init.distro.name
+        c_cloud = self.init.cloudify()
         for (mod, name, freq, args) in mostly_mods:
             try:
                 # Try the modules frequency, otherwise fallback to a known one
@@ -436,17 +466,17 @@ class Transforms(object):
                 if not freq in FREQUENCIES:
                     freq = PER_INSTANCE
                 worked_distros = mod.distros
-                if worked_distros and self.cloud.distro.name() not in worked_distros:
-                    LOG.warn(("Module %s is verified on %s distros"
+                if (worked_distros and d_name not in worked_distros):
+                    LOG.warn(("Transform %s is verified on %s distros"
                               " but not on %s distro. It may or may not work"
-                              " correctly."), name, worked_distros,
-                              self.cloud.distro.name())
+                              " correctly."), name, worked_distros, d_name)
                 # Deep copy the config so that modules can't alter it
+                # Use the transforms logger and not our own
                 func_args = [name, copy.deepcopy(self.cfg),
-                             self.cloudobj, LOG, args]
-                # This name will affect the semphapore name created
+                             c_cloud, transforms.LOG, args]
+                # This name will affect the semaphore name created
                 run_name = "config-%s" % (name)
-                self.cloudobj.run(run_name, mod.handle, func_args, freq=freq)
+                c_cloud.run(run_name, mod.handle, func_args, freq=freq)
             except Exception as e:
                 util.logexc(LOG, "Running %s failed", mod)
                 failures.append((name, e))
@@ -454,5 +484,5 @@ class Transforms(object):
 
     def run(self, name):
         raw_mods = self._read_transforms(name)
-        mostly_mods = self._transforms_modules(raw_mods)
+        mostly_mods = self._fixup_transforms(raw_mods)
         return self._run_transforms(mostly_mods)
diff --git a/cloudinit/transforms/__init__.py b/cloudinit/transforms/__init__.py
index 8275b375..40affc4b 100644
--- a/cloudinit/transforms/__init__.py
+++ b/cloudinit/transforms/__init__.py
@@ -44,7 +44,7 @@ def fixup_module(mod, def_freq=PER_INSTANCE):
     else:
         freq = mod.frequency
         if freq and freq not in FREQUENCIES:
-            LOG.warn("Module %s has an unknown frequency %s", mod, freq)
+            LOG.warn("Transform %s has an unknown frequency %s", mod, freq)
     if not hasattr(mod, 'handle'):
         def empty_handle(_name, _cfg, _cloud, _log, _args):
             pass
diff --git a/cloudinit/transforms/cc_apt_update_upgrade.py b/cloudinit/transforms/cc_apt_update_upgrade.py
index c4a543ed..a4e058c6 100644
--- a/cloudinit/transforms/cc_apt_update_upgrade.py
+++ b/cloudinit/transforms/cc_apt_update_upgrade.py
@@ -71,7 +71,7 @@ def handle(_name, cfg, cloud, log, _args):
         except:
             util.logexc(log, "Failed to run debconf-set-selections")
 
-    pkglist = util.get_cfg_option_list_or_str(cfg, 'packages', [])
+    pkglist = util.get_cfg_option_list(cfg, 'packages', [])
 
     errors = []
     if update or len(pkglist) or upgrade:
@@ -96,7 +96,9 @@ def handle(_name, cfg, cloud, log, _args):
             errors.append(e)
 
     if len(errors):
-        raise errors[0]
+        log.warn("%s failed with exceptions, re-raising the last one",
+                 len(errors))
+        raise errors[-1]
 
 
 def mirror2lists_fileprefix(mirror):
@@ -186,7 +188,8 @@ def add_sources(srclist, template_params=None):
         try:
             util.write_file(ent['filename'], source + "\n", omode="ab")
         except:
-            errorlist.append([source, "failed write to file %s" % ent['filename']])
+            errorlist.append([source,
+                             "failed write to file %s" % ent['filename']])
 
     return errorlist
 
@@ -219,9 +222,10 @@ def find_apt_mirror(cloud, cfg):
             doms.extend((".localdomain", "",))
 
             mirror_list = []
+            distro = cloud.distro.name
             mirrorfmt = "http://%s-mirror%s/%s" % (distro, "%s", distro)
             for post in doms:
-                mirror_list.append(mirrorfmt % post)
+                mirror_list.append(mirrorfmt % (post))
 
             mirror = util.search_for_mirror(mirror_list)
 
diff --git a/cloudinit/transforms/cc_bootcmd.py b/cloudinit/transforms/cc_bootcmd.py
index a2efad32..80afb5e7 100644
--- a/cloudinit/transforms/cc_bootcmd.py
+++ b/cloudinit/transforms/cc_bootcmd.py
@@ -30,7 +30,8 @@ frequency = PER_ALWAYS
 def handle(name, cfg, cloud, log, _args):
 
     if "bootcmd" not in cfg:
-        log.debug("Skipping module named %s,  no 'bootcomd' key in configuration", name)
+        log.debug(("Skipping transform named %s,"
+                   " no 'bootcomd' key in configuration"), name)
         return
 
     with tempfile.NamedTemporaryFile(suffix=".sh") as tmpf:
@@ -39,7 +40,7 @@ def handle(name, cfg, cloud, log, _args):
             tmpf.write(content)
             tmpf.flush()
         except:
-            log.warn("Failed to shellify bootcmd")
+            util.logexc(log, "Failed to shellify bootcmd")
             raise
 
         try:
@@ -48,5 +49,6 @@ def handle(name, cfg, cloud, log, _args):
             cmd = ['/bin/sh', tmpf.name]
             util.subp(cmd, env=env, capture=False)
         except:
-            log.warn("Failed to run commands from bootcmd")
+            util.logexc(log,
+                        ("Failed to run bootcmd transform %s"), name)
             raise
diff --git a/cloudinit/transforms/cc_byobu.py b/cloudinit/transforms/cc_byobu.py
index 38586174..741aa934 100644
--- a/cloudinit/transforms/cc_byobu.py
+++ b/cloudinit/transforms/cc_byobu.py
@@ -30,7 +30,7 @@ def handle(name, cfg, _cloud, log, args):
         value = util.get_cfg_option_str(cfg, "byobu_by_default", "")
 
     if not value:
-        log.debug("Skipping module named %s, no 'byobu' values found", name)
+        log.debug("Skipping transform named %s, no 'byobu' values found", name)
         return
 
     if value == "user" or value == "system":
diff --git a/cloudinit/transforms/cc_ca_certs.py b/cloudinit/transforms/cc_ca_certs.py
index 8ca9a200..e0802bfe 100644
--- a/cloudinit/transforms/cc_ca_certs.py
+++ b/cloudinit/transforms/cc_ca_certs.py
@@ -23,6 +23,8 @@ CA_CERT_FILENAME = "cloud-init-ca-certs.crt"
 CA_CERT_CONFIG = "/etc/ca-certificates.conf"
 CA_CERT_SYSTEM_PATH = "/etc/ssl/certs/"
 
+distros = ['ubuntu']
+
 
 def update_ca_certs():
     """
@@ -70,22 +72,25 @@ def handle(name, cfg, _cloud, log, _args):
     """
     # If there isn't a ca-certs section in the configuration don't do anything
     if "ca-certs" not in cfg:
-        log.debug("Skipping module named %s, no 'ca-certs' key in configuration", name)
+        log.debug(("Skipping transform named %s,"
+                   " no 'ca-certs' key in configuration"), name)
         return
+
     ca_cert_cfg = cfg['ca-certs']
 
     # If there is a remove-defaults option set to true, remove the system
     # default trusted CA certs first.
     if ca_cert_cfg.get("remove-defaults", False):
-        log.debug("removing default certificates")
+        log.debug("Removing default certificates")
         remove_default_ca_certs()
 
     # If we are given any new trusted CA certs to add, add them.
     if "trusted" in ca_cert_cfg:
-        trusted_certs = util.get_cfg_option_list_or_str(ca_cert_cfg, "trusted")
+        trusted_certs = util.get_cfg_option_list(ca_cert_cfg, "trusted")
         if trusted_certs:
-            log.debug("adding %d certificates" % len(trusted_certs))
+            log.debug("Adding %d certificates" % len(trusted_certs))
             add_ca_certs(trusted_certs)
 
     # Update the system with the new cert configuration.
+    log.debug("Updating certificates")
     update_ca_certs()
diff --git a/cloudinit/transforms/cc_chef.py b/cloudinit/transforms/cc_chef.py
index 12c2f539..473e5f8b 100644
--- a/cloudinit/transforms/cc_chef.py
+++ b/cloudinit/transforms/cc_chef.py
@@ -31,7 +31,8 @@ def handle(name, cfg, cloud, log, _args):
 
     # If there isn't a chef key in the configuration don't do anything
     if 'chef' not in cfg:
-        log.debug("Skipping module named %s, no 'chef' key in configuration", name)
+        log.debug(("Skipping transform named %s,"
+                  " no 'chef' key in configuration"), name)
         return
     chef_cfg = cfg['chef']
 
diff --git a/cloudinit/transforms/cc_disable_ec2_metadata.py b/cloudinit/transforms/cc_disable_ec2_metadata.py
index 4d2a7f55..3c0dd57b 100644
--- a/cloudinit/transforms/cc_disable_ec2_metadata.py
+++ b/cloudinit/transforms/cc_disable_ec2_metadata.py
@@ -28,5 +28,6 @@ reject_cmd = ['route', 'add', '-host', '169.254.169.254', 'reject']
 
 
 def handle(_name, cfg, _cloud, _log, _args):
-    if util.get_cfg_option_bool(cfg, "disable_ec2_metadata", False):
+    disabled = util.get_cfg_option_bool(cfg, "disable_ec2_metadata", False)
+    if disabled:
         util.subp(reject_cmd)
diff --git a/cloudinit/transforms/cc_final_message.py b/cloudinit/transforms/cc_final_message.py
index dc4ae34c..c257b6d0 100644
--- a/cloudinit/transforms/cc_final_message.py
+++ b/cloudinit/transforms/cc_final_message.py
@@ -32,7 +32,7 @@ final_message_def = ("Cloud-init v. {{version}} finished at {{timestamp}}."
                      " Up {{uptime}} seconds.")
 
 
-def handle(name, cfg, cloud, log, args):
+def handle(_name, cfg, cloud, log, args):
 
     msg_in = None
     if len(args) != 0:
@@ -60,7 +60,7 @@ def handle(name, cfg, cloud, log, args):
         # Use stdout, stderr or the logger??
         content = templater.render_string(msg_in, subs)
         sys.stderr.write("%s\n" % (content))
-    except Exception as e:
+    except Exception:
         util.logexc(log, "Failed to render final message template")
 
     boot_fin_fn = cloud.paths.boot_finished
diff --git a/cloudinit/transforms/cc_foo.py b/cloudinit/transforms/cc_foo.py
index 8007f981..99135704 100644
--- a/cloudinit/transforms/cc_foo.py
+++ b/cloudinit/transforms/cc_foo.py
@@ -45,8 +45,8 @@ from cloudinit.settings import PER_INSTANCE
 #    informational purposes. If non existent all distros are assumed and 
 #    no warning occurs.
 
-frequency = settings.PER_INSTANCE
+frequency = PER_INSTANCE
 
 
-def handle(name, _cfg, _cloud, _log, _args):
-    print("Hi from %s" % (name))
+def handle(name, _cfg, _cloud, log, _args):
+    log.debug("Hi from transform %s", name)
diff --git a/cloudinit/transforms/cc_grub_dpkg.py b/cloudinit/transforms/cc_grub_dpkg.py
index c048d5cc..02f05ce3 100644
--- a/cloudinit/transforms/cc_grub_dpkg.py
+++ b/cloudinit/transforms/cc_grub_dpkg.py
@@ -54,9 +54,9 @@ def handle(_name, cfg, _cloud, log, _args):
     # now idevs and idevs_empty are set to determined values
     # or, those set by user
 
-    dconf_sel = ("grub-pc grub-pc/install_devices string %s\n"
+    dconf_sel = (("grub-pc grub-pc/install_devices string %s\n"
                  "grub-pc grub-pc/install_devices_empty boolean %s\n") %
-                (idevs, idevs_empty)
+                 (idevs, idevs_empty))
 
     log.debug("Setting grub debconf-set-selections with '%s','%s'" %
         (idevs, idevs_empty))
diff --git a/cloudinit/transforms/cc_keys_to_console.py b/cloudinit/transforms/cc_keys_to_console.py
index 2f2a5297..e974375f 100644
--- a/cloudinit/transforms/cc_keys_to_console.py
+++ b/cloudinit/transforms/cc_keys_to_console.py
@@ -18,23 +18,34 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+import os
+
 from cloudinit.settings import PER_INSTANCE
 from cloudinit import util
 
 frequency = PER_INSTANCE
 
+# This is a tool that cloud init provides
+helper_tool = '/usr/lib/cloud-init/write-ssh-key-fingerprints'
 
-def handle(_name, cfg, _cloud, log, _args):
-    cmd = ['/usr/lib/cloud-init/write-ssh-key-fingerprints']
-    fp_blacklist = util.get_cfg_option_list_or_str(cfg,
+
+def handle(name, cfg, _cloud, log, _args):
+    if not os.path.exists(helper_tool):
+        log.warn(("Unable to activate transform %s,"
+                  " helper tool not found at %s"), name, helper_tool)
+        return
+
+    fp_blacklist = util.get_cfg_option_list(cfg,
         "ssh_fp_console_blacklist", [])
-    key_blacklist = util.get_cfg_option_list_or_str(cfg,
+    key_blacklist = util.get_cfg_option_list(cfg,
         "ssh_key_console_blacklist", ["ssh-dss"])
+
     try:
+        cmd = [helper_tool]
         cmd.append(','.join(fp_blacklist))
         cmd.append(','.join(key_blacklist))
-        (stdout, stderr) = util.subp(cmd)
+        (stdout, _stderr) = util.subp(cmd)
         util.write_file('/dev/console', stdout)
     except:
-        log.warn("Writing keys to console failed!")
+        log.warn("Writing keys to /dev/console failed!")
         raise
diff --git a/cloudinit/transforms/cc_landscape.py b/cloudinit/transforms/cc_landscape.py
index 48491992..19948d0e 100644
--- a/cloudinit/transforms/cc_landscape.py
+++ b/cloudinit/transforms/cc_landscape.py
@@ -55,7 +55,8 @@ def handle(name, cfg, _cloud, log, _args):
     /etc/landscape/client.conf
     """
     if not ConfigObj:
-        log.warn("'ConfigObj' support not enabled, running %s disabled", name)
+        log.warn(("'ConfigObj' support not available,"
+                  " running transform %s disabled"), name)
         return
 
     ls_cloudcfg = cfg.get("landscape", {})
diff --git a/cloudinit/transforms/cc_locale.py b/cloudinit/transforms/cc_locale.py
index 3fb4c5d9..7f273123 100644
--- a/cloudinit/transforms/cc_locale.py
+++ b/cloudinit/transforms/cc_locale.py
@@ -49,7 +49,7 @@ def handle(name, cfg, cloud, log, args):
                                              "/etc/default/locale")
 
     if not locale:
-        log.debug(("Skipping module named %s, "
+        log.debug(("Skipping transform named %s, "
                    "no 'locale' configuration found"), name)
         return
 
diff --git a/cloudinit/transforms/cc_mcollective.py b/cloudinit/transforms/cc_mcollective.py
index aeeda9d2..5464fe8c 100644
--- a/cloudinit/transforms/cc_mcollective.py
+++ b/cloudinit/transforms/cc_mcollective.py
@@ -19,13 +19,10 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-from ConfigParser import ConfigParser
 from StringIO import StringIO
 
-import os
-
+from cloudinit import cfg as config
 from cloudinit import util
-from cloudinit import cfg
 
 pubcert_file = "/etc/mcollective/ssl/server-public.pem"
 pricert_file = "/etc/mcollective/ssl/server-private.pem"
@@ -35,7 +32,7 @@ def handle(name, cfg, cloud, log, _args):
 
     # If there isn't a mcollective key in the configuration don't do anything
     if 'mcollective' not in cfg:
-        log.debug(("Skipping module named %s, "
+        log.debug(("Skipping transform named %s, "
                    "no 'mcollective' key in configuration"), name)
         return
 
@@ -47,7 +44,7 @@ def handle(name, cfg, cloud, log, _args):
     # ... and then update the mcollective configuration
     if 'conf' in mcollective_cfg:
         # Create object for reading server.cfg values
-        mcollective_config = cfg.DefaultingConfigParser()
+        mcollective_config = config.DefaultingConfigParser()
         # Read server.cfg values from original file in order to be able to mix
         # the rest up
         old_contents = util.load_file('/etc/mcollective/server.cfg')
diff --git a/cloudinit/transforms/cc_mounts.py b/cloudinit/transforms/cc_mounts.py
index babcbda1..44182b87 100644
--- a/cloudinit/transforms/cc_mounts.py
+++ b/cloudinit/transforms/cc_mounts.py
@@ -20,7 +20,6 @@
 
 from string import whitespace  # pylint: disable=W0402
 
-import os
 import re
 
 from cloudinit import util
@@ -28,7 +27,7 @@ from cloudinit import util
 # shortname matches 'sda', 'sda1', 'xvda', 'hda', 'sdb', xvdb, vda, vdd1
 shortname_filter = r"^[x]{0,1}[shv]d[a-z][0-9]*$"
 shortname = re.compile(shortname_filter)
-ws = re.compile("[%s]+" % whitespace)
+ws = re.compile("[%s]+" % (whitespace))
 
 
 def is_mdname(name):
@@ -65,13 +64,14 @@ def handle(_name, cfg, cloud, log, _args):
             continue
 
         startname = str(cfgmnt[i][0])
-        LOG.debug("Attempting to determine the real name of %s", startname)
+        log.debug("Attempting to determine the real name of %s", startname)
 
         # workaround, allow user to specify 'ephemeral'
         # rather than more ec2 correct 'ephemeral0'
         if startname == "ephemeral":
             cfgmnt[i][0] = "ephemeral0"
-            log.debug("Adjusted mount option %s name from ephemeral to ephemeral0", (i + 1))
+            log.debug(("Adjusted mount option %s "
+                       "name from ephemeral to ephemeral0"), (i + 1))
 
         if is_mdname(startname):
             newname = cloud.device_name_to_device(startname)
@@ -136,7 +136,8 @@ def handle(_name, cfg, cloud, log, _args):
                 break
 
         if cfgmnt_has:
-            log.debug("Not including %s, already previously included", startname)
+            log.debug(("Not including %s, already"
+                       " previously included"), startname)
             continue
         cfgmnt.append(defmnt)
 
@@ -159,7 +160,7 @@ def handle(_name, cfg, cloud, log, _args):
     dirs = []
     for line in actlist:
         # write 'comment' in the fs_mntops, entry,  claiming this
-        line[3] = "%s,comment=cloudconfig" % line[3]
+        line[3] = "%s,%s" % (line[3], comment)
         if line[2] == "swap":
             needswap = True
         if line[1].startswith("/"):
@@ -168,7 +169,7 @@ def handle(_name, cfg, cloud, log, _args):
 
     fstab_lines = []
     fstab = util.load_file("/etc/fstab")
-    for line in fstab.read().splitlines():
+    for line in fstab.splitlines():
         try:
             toks = ws.split(line)
             if toks[3].find(comment) != -1:
diff --git a/cloudinit/transforms/cc_phone_home.py b/cloudinit/transforms/cc_phone_home.py
index 36af6dfa..98ff2b85 100644
--- a/cloudinit/transforms/cc_phone_home.py
+++ b/cloudinit/transforms/cc_phone_home.py
@@ -24,9 +24,8 @@ from cloudinit import util
 
 from cloudinit.settings import PER_INSTANCE
 
-from time import sleep
-
 frequency = PER_INSTANCE
+
 post_list_all = ['pub_key_dsa', 'pub_key_rsa', 'pub_key_ecdsa',
                  'instance_id', 'hostname']
 
@@ -49,7 +48,7 @@ def handle(name, cfg, cloud, log, args):
         ph_cfg = cfg['phone_home']
 
     if 'url' not in ph_cfg:
-        log.warn(("Skipping module named %s, "
+        log.warn(("Skipping transform named %s, "
                   "no 'url' found in 'phone_home' configuration"), name)
         return
 
@@ -60,7 +59,8 @@ def handle(name, cfg, cloud, log, args):
         tries = int(tries)
     except:
         tries = 10
-        util.logexc(log, "Configuration entry 'tries' is not an integer, using %s", tries)
+        util.logexc(log, ("Configuration entry 'tries'"
+                          " is not an integer, using %s instead"), tries)
 
     if post_list == "all":
         post_list = post_list_all
@@ -75,23 +75,37 @@ def handle(name, cfg, cloud, log, args):
         'pub_key_ecdsa': '/etc/ssh/ssh_host_ecdsa_key.pub',
     }
 
-    for n, path in pubkeys.iteritems():
+    for (n, path) in pubkeys.iteritems():
         try:
             all_keys[n] = util.load_file(path)
         except:
-            util.logexc(log, "%s: failed to open, can not phone home that data", path)
+            util.logexc(log, ("%s: failed to open, can not"
+                              " phone home that data"), path)
 
     submit_keys = {}
     for k in post_list:
         if k in all_keys:
             submit_keys[k] = all_keys[k]
         else:
-            submit_keys[k] = "N/A"
-            log.warn("Requested key %s from 'post' configuration list not available", k)
+            submit_keys[k] = None
+            log.warn(("Requested key %s from 'post'"
+                      " configuration list not available"), k)
 
-    url = templater.render_string(url, {'INSTANCE_ID': all_keys['instance_id']})
+    # Get them ready to be posted
+    real_submit_keys = {}
+    for (k, v) in submit_keys.iteritems():
+        if v is None:
+            real_submit_keys[k] = 'N/A'
+        else:
+            real_submit_keys[k] = str(v)
 
+    # In case the url is parameterized
+    url_params = {
+        'INSTANCE_ID': all_keys['instance_id'],
+    }
+    url = templater.render_string(url, url_params)
     try:
-        uhelp.readurl(url, data=submit_keys, retries=tries, sec_between=3)
+        uhelp.readurl(url, data=real_submit_keys, retries=tries, sec_between=3)
     except:
-        util.logexc(log, "Failed to post phone home data to %s in %s tries", url, tries)
+        util.logexc(log, ("Failed to post phone home data to"
+                          " %s in %s tries"), url, tries)
diff --git a/cloudinit/transforms/cc_puppet.py b/cloudinit/transforms/cc_puppet.py
index 0a21a929..76cc9732 100644
--- a/cloudinit/transforms/cc_puppet.py
+++ b/cloudinit/transforms/cc_puppet.py
@@ -24,31 +24,32 @@ import os
 import pwd
 import socket
 
+from cloudinit import cfg as config
 from cloudinit import util
-from cloudinit import cfg
 
 
 def handle(name, cfg, cloud, log, _args):
     # If there isn't a puppet key in the configuration don't do anything
     if 'puppet' not in cfg:
-        log.debug(("Skipping module named %s,"
+        log.debug(("Skipping transform named %s,"
                    " no 'puppet' configuration found"), name)
         return
 
     puppet_cfg = cfg['puppet']
 
     # Start by installing the puppet package ...
-    cloud.distro.install_packages(("puppet",))
+    cloud.distro.install_packages(["puppet"])
 
     # ... and then update the puppet configuration
     if 'conf' in puppet_cfg:
         # Add all sections from the conf object to puppet.conf
         contents = util.load_file('/etc/puppet/puppet.conf')
         # Create object for reading puppet.conf values
-        puppet_config = cfg.DefaultingConfigParser()
+        puppet_config = config.DefaultingConfigParser()
         # Read puppet.conf values from original file in order to be able to
         # mix the rest up. First clean them up (TODO is this really needed??)
-        cleaned_contents = '\n'.join([i.lstrip() for i in contents.splitlines()])
+        cleaned_lines = [i.lstrip() for i in contents.splitlines()]
+        cleaned_contents = '\n'.join(cleaned_lines)
         puppet_config.readfp(StringIO(cleaned_contents),
                              filename='/etc/puppet/puppet.conf')
         for (cfg_name, cfg) in puppet_cfg['conf'].iteritems():
@@ -81,7 +82,8 @@ def handle(name, cfg, cloud, log, _args):
                     puppet_config.set(cfg_name, o, v)
             # We got all our config as wanted we'll rename
             # the previous puppet.conf and create our new one
-            util.rename('/etc/puppet/puppet.conf', '/etc/puppet/puppet.conf.old')
+            util.rename('/etc/puppet/puppet.conf',
+                        '/etc/puppet/puppet.conf.old')
             contents = puppet_config.stringify()
             util.write_file('/etc/puppet/puppet.conf', contents)
 
@@ -91,7 +93,8 @@ def handle(name, cfg, cloud, log, _args):
                   '-e', 's/^START=.*/START=yes/',
                   '/etc/default/puppet'], capture=False)
     elif os.path.exists('/bin/systemctl'):
-        util.subp(['/bin/systemctl', 'enable', 'puppet.service'], capture=False)
+        util.subp(['/bin/systemctl', 'enable', 'puppet.service'],
+                  capture=False)
     elif os.path.exists('/sbin/chkconfig'):
         util.subp(['/sbin/chkconfig', 'puppet', 'on'], capture=False)
     else:
diff --git a/cloudinit/transforms/cc_resizefs.py b/cloudinit/transforms/cc_resizefs.py
index daaf4da9..fe012417 100644
--- a/cloudinit/transforms/cc_resizefs.py
+++ b/cloudinit/transforms/cc_resizefs.py
@@ -18,11 +18,8 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import errno
 import os
 import stat
-import sys
-import tempfile
 import time
 
 from cloudinit import util
@@ -46,15 +43,18 @@ def nodeify_path(devpth, where, log):
         if util.is_container():
             log.debug("Inside container, ignoring mknod failure in resizefs")
             return
-        log.warn("Failed to make device node to resize %s at %s", where, devpth)
+        log.warn("Failed to make device node to resize %s at %s",
+                 where, devpth)
         raise
 
 
 def get_fs_type(st_dev, path, log):
     try:
-        fs_type = util.find_devs_with(tag='TYPE', oformat='value',
+        dev_entries = util.find_devs_with(tag='TYPE', oformat='value',
                                          no_cache=True, path=path)
-        return fs_type
+        if not dev_entries:
+            return None
+        return dev_entries[0].strip()
     except util.ProcessExecutionError:
         util.logexc(log, ("Failed to get filesystem type"
                           " of maj=%s, min=%s for path %s"),
@@ -69,12 +69,16 @@ def handle(name, cfg, _cloud, log, args):
         resize_root = util.get_cfg_option_str(cfg, "resize_rootfs", True)
 
     if not util.translate_bool(resize_root):
-        log.debug("Skipping module named %s,  resizing disabled", name)
+        log.debug("Skipping transform named %s, resizing disabled", name)
         return
 
     # TODO is the directory ok to be used??
     resize_root_d = util.get_cfg_option_str(cfg, "resize_rootfs_tmp", "/run")
     util.ensure_dir(resize_root_d)
+
+    # TODO: allow what is to be resized to
+    # be configurable??
+    resize_what = "/"
     with util.SilentTemporaryFile(prefix="cloudinit.resizefs.",
                                   dir=resize_root_d, delete=True) as tfh:
         devpth = tfh.name
@@ -86,23 +90,25 @@ def handle(name, cfg, _cloud, log, args):
         # auto deletion
         tfh.unlink_now()
     
-        # TODO: allow what is to be resized to
-        # be configurable??
-        st_dev = nodeify_path(devpth, "/", log)
-        fs_type = get_fs_type(st_dev, devpath, log)
+        st_dev = nodeify_path(devpth, resize_what, log)
+        fs_type = get_fs_type(st_dev, devpth, log)
+        if not fs_type:
+            log.warn("Could not determine filesystem type of %s", resize_what)
+            return
     
         resizer = None
-        fstype_lc = fstype.lower()
+        fstype_lc = fs_type.lower()
         for (pfix, root_cmd) in resize_fs_prefixes_cmds:
             if fstype_lc.startswith(pfix):
                 resizer = root_cmd
                 break
 
         if not resizer:
-            log.warn("Not resizing unknown filesystem type %s", fs_type)
+            log.warn("Not resizing unknown filesystem type %s for %s",
+                     fs_type, resize_what)
             return
 
-        log.debug("Resizing using %s", resizer)
+        log.debug("Resizing %s (%s) using %s", resize_what, fs_type, resizer)
         resize_cmd = [resizer, devpth]
 
         if resize_root == "noblock":
@@ -125,8 +131,8 @@ def do_resize(resize_cmd, log):
     start = time.time()
     try:
         util.subp(resize_cmd)
-    except util.ProcessExecutionError as e:
-        util.logexc(log, "Failed to resize filesystem (using %s)", resize_cmd)
+    except util.ProcessExecutionError:
+        util.logexc(log, "Failed to resize filesystem (cmd=%s)", resize_cmd)
         raise
     tot_time = int(time.time() - start)
     log.debug("Resizing took %s seconds", tot_time)
diff --git a/cloudinit/transforms/cc_rightscale_userdata.py b/cloudinit/transforms/cc_rightscale_userdata.py
index cde11b54..40d76c89 100644
--- a/cloudinit/transforms/cc_rightscale_userdata.py
+++ b/cloudinit/transforms/cc_rightscale_userdata.py
@@ -53,16 +53,19 @@ def handle(name, _cfg, cloud, log, _args):
     try:
         ud = cloud.get_userdata_raw()
     except:
-        log.warn("Failed to get raw userdata in module %s", name)
+        log.warn("Failed to get raw userdata in transform %s", name)
         return
 
     try:
         mdict = parse_qs(ud)
         if not mdict or not my_hookname in mdict:
-            log.debug("Skipping module %s, did not find %s in parsed raw userdata", name, my_hookname)
+            log.debug(("Skipping transform %s, "
+                       "did not find %s in parsed"
+                       " raw userdata"), name, my_hookname)
             return
     except:
-        log.warn("Failed to parse query string %s into a dictionary", ud)
+        util.logexc(log, ("Failed to parse query string %s"
+                           " into a dictionary"), ud)
         raise
 
     wrote_fns = []
@@ -83,7 +86,8 @@ def handle(name, _cfg, cloud, log, _args):
                 wrote_fns.append(fname)
         except Exception as e:
             captured_excps.append(e)
-            util.logexc(log, "%s failed to read %s and write %s", my_name, url, fname)
+            util.logexc(log, "%s failed to read %s and write %s",
+                        my_name, url, fname)
 
     if wrote_fns:
         log.debug("Wrote out rightscale userdata to %s files", len(wrote_fns))
@@ -93,6 +97,6 @@ def handle(name, _cfg, cloud, log, _args):
         log.debug("%s urls were skipped or failed", skipped)
 
     if captured_excps:
-        log.warn("%s failed with exceptions, re-raising the last one", len(captured_excps))
+        log.warn("%s failed with exceptions, re-raising the last one",
+                 len(captured_excps))
         raise captured_excps[-1]
-
diff --git a/cloudinit/transforms/cc_rsyslog.py b/cloudinit/transforms/cc_rsyslog.py
index ccbe68ff..71b74711 100644
--- a/cloudinit/transforms/cc_rsyslog.py
+++ b/cloudinit/transforms/cc_rsyslog.py
@@ -36,7 +36,8 @@ def handle(name, cfg, cloud, log, _args):
 
     # process 'rsyslog'
     if not 'rsyslog' in cfg:
-        log.debug("Skipping module named %s, no 'rsyslog' key in configuration", name)
+        log.debug(("Skipping transform named %s,"
+                   " no 'rsyslog' key in configuration"), name)
         return
 
     def_dir = cfg.get('rsyslog_dir', DEF_DIR)
@@ -62,15 +63,16 @@ def handle(name, cfg, cloud, log, _args):
         if not filename.startswith("/"):
             filename = os.path.join(def_dir, filename)
 
+        # Truncate filename first time you see it
         omode = "ab"
-        # truncate filename first time you see it
         if filename not in files:
             omode = "wb"
             files.append(filename)
 
         try:
-            util.write_file(filename, content + "\n", omode=omode)
-        except Exception as e:
+            contents = "%s\n" % (content)
+            util.write_file(filename, contents, omode=omode)
+        except Exception:
             util.logexc(log, "Failed to write to %s", filename)
 
     # Attempt to restart syslogd
@@ -87,8 +89,8 @@ def handle(name, cfg, cloud, log, _args):
         log.debug("Restarting rsyslog")
         util.subp(['service', 'rsyslog', 'restart'])
         restarted = True
-    except Exception as e:
-        util.logexc("Failed restarting rsyslog")
+    except Exception:
+        util.logexc(log, "Failed restarting rsyslog")
 
     if restarted:
         # This only needs to run if we *actually* restarted
diff --git a/cloudinit/transforms/cc_runcmd.py b/cloudinit/transforms/cc_runcmd.py
index 19c0e721..31a254a5 100644
--- a/cloudinit/transforms/cc_runcmd.py
+++ b/cloudinit/transforms/cc_runcmd.py
@@ -25,13 +25,14 @@ from cloudinit import util
 
 def handle(name, cfg, cloud, log, _args):
     if "runcmd" not in cfg:
-        log.debug("Skipping module named %s, no 'runcmd' key in configuration", name)
+        log.debug(("Skipping transform named %s,"
+                   " no 'runcmd' key in configuration"), name)
         return
 
-    outfile = os.path.join(cloud.get_ipath('scripts'), "runcmd")
+    out_fn = os.path.join(cloud.get_ipath('scripts'), "runcmd")
     cmd = cfg["runcmd"]
     try:
         content = util.shellify(cmd)
-        util.write_file(outfile, content, 0700)
+        util.write_file(out_fn, content, 0700)
     except:
-        util.logexc(log, "Failed to shellify %s into file %s", cmd, outfile)
+        util.logexc(log, "Failed to shellify %s into file %s", cmd, out_fn)
diff --git a/cloudinit/transforms/cc_salt_minion.py b/cloudinit/transforms/cc_salt_minion.py
index 47cbc194..d05d2a1e 100644
--- a/cloudinit/transforms/cc_salt_minion.py
+++ b/cloudinit/transforms/cc_salt_minion.py
@@ -21,16 +21,17 @@ from cloudinit import util
 # Note: see http://saltstack.org/topics/installation/
 
 
-def handle(name, cfg, cloud, _log, _args):
+def handle(name, cfg, cloud, log, _args):
     # If there isn't a salt key in the configuration don't do anything
     if 'salt_minion' not in cfg:
-        log.debug("Skipping module named %s, no 'salt_minion' key in configuration", name)
+        log.debug(("Skipping transform named %s,"
+                   " no 'salt_minion' key in configuration"), name)
         return
 
     salt_cfg = cfg['salt_minion']
 
     # Start by installing the salt package ...
-    cloud.distro.install_packages(("salt",))
+    cloud.distro.install_packages(["salt"])
     
     # Ensure we can configure files at the right dir
     config_dir = salt_cfg.get("config_dir", '/etc/salt')
diff --git a/cloudinit/transforms/cc_scripts_per_boot.py b/cloudinit/transforms/cc_scripts_per_boot.py
index bcdf4400..364e1d02 100644
--- a/cloudinit/transforms/cc_scripts_per_boot.py
+++ b/cloudinit/transforms/cc_scripts_per_boot.py
@@ -29,12 +29,13 @@ frequency = PER_ALWAYS
 script_subdir = 'per-boot'
 
 
-def handle(_name, _cfg, cloud, log, _args):
+def handle(name, _cfg, cloud, log, _args):
     # Comes from the following:
     # https://forums.aws.amazon.com/thread.jspa?threadID=96918
     runparts_path = os.path.join(cloud.get_cpath(), 'scripts', script_subdir)
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("Failed to run-parts(%s) in %s", script_subdir, runparts_path)
+        log.warn("Failed to run transform %s (%s in %s)",
+                 name, script_subdir, runparts_path)
         raise
diff --git a/cloudinit/transforms/cc_scripts_per_instance.py b/cloudinit/transforms/cc_scripts_per_instance.py
index 8d6609a1..d75ab47d 100644
--- a/cloudinit/transforms/cc_scripts_per_instance.py
+++ b/cloudinit/transforms/cc_scripts_per_instance.py
@@ -29,12 +29,13 @@ frequency = PER_INSTANCE
 script_subdir = 'per-instance'
 
 
-def handle(_name, _cfg, cloud, log, _args):
+def handle(name, _cfg, cloud, log, _args):
     # Comes from the following:
     # https://forums.aws.amazon.com/thread.jspa?threadID=96918
     runparts_path = os.path.join(cloud.get_cpath(), 'scripts', script_subdir)
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("Failed to run-parts(%s) in %s", script_subdir, runparts_path)
+        log.warn("Failed to run transform %s (%s in %s)",
+                 name, script_subdir, runparts_path)
         raise
diff --git a/cloudinit/transforms/cc_scripts_per_once.py b/cloudinit/transforms/cc_scripts_per_once.py
index dbcec05d..80f8c325 100644
--- a/cloudinit/transforms/cc_scripts_per_once.py
+++ b/cloudinit/transforms/cc_scripts_per_once.py
@@ -29,12 +29,13 @@ frequency = PER_ONCE
 script_subdir = 'per-once'
 
 
-def handle(_name, _cfg, cloud, log, _args):
+def handle(name, _cfg, cloud, log, _args):
     # Comes from the following:
     # https://forums.aws.amazon.com/thread.jspa?threadID=96918
     runparts_path = os.path.join(cloud.get_cpath(), 'scripts', script_subdir)
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("Failed to run-parts(%s) in %s", script_subdir, runparts_path)
+        log.warn("Failed to run transform %s (%s in %s)",
+                 name, script_subdir, runparts_path)
         raise
diff --git a/cloudinit/transforms/cc_scripts_user.py b/cloudinit/transforms/cc_scripts_user.py
index 1e438ee6..f4fe3a2a 100644
--- a/cloudinit/transforms/cc_scripts_user.py
+++ b/cloudinit/transforms/cc_scripts_user.py
@@ -26,14 +26,17 @@ from cloudinit.settings import PER_INSTANCE
 
 frequency = PER_INSTANCE
 
+script_subdir = 'scripts'
 
-def handle(_name, _cfg, cloud, log, _args):
+
+def handle(name, _cfg, cloud, log, _args):
     # This is written to by the user data handlers
     # Ie, any custom shell scripts that come down
     # go here...
-    runparts_path = os.path.join(cloud.get_ipath_cur(), "scripts")
+    runparts_path = os.path.join(cloud.get_ipath_cur(), script_subdir)
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("Failed to run-parts(%s) in %s", "user-data", runparts_path)
+        log.warn("Failed to run transform %s (%s in %s)",
+                 name, script_subdir, runparts_path)
         raise
diff --git a/cloudinit/transforms/cc_set_hostname.py b/cloudinit/transforms/cc_set_hostname.py
index fa2b59c2..3ac8a8fa 100644
--- a/cloudinit/transforms/cc_set_hostname.py
+++ b/cloudinit/transforms/cc_set_hostname.py
@@ -24,7 +24,7 @@ from cloudinit import util
 def handle(name, cfg, cloud, log, _args):
     if util.get_cfg_option_bool(cfg, "preserve_hostname", False):
         log.debug(("Configuration option 'preserve_hostname' is set,"
-                    " not setting the hostname in %s"), name)
+                    " not setting the hostname in transform %s"), name)
         return
 
     (hostname, _fqdn) = util.get_hostname_fqdn(cfg, cloud)
diff --git a/cloudinit/transforms/cc_set_passwords.py b/cloudinit/transforms/cc_set_passwords.py
index 4f2cdb97..c0cc4e84 100644
--- a/cloudinit/transforms/cc_set_passwords.py
+++ b/cloudinit/transforms/cc_set_passwords.py
@@ -22,7 +22,7 @@ import sys
 
 from cloudinit import util
 
-from string import letters, digits
+from string import letters, digits  # pylint: disable=W0402
 
 # We are removing certain 'painful' letters/numbers
 pw_set = (letters.translate(None, 'loLOI') +
@@ -71,11 +71,13 @@ def handle(_name, cfg, cloud, log, args):
             util.subp(['chpasswd'], ch_in)
         except Exception as e:
             errors.append(e)
-            util.logexc(log, "Failed to set passwords with chpasswd for %s", users)
+            util.logexc(log,
+                        "Failed to set passwords with chpasswd for %s", users)
 
         if len(randlist):
-            sys.stderr.write("%s\n%s\n" % ("Set the following 'random' passwords\n",
-                '\n'.join(randlist)))
+            blurb = ("Set the following 'random' passwords\n",
+                     '\n'.join(randlist))
+            sys.stderr.write("%s\n%s\n" % blurb)
 
         if expire:
             expired_users = []
diff --git a/cloudinit/transforms/cc_ssh.py b/cloudinit/transforms/cc_ssh.py
index db6848d9..3c2b3622 100644
--- a/cloudinit/transforms/cc_ssh.py
+++ b/cloudinit/transforms/cc_ssh.py
@@ -65,8 +65,7 @@ def handle(_name, cfg, cloud, log, _args):
                 tgt_fn = key2file[key][0]
                 tgt_perms = key2file[key][1]
                 util.write_file(tgt_fn, val, tgt_perms)
-    
-        cmd = 'o=$(ssh-keygen -yf "%s") && echo "$o" root@localhost > "%s"'
+
         for priv, pub in priv2pub.iteritems():
             if pub in cfg['ssh_keys'] or not priv in cfg['ssh_keys']:
                 continue
@@ -78,11 +77,15 @@ def handle(_name, cfg, cloud, log, _args):
                     util.subp(cmd, capture=False)
                 log.debug("Generated a key for %s from %s", pair[0], pair[1])
             except:
-                util.logexc(log, "Failed generated a key for %s from %s", pair[0], pair[1])
+                util.logexc(log, ("Failed generated a key"
+                                  " for %s from %s"), pair[0], pair[1])
     else:
         # if not, generate them
-        for keytype in util.get_cfg_option_list_or_str(cfg, 'ssh_genkeytypes', generate_keys):
-            keyfile = '/etc/ssh/ssh_host_%s_key' % keytype
+        genkeys = util.get_cfg_option_list(cfg,
+                                            'ssh_genkeytypes', 
+                                            generate_keys)
+        for keytype in genkeys:
+            keyfile = '/etc/ssh/ssh_host_%s_key' % (keytype)
             if not os.path.exists(keyfile):
                 cmd = ['ssh-keygen', '-t', keytype, '-N', '', '-f', keyfile]
                 try:
@@ -90,26 +93,27 @@ def handle(_name, cfg, cloud, log, _args):
                     with util.SeLinuxGuard("/etc/ssh", recursive=True):
                         util.subp(cmd, capture=False)
                 except:
-                    util.logexc(log, "Failed generating key type %s to file %s", keytype, keyfile)
+                    util.logexc(log, ("Failed generating key type"
+                                      " %s to file %s"), keytype, keyfile)
 
     try:
         user = util.get_cfg_option_str(cfg, 'user')
         disable_root = util.get_cfg_option_bool(cfg, "disable_root", True)
         disable_root_opts = util.get_cfg_option_str(cfg, "disable_root_opts",
-            DISABLE_ROOT_OPTS)
+                                                    DISABLE_ROOT_OPTS)
 
         keys = cloud.get_public_ssh_keys() or []
         if "ssh_authorized_keys" in cfg:
             cfgkeys = cfg["ssh_authorized_keys"]
             keys.extend(cfgkeys)
 
-        apply_credentials(keys, user, disable_root, disable_root_opts, log)
+        apply_credentials(keys, user, disable_root, disable_root_opts)
     except:
         util.logexc(log, "Applying ssh credentials failed!")
 
 
 def apply_credentials(keys, user, disable_root,
-                      disable_root_opts=DISABLE_ROOT_OPTS, log=None):
+                      disable_root_opts=DISABLE_ROOT_OPTS):
 
     keys = set(keys)
     if user:
diff --git a/cloudinit/transforms/cc_ssh_import_id.py b/cloudinit/transforms/cc_ssh_import_id.py
index 019413d4..d57e4665 100644
--- a/cloudinit/transforms/cc_ssh_import_id.py
+++ b/cloudinit/transforms/cc_ssh_import_id.py
@@ -33,10 +33,14 @@ def handle(name, cfg, _cloud, log, args):
             ids = args[1:]
     else:
         user = util.get_cfg_option_str(cfg, "user", "ubuntu")
-        ids = util.get_cfg_option_list_or_str(cfg, "ssh_import_id", [])
+        ids = util.get_cfg_option_list(cfg, "ssh_import_id", [])
 
     if len(ids) == 0:
-        log.debug("Skipping module named %s, no ids found to import", name)
+        log.debug("Skipping transform named %s, no ids found to import", name)
+        return
+
+    if not user:
+        log.debug("Skipping transform named %s, no user found to import", name)
         return
 
     cmd = ["sudo", "-Hu", user, "ssh-import-id"] + ids
diff --git a/cloudinit/transforms/cc_timezone.py b/cloudinit/transforms/cc_timezone.py
index 02cbf2dc..747c436c 100644
--- a/cloudinit/transforms/cc_timezone.py
+++ b/cloudinit/transforms/cc_timezone.py
@@ -18,20 +18,22 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+from cloudinit import util
+
 from cloudinit.settings import PER_INSTANCE
 
 frequency = PER_INSTANCE
 
 
-def handle(_name, cfg, cloud, log, args):
+def handle(name, cfg, cloud, log, args):
     if len(args) != 0:
         timezone = args[0]
     else:
         timezone = util.get_cfg_option_str(cfg, "timezone", False)
 
     if not timezone:
-        log.debug("Skipping module named %s, no 'timezone' specified", name)
+        log.debug("Skipping transform named %s, no 'timezone' specified", name)
         return
-    
+
     # Let the distro handle settings its timezone
     cloud.distro.set_timezone(timezone)
diff --git a/cloudinit/transforms/cc_update_etc_hosts.py b/cloudinit/transforms/cc_update_etc_hosts.py
index 361097a6..d0e56183 100644
--- a/cloudinit/transforms/cc_update_etc_hosts.py
+++ b/cloudinit/transforms/cc_update_etc_hosts.py
@@ -30,22 +30,30 @@ def handle(name, cfg, cloud, log, _args):
     manage_hosts = util.get_cfg_option_str(cfg, "manage_etc_hosts", False)
     if util.translate_bool(manage_hosts, addons=['template']):
         (hostname, fqdn) = util.get_hostname_fqdn(cfg, cloud)
-        # Render from template file
         if not hostname:
-            log.warn("Option 'manage_etc_hosts' was set, but no hostname was found")
+            log.warn(("Option 'manage_etc_hosts' was set,"
+                     " but no hostname was found"))
             return
-        tpl_fn_name = cloud.get_template_filename("hosts.%s" % (cloud.distro.name()))
+
+        # Render from a template file
+        distro_n = cloud.distro.name
+        tpl_fn_name = cloud.get_template_filename("hosts.%s" % (distro_n))
         if not tpl_fn_name:
-            raise Exception("No hosts template could be found for distro %s" % (cloud.distro.name()))
+            raise Exception(("No hosts template could be"
+                             " found for distro %s") % (distro_n))
+
         templater.render_to_file(tpl_fn_name, '/etc/hosts',
                                 {'hostname': hostname, 'fqdn': fqdn})
+
     elif manage_hosts == "localhost":
-        log.debug("Managing localhost in /etc/hosts")
         (hostname, fqdn) = util.get_hostname_fqdn(cfg, cloud)
         if not hostname:
-            log.warn("Option 'manage_etc_hosts' was set, but no hostname was found")
+            log.warn(("Option 'manage_etc_hosts' was set,"
+                     " but no hostname was found"))
             return
+
+        log.debug("Managing localhost in /etc/hosts")
         cloud.distro.update_etc_hosts(hostname, fqdn)
     else:
         log.debug(("Configuration option 'manage_etc_hosts' is not set,"
-                    " not managing /etc/hosts in %s"), name)
+                    " not managing /etc/hosts in transform %s"), name)
diff --git a/cloudinit/transforms/cc_update_hostname.py b/cloudinit/transforms/cc_update_hostname.py
index 439bdcb3..58444fab 100644
--- a/cloudinit/transforms/cc_update_hostname.py
+++ b/cloudinit/transforms/cc_update_hostname.py
@@ -18,6 +18,8 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+import os
+
 from cloudinit import util
 from cloudinit.settings import PER_ALWAYS
 
@@ -27,7 +29,7 @@ frequency = PER_ALWAYS
 def handle(name, cfg, cloud, log, _args):
     if util.get_cfg_option_bool(cfg, "preserve_hostname", False):
         log.debug(("Configuration option 'preserve_hostname' is set,"
-                    " not updating the hostname in %s"), name)
+                    " not updating the hostname in transform %s"), name)
         return
 
     (hostname, _fqdn) = util.get_hostname_fqdn(cfg, cloud)
diff --git a/cloudinit/transforms/cc_welcome.py b/cloudinit/transforms/cc_welcome.py
index 0db71125..04691d21 100644
--- a/cloudinit/transforms/cc_welcome.py
+++ b/cloudinit/transforms/cc_welcome.py
@@ -35,9 +35,9 @@ welcome_message_def = ("Cloud-init v. {{version}} starting stage {{stage}} at "
 frequency = PER_ALWAYS
 
 
-def handle(name, cfg, cloud, log, args):
+def handle(_name, cfg, cloud, log, args):
 
-    welcome_msg = util.get_cfg_option_str(cfg, "welcome_msg"):
+    welcome_msg = util.get_cfg_option_str(cfg, "welcome_msg")
     if not welcome_msg:
         tpl_fn = cloud.get_template_filename("welcome_msg")
         if tpl_fn:
@@ -54,7 +54,7 @@ def handle(name, cfg, cloud, log, args):
         'stage': stage,
         'version': version.version_string(),
         'uptime': util.uptime(),
-        'timestamp', util.time_rfc2822(),
+        'timestamp': util.time_rfc2822(),
     }
     try:
         contents = templater.render_string(welcome_msg, tpl_params)
diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index 64fc2734..9915b8b0 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -22,14 +22,15 @@
 
 
 import os
-import glob
 
 import email
-
+from email.mime.multipart import MIMEMultipart
+from email.mime.text import MIMEText
 from email.mime.base import MIMEBase
 
 from cloudinit import importer
 from cloudinit import log as logging
+from cloudinit import url_helper
 from cloudinit import util
 
 from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE, FREQUENCIES)
@@ -86,7 +87,7 @@ class UserDataProcessor(object):
         self.paths = paths
 
     def process(self, blob):
-        base_msg = ud.convert_string(blob)
+        base_msg = convert_string(blob)
         process_msg = MIMEMultipart()
         self._process_msg(base_msg, process_msg)
         return process_msg
@@ -105,7 +106,7 @@ class UserDataProcessor(object):
                 ctype_orig = UNDEF_TYPE
     
             if ctype_orig in TYPE_NEEDED:
-                ctype = ud.type_from_starts_with(payload)
+                ctype = type_from_starts_with(payload)
     
             if ctype is None:
                 ctype = ctype_orig
@@ -158,7 +159,7 @@ class UserDataProcessor(object):
                 if not url_helper.ok_http_code(st):
                     content = ''
 
-            new_msg = ud.convert_string(content)
+            new_msg = convert_string(content)
             self._process_msg(new_msg, append_msg)
 
     def _explode_archive(self, archive, append_msg):
@@ -179,7 +180,7 @@ class UserDataProcessor(object):
             content = ent.get('content', '')
             mtype = ent.get('type')
             if not mtype:
-                mtype = ud.type_from_starts_with(content, ARCHIVE_UNDEF_TYPE)
+                mtype = type_from_starts_with(content, ARCHIVE_UNDEF_TYPE)
 
             maintype, subtype = mtype.split('/', 1)
             if maintype == "text":
diff --git a/cloudinit/util.py b/cloudinit/util.py
index 7259d933..1f884df8 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -22,8 +22,8 @@
 
 from StringIO import StringIO
 
+import copy as obj_copy
 import contextlib
-import copy
 import errno
 import glob
 import grp
@@ -35,12 +35,11 @@ import pwd
 import random
 import shutil
 import socket
-import string
+import string # pylint: disable=W0402
 import subprocess
 import sys
 import tempfile
 import time
-import traceback
 import types
 import urlparse
 
@@ -171,7 +170,8 @@ def fork_cb(child_cb, *args):
             child_cb(*args)
             os._exit(0)  # pylint: disable=W0212
         except:
-            logexc(LOG, "Failed forking and calling callback %s", obj_name(child_cb))
+            logexc(LOG, ("Failed forking and"
+                         " calling callback %s"), obj_name(child_cb))
             os._exit(1)  # pylint: disable=W0212
     else:
         LOG.debug("Forked child %s who will run callback %s",
@@ -549,10 +549,11 @@ def load_yaml(blob, default=None, allowed=(dict,)):
         converted = yaml.load(blob)
         if not isinstance(converted, allowed):
             # Yes this will just be caught, but thats ok for now...
-            raise TypeError("Yaml load allows %s root types, but got %s instead" %
+            raise TypeError(("Yaml load allows %s root types,"
+                             " but got %s instead") %
                             (allowed, obj_name(converted)))
         loaded = converted
-    except (yaml.YAMLError, TypeError, ValueError) as exc:
+    except (yaml.YAMLError, TypeError, ValueError):
         logexc(LOG, "Failed loading yaml blob")
     return loaded
 
@@ -833,15 +834,12 @@ def find_devs_with(criteria=None, oformat='device',
         options.append(path)
     cmd = blk_id_cmd + options
     (out, _err) = subp(cmd)
-    if path:
-        return out.strip()
-    else:
-        entries = []
-        for line in out.splitlines():
-            line = line.strip()
-            if line:
-                entries.append(line)
-        return entries
+    entries = []
+    for line in out.splitlines():
+        line = line.strip()
+        if line:
+            entries.append(line)
+    return entries
 
 
 def load_file(fname, read_cb=None, quiet=False):
@@ -1109,7 +1107,7 @@ def mount_cb(device, callback, data=None, rw=False, mtype=None):
 
 def get_builtin_cfg():
     # Deep copy so that others can't modify
-    return copy.deepcopy(CFG_BUILTIN)
+    return obj_copy.deepcopy(CFG_BUILTIN)
 
 
 def sym_link(source, link):
@@ -1140,16 +1138,14 @@ def time_rfc2822():
 
 
 def uptime():
+    uptime_str = '??'
     try:
-        uptimef = load_file("/proc/uptime").strip()
-        if not uptimef:
-            uptime = 'na'
-        else:
-            uptime = uptimef.split()[0]
+        contents = load_file("/proc/uptime").strip()
+        if contents:
+            uptime_str = contents.split()[0]
     except:
         logexc(LOG, "Unable to read uptime from /proc/uptime")
-        uptime = '??'
-    return uptime
+    return uptime_str
 
 
 def ensure_file(path):
@@ -1261,7 +1257,8 @@ def shellify(cmdlist, add_header=True):
             content = "%s%s\n" % (content, args)
         else:
             raise RuntimeError(("Unable to shellify type %s"
-                                " which is not a list or string") % (obj_name(args)))
+                                " which is not a list or string")
+                               % (obj_name(args)))
     LOG.debug("Shellified %s to %s", cmdlist, content)
     return content
 
@@ -1275,8 +1272,7 @@ def is_container():
         try:
             # try to run a helper program. if it returns true/zero
             # then we're inside a container. otherwise, no
-            cmd = [helper]
-            subp(cmd, allowed_rc=[0])
+            subp([helper])
             return True
         except (IOError, OSError):
             pass

From b0b8296481c93b714fad3c17687268b3e48e5d5e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 07:32:18 -0700
Subject: [PATCH 119/434] Add the running of 2to3 via the makefile.

---
 Makefile | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/Makefile b/Makefile
index 0a73f987..783ebd76 100644
--- a/Makefile
+++ b/Makefile
@@ -12,5 +12,8 @@ pyflakes:
 test:
 	nosetests tests/unittests/
 
-.PHONY: test pylint pyflakes
+2to3:
+	2to3 $(PY_FILES)
+
+.PHONY: test pylint pyflakes 2to3
 

From bf1ed422b0bd0bb5a0656743a983fb12cb1d0a58 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 07:32:51 -0700
Subject: [PATCH 120/434] 1. Add in one function that will do output
 redirection from config for a given mode. 2. Adjust the usage of items() to
 iteritems() which will help translation to python 3.

---
 cloudinit/util.py | 24 +++++++++++++++++++-----
 1 file changed, 19 insertions(+), 5 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 1f884df8..15444fed 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -225,7 +225,7 @@ def read_conf(fname):
 
 
 def clean_filename(fn):
-    for (k, v) in FN_REPLACEMENTS.items():
+    for (k, v) in FN_REPLACEMENTS.iteritems():
         fn = fn.replace(k, v)
     return fn.strip()
 
@@ -344,6 +344,11 @@ def get_cfg_by_path(yobj, keyp, default=None):
     return cur
 
 
+def fixup_output(cfg, mode):
+    (outfmt, errfmt) = get_output_cfg(cfg, mode)
+    redirect_output(outfmt, errfmt)
+
+
 # redirect_output(outfmt, errfmt, orig_out, orig_err)
 #  replace orig_out and orig_err with filehandles specified in outfmt or errfmt
 #  fmt can be:
@@ -353,8 +358,14 @@ def get_cfg_by_path(yobj, keyp, default=None):
 #
 #   with a '|', arguments are passed to shell, so one level of
 #   shell escape is required.
-def redirect_output(outfmt, errfmt, o_out=sys.stdout, o_err=sys.stderr):
+def redirect_output(outfmt, errfmt, o_out=None, o_err=None):
+    if not o_out:
+        o_out = sys.stdout
+    if not o_err:
+        o_err = sys.stderr
+
     if outfmt:
+        LOG.debug("Redirecting %s to %s", o_out, outfmt)
         (mode, arg) = outfmt.split(" ", 1)
         if mode == ">" or mode == ">>":
             owith = "ab"
@@ -365,15 +376,18 @@ def redirect_output(outfmt, errfmt, o_out=sys.stdout, o_err=sys.stderr):
             proc = subprocess.Popen(arg, shell=True, stdin=subprocess.PIPE)
             new_fp = proc.stdin
         else:
-            raise TypeError("Invalid type for outfmt: %s" % outfmt)
+            raise TypeError("Invalid type for output format: %s" % outfmt)
 
         if o_out:
             os.dup2(new_fp.fileno(), o_out.fileno())
+
         if errfmt == outfmt:
+            LOG.debug("Redirecting %s to %s", o_err, outfmt)
             os.dup2(new_fp.fileno(), o_err.fileno())
             return
 
     if errfmt:
+        LOG.debug("Redirecting %s to %s", o_err, errfmt)
         (mode, arg) = errfmt.split(" ", 1)
         if mode == ">" or mode == ">>":
             owith = "ab"
@@ -384,7 +398,7 @@ def redirect_output(outfmt, errfmt, o_out=sys.stdout, o_err=sys.stderr):
             proc = subprocess.Popen(arg, shell=True, stdin=subprocess.PIPE)
             new_fp = proc.stdin
         else:
-            raise TypeError("Invalid type for errfmt: %s" % errfmt)
+            raise TypeError("Invalid type for error format: %s" % errfmt)
 
         if o_err:
             os.dup2(new_fp.fileno(), o_err.fileno())
@@ -912,7 +926,7 @@ def chownbyname(fname, user=None, group=None):
 #     output: "| logger -p"
 #     error: "> /dev/null"
 # this returns the specific 'mode' entry, cleanly formatted, with value
-def get_output_cfg(cfg, mode="init"):
+def get_output_cfg(cfg, mode):
     ret = [None, None]
     if not cfg or not 'output' in cfg:
         return ret

From ffb83c5c9f198bf458ad693002f27de3e6eeb39a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 07:33:39 -0700
Subject: [PATCH 121/434] Adjust the usage of map items() to iteritems() which
 will help later translation to python 3.

---
 cloudinit/sources/DataSourceEc2.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/sources/DataSourceEc2.py b/cloudinit/sources/DataSourceEc2.py
index 38be71fa..0108954f 100644
--- a/cloudinit/sources/DataSourceEc2.py
+++ b/cloudinit/sources/DataSourceEc2.py
@@ -198,7 +198,7 @@ class DataSourceEc2(sources.DataSource):
         # 'ephemeral0': '/dev/sdb',
         # 'root': '/dev/sda1'}
         found = None
-        for (entname, device) in self.metadata['block-device-mapping'].items():
+        for (entname, device) in self.metadata['block-device-mapping'].iteritems():
             if entname == name:
                 found = device
                 break

From 6ba90f8058737dde57c24eb4003788b55f451830 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 07:34:35 -0700
Subject: [PATCH 122/434] Adjust the usage of map items() to iteritems()
 which will help later translation to python 3.

---
 cloudinit/sources/DataSourceOVF.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/sources/DataSourceOVF.py b/cloudinit/sources/DataSourceOVF.py
index 258d8d03..f38fb4b9 100644
--- a/cloudinit/sources/DataSourceOVF.py
+++ b/cloudinit/sources/DataSourceOVF.py
@@ -65,7 +65,7 @@ class DataSourceOVF(sources.DataSource):
             np = {'iso': transport_iso9660,
                   'vmware-guestd': transport_vmware_guestd, }
             name = None
-            for name, transfunc in np.iteritems():
+            for (name, transfunc) in np.iteritems():
                 (contents, _dev, _fname) = transfunc()
                 if contents:
                     break

From ecc68ef3ac6602716933539c0d1d8d0902353dab Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 07:34:52 -0700
Subject: [PATCH 123/434] Adjust the usage of map items() to iteritems() which
 will help later translation to python 3.

---
 cloudinit/sources/__init__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index beb0f3d7..55900119 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -78,7 +78,7 @@ class DataSource(object):
             return list(self.metadata['public-keys'])
 
         if isinstance(self.metadata['public-keys'], (dict)):
-            for _keyname, klist in self.metadata['public-keys'].items():
+            for (_keyname, klist) in self.metadata['public-keys'].iteritems():
                 # lp:506332 uec metadata service responds with
                 # data that makes boto populate a string for 'klist' rather
                 # than a list.

From 4da2470198906439f6cc722210f1e8935398c2e4 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 07:36:29 -0700
Subject: [PATCH 124/434] Only set an env variable for instance id if we
 actually got one.

---
 cloudinit/transforms/cc_bootcmd.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/cloudinit/transforms/cc_bootcmd.py b/cloudinit/transforms/cc_bootcmd.py
index 80afb5e7..0c45a307 100644
--- a/cloudinit/transforms/cc_bootcmd.py
+++ b/cloudinit/transforms/cc_bootcmd.py
@@ -45,7 +45,9 @@ def handle(name, cfg, cloud, log, _args):
 
         try:
             env = os.environ.copy()
-            env['INSTANCE_ID'] = cloud.get_instance_id()
+            iid = cloud.get_instance_id()
+            if iid:
+                env['INSTANCE_ID'] = str(iid)
             cmd = ['/bin/sh', tmpf.name]
             util.subp(cmd, env=env, capture=False)
         except:

From 71fcd1463cf3d9a025e090ffc83fc3c7c1859b12 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 07:37:35 -0700
Subject: [PATCH 125/434] Some simple fixes that will make the python 3
 translation easier

---
 cloudinit/user_data.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index 9915b8b0..866bf6de 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -68,7 +68,8 @@ INCLUSION_TYPES_MAP = {
 }
 
 # Sorted longest first
-INCLUSION_SRCH = sorted(INCLUSION_TYPES_MAP.keys(), key=(lambda e: 0 - len(e)))
+INCLUSION_SRCH = sorted(list(INCLUSION_TYPES_MAP.keys()),
+                        key=(lambda e: 0 - len(e)))
 
 # Various special content types
 TYPE_NEEDED = ["text/plain", "text/x-not-multipart"]
@@ -193,7 +194,7 @@ class UserDataProcessor(object):
                 msg.add_header('Content-Disposition', 'attachment',
                                 filename=ent['filename'])
 
-            for header in ent.keys():
+            for header in list(ent.keys()):
                 if header in ('content', 'filename', 'type'):
                     continue
                 msg.add_header(header, ent['header'])
@@ -363,7 +364,7 @@ def convert_string(raw_data, headers=None):
     data = util.decomp_str(raw_data)
     if "mime-version:" in data[0:4096].lower():
         msg = email.message_from_string(data)
-        for (key, val) in headers.items():
+        for (key, val) in headers.iteritems():
             if key in msg:
                 msg.replace_header(key, val)
             else:

From e7750ba1f25334da3e537d206c6742948b7a73e9 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 07:38:41 -0700
Subject: [PATCH 126/434] Some simple fixes that will make the python 3
 translation easier

---
 cloudinit/transforms/cc_chef.py | 2 +-
 cloudinit/transforms/cc_ssh.py  | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/transforms/cc_chef.py b/cloudinit/transforms/cc_chef.py
index 473e5f8b..31bfb85f 100644
--- a/cloudinit/transforms/cc_chef.py
+++ b/cloudinit/transforms/cc_chef.py
@@ -69,7 +69,7 @@ def handle(name, cfg, cloud, log, _args):
         initial_json['run_list'] = chef_cfg['run_list']
     if 'initial_attributes' in chef_cfg:
         initial_attributes = chef_cfg['initial_attributes']
-        for k in initial_attributes.keys():
+        for k in list(initial_attributes.keys()):
             initial_json[k] = initial_attributes[k]
     util.write_file('/etc/chef/firstboot.json', json.dumps(initial_json))
 
diff --git a/cloudinit/transforms/cc_ssh.py b/cloudinit/transforms/cc_ssh.py
index 3c2b3622..f5c22e28 100644
--- a/cloudinit/transforms/cc_ssh.py
+++ b/cloudinit/transforms/cc_ssh.py
@@ -66,7 +66,7 @@ def handle(_name, cfg, cloud, log, _args):
                 tgt_perms = key2file[key][1]
                 util.write_file(tgt_fn, val, tgt_perms)
 
-        for priv, pub in priv2pub.iteritems():
+        for (priv, pub) in priv2pub.iteritems():
             if pub in cfg['ssh_keys'] or not priv in cfg['ssh_keys']:
                 continue
             pair = (key2file[priv][0], key2file[pub][0])

From 85e7f52f991cefb11ee8d71d33e207bfeaa0439e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 07:39:42 -0700
Subject: [PATCH 127/434] Some simple fixes that will make the python 3
 translation easier

---
 cloudinit/sources/DataSourceMAAS.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/sources/DataSourceMAAS.py b/cloudinit/sources/DataSourceMAAS.py
index 9e639649..40ace947 100644
--- a/cloudinit/sources/DataSourceMAAS.py
+++ b/cloudinit/sources/DataSourceMAAS.py
@@ -204,7 +204,7 @@ def check_seed_contents(content, seed):
     if len(content) == 0:
         raise MAASSeedDirNone("%s: no data files found" % seed)
 
-    found = content.keys()
+    found = list(content.keys())
     missing = [k for k in md_required if k not in found]
     if len(missing):
         raise MAASSeedDirMalformed("%s: missing files %s" % (seed, missing))

From 68b6d7861498b6f00e0e50bffe73ba7a65a92026 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 07:39:56 -0700
Subject: [PATCH 128/434] Cleanups around the usage of the apt pipe line value.

1. Add a comment onto why this is done
2. Fix the usage of range to search the list and not a string
3. Make the filecontents template just one multiline variable.
---
 cloudinit/transforms/cc_apt_pipelining.py | 20 ++++++++++++--------
 1 file changed, 12 insertions(+), 8 deletions(-)

diff --git a/cloudinit/transforms/cc_apt_pipelining.py b/cloudinit/transforms/cc_apt_pipelining.py
index 69027b0c..3c24d7c3 100644
--- a/cloudinit/transforms/cc_apt_pipelining.py
+++ b/cloudinit/transforms/cc_apt_pipelining.py
@@ -25,31 +25,35 @@ distros = ['ubuntu', 'debian']
 
 default_file = "/etc/apt/apt.conf.d/90cloud-init-pipelining"
 
+# Acquire::http::Pipeline-Depth can be a value
+# from 0 to 5 indicating how many outstanding requests APT should send.
+# A value of zero MUST be specified if the remote host does not properly linger
+# on TCP connections - otherwise data corruption will occur.
+
 
 def handle(_name, cfg, _cloud, log, _args):
 
     apt_pipe_value = util.get_cfg_option_str(cfg, "apt_pipelining", False)
-    apt_pipe_value = str(apt_pipe_value).lower()
+    apt_pipe_value_s = str(apt_pipe_value).lower().strip()
 
-    if apt_pipe_value == "false":
+    if apt_pipe_value_s == "false":
         write_apt_snippet("0", log)
 
-    elif apt_pipe_value in ("none", "unchanged", "os"):
+    elif apt_pipe_value_s in ("none", "unchanged", "os"):
         return
 
-    elif apt_pipe_value in str(range(0, 6)):
-        write_apt_snippet(apt_pipe_value, log)
+    elif apt_pipe_value_s in [str(b) for b in xrange(0, 6)]:
+        write_apt_snippet(apt_pipe_value_s, log)
 
     else:
-        log.warn("Invalid option for apt_pipeling: %s" % apt_pipe_value)
+        log.warn("Invalid option for apt_pipeling: %s", apt_pipe_value)
 
 
 def write_apt_snippet(setting, log, f_name=default_file):
     """ Writes f_name with apt pipeline depth 'setting' """
 
-    acquire_pipeline_depth = 'Acquire::http::Pipeline-Depth "%s";\n'
     file_contents = ("//Written by cloud-init per 'apt_pipelining'\n"
-                     + (acquire_pipeline_depth % setting))
+                     'Acquire::http::Pipeline-Depth "%s";\n') % (setting)
 
     util.write_file(f_name, file_contents)
 

From 651861e3f83110c923ee1e58bfa108d11923516f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 08:53:09 -0700
Subject: [PATCH 129/434] 1. Remove path function, since we have a path class
 2. Be explicit with file perms (even though it's duplicated)

---
 cloudinit/distros/__init__.py | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index fd4c70c1..e85e702e 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -75,10 +75,6 @@ class Distro(object):
     def get_package_mirror(self):
         return self.get_option('package_mirror')
 
-    def get_paths(self):
-        paths = self.get_option("paths") or {}
-        return copy.deepcopy(paths)
-
     def apply_network(self, settings, bring_up=True):
         # Write it out
         self._write_network(settings)
@@ -127,7 +123,7 @@ class Distro(object):
             need_write = True
         if need_write:
             contents = new_etchosts.getvalue()
-            util.write_file("/etc/hosts", contents)
+            util.write_file("/etc/hosts", contents, mode=0644)
 
     def _interface_action(self, action):
         if action not in IFACE_ACTIONS:

From a170a6e225b21214b069123eab1d1902fbc2b5de Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 08:53:51 -0700
Subject: [PATCH 130/434] Have the contents formed on a previous line which
 seems prettier.

---
 cloudinit/distros/ubuntu.py | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index 9252a1c4..ad12400a 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -44,7 +44,8 @@ class Distro(distros.Distro):
         self._apt_get(command, args)
 
     def set_hostname(self, hostname):
-        util.write_file("/etc/hostname", "%s\n" % hostname, 0644)
+        contents = "%s\n" % (hostname)
+        util.write_file("/etc/hostname", contents, 0644)
         LOG.debug("Setting hostname to %s", hostname)
         util.subp(['hostname', hostname])
 
@@ -59,7 +60,8 @@ class Distro(distros.Distro):
             update_files.append("/etc/hostname")
         for fn in update_files:
             try:
-                util.write_file(fn, "%s\n" % hostname, 0644)
+                contents = "%s\n" % (hostname)
+                util.write_file(fn, contents, 0644)
             except:
                 util.logexc(LOG, "Failed to write hostname %s to %s",
                             hostname, fn)

From 9b3dd45833b49deaeaa495b47c33b32be8173ead Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 08:54:20 -0700
Subject: [PATCH 131/434] 1. Remove content handler iid param, not used. 2.
 Ensure if iid is found that it is converted to a string before path joining.

---
 cloudinit/helpers.py | 18 ++++++++++--------
 1 file changed, 10 insertions(+), 8 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index c276a54c..5e47794b 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -80,16 +80,17 @@ class FileSemaphores(object):
     def clear_all(self):
         try:
             util.del_dir(self.sem_path)
-        except (IOError, OSError) as e:
-            LOG.debug("Failed deleting semaphore directory %s due to %s",
-                      self.sem_path, e)
+        except (IOError, OSError):
+            util.logexc(LOG, "Failed deleting semaphore directory %s", 
+                        self.sem_path)
 
     def _acquire(self, name, freq):
+        # Check again if its been already gotten
         if self.has_run(name, freq):
             return None
         # This is a race condition since nothing atomic is happening
         # here, but this should be ok due to the nature of when
-        # and where cloud-init runs... (file writing is not a lock..)
+        # and where cloud-init runs... (file writing is not a lock...)
         sem_file = self._get_path(name, freq)
         contents = "%s: %s\n" % (os.getpid(), time())
         try:
@@ -100,9 +101,11 @@ class FileSemaphores(object):
         return sem_file
 
     def has_run(self, name, freq):
-        if freq == PER_ALWAYS:
+        if not freq or freq == PER_ALWAYS:
             return False
         sem_file = self._get_path(name, freq)
+        # This isn't really a good atomic check
+        # but it suffices for where and when cloudinit runs
         if os.path.exists(sem_file):
             return True
         return False
@@ -157,10 +160,9 @@ class Runners(object):
 
 class ContentHandlers(object):
 
-    def __init__(self, paths, iid=None):
+    def __init__(self, paths):
         self.paths = paths
         self.registered = {}
-        self.iid = iid
 
     def __contains__(self, item):
         return self.is_registered(item)
@@ -245,7 +247,7 @@ class Paths(object):
         iid = self.datasource.get_instance_id()
         if iid is None:
             return None
-        ipath = os.path.join(self.cloud_dir, 'instances', iid)
+        ipath = os.path.join(self.cloud_dir, 'instances', str(iid))
         add_on = self.lookups.get(name)
         if add_on:
             ipath = os.path.join(ipath, add_on)

From a9c9de637647801c04cbadcfbd1ee7c2ca8dea76 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 08:54:52 -0700
Subject: [PATCH 132/434] For now just stick to using newline joining.

---
 cloudinit/netinfo.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/cloudinit/netinfo.py b/cloudinit/netinfo.py
index 0d729502..013f8178 100644
--- a/cloudinit/netinfo.py
+++ b/cloudinit/netinfo.py
@@ -126,7 +126,7 @@ def netdev_pformat():
         max_len = len(max(netdev_s.splitlines(), key=len))
         header = util.center("Net device info", "+", max_len)
         lines.extend([header, netdev_s])
-    return os.linesep.join(lines)
+    return "\n".join(lines)
 
 
 def route_pformat():
@@ -149,11 +149,11 @@ def route_pformat():
         max_len = len(max(route_s.splitlines(), key=len))
         header = util.center("Route info", "+", max_len)
         lines.extend([header, route_s])
-    return os.linesep.join(lines)
+    return "\n".join(lines)
 
 
 def debug_info():
     lines = []
     lines.append(netdev_pformat())
     lines.append(route_pformat())
-    return os.linesep.join(lines)
+    return "\n".join(lines)

From 8527291a38be92693c97be5b5d07bb49896c5ba2 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 08:55:13 -0700
Subject: [PATCH 133/434] Fix pylint line length too big issue.

---
 cloudinit/sources/DataSourceEc2.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/cloudinit/sources/DataSourceEc2.py b/cloudinit/sources/DataSourceEc2.py
index 0108954f..c2c3b9b7 100644
--- a/cloudinit/sources/DataSourceEc2.py
+++ b/cloudinit/sources/DataSourceEc2.py
@@ -198,13 +198,15 @@ class DataSourceEc2(sources.DataSource):
         # 'ephemeral0': '/dev/sdb',
         # 'root': '/dev/sda1'}
         found = None
-        for (entname, device) in self.metadata['block-device-mapping'].iteritems():
+        bdm_items = self.metadata['block-device-mapping'].iteritems()
+        for (entname, device) in bdm_items:
             if entname == name:
                 found = device
                 break
             # LP: #513842 mapping in Euca has 'ephemeral' not 'ephemeral0'
             if entname == "ephemeral" and name == "ephemeral0":
                 found = device
+
         if found is None:
             LOG.debug("Unable to convert %s to a device", name)
             return None
@@ -212,6 +214,7 @@ class DataSourceEc2(sources.DataSource):
         ofound = found
         if not found.startswith("/"):
             found = "/dev/%s" % found
+
         if os.path.exists(found):
             return found
 

From 58135f1538a1bb5c68937d53dc85d2b414ec4c2c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 08:55:39 -0700
Subject: [PATCH 134/434] Adjust how config is extracted in that it now can be
 extracted via 3 different modes.

1. Restricted - which doesn't give back the system info (used by handlers/transforms/public cfg api)
2. System - which only gives back the system info (used by distro class)
3. Paths - gives back only the system/path info (used by the path class)
---
 cloudinit/stages.py | 29 ++++++++++++++++-------------
 1 file changed, 16 insertions(+), 13 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index b9076881..63b7cf12 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -76,15 +76,8 @@ class Init(object):
     @property
     def distro(self):
         if not self._distro:
-            d_cfg = util.get_cfg_by_path(self.cfg, ('system_info'), {})
-            # Ensure its a dictionary
-            if not isinstance(d_cfg, (dict)):
-                d_cfg = {}
-            # Ensure not modified indirectly
-            d_cfg = copy.deepcopy(d_cfg)
-            # Remove this since its path config, not distro config
-            d_cfg.pop('paths', None)
             # Try to find the right class to use
+            d_cfg = self._extract_cfg('system')
             distro_name = d_cfg.pop('distro', 'ubuntu')
             distro_cls = distros.fetch(distro_name)
             LOG.debug("Using distro class %s", distro_cls)
@@ -95,19 +88,29 @@ class Init(object):
 
     @property
     def cfg(self):
+        return self._extract_cfg('restricted')
+
+    def _extract_cfg(self, restriction):
         # None check so that we don't keep on re-loading if empty
         if self._cfg is None:
             self._cfg = self._read_cfg()
             LOG.debug("Loading init config %s", self._cfg)
-        return self._cfg
+        # Nobody gets the real config
+        ocfg = copy.deepcopy(self._cfg)
+        if restriction == 'restricted':
+            ocfg.pop('system_info', None)
+        elif restriction == 'system':
+            ocfg = util.get_cfg_by_path(ocfg, ('system_info',), {})
+        elif restriction == 'paths':
+            ocfg = util.get_cfg_by_path(ocfg, ('system_info', 'paths'), {})
+        if not isinstance(ocfg, (dict)):
+            ocfg = {}
+        return ocfg
 
     @property
     def paths(self):
         if not self._paths:
-            path_info = util.get_cfg_by_path(self.cfg,
-                                            ('system_info', 'paths'), {})
-            # Ensure not modified indirectly
-            path_info = copy.deepcopy(path_info)
+            path_info = self._extract_cfg('paths')
             self._paths = helpers.Paths(path_info, self.datasource)
         return self._paths
 

From 09abe287ab82b5a9f0dd4dbc186577d0a69e7e5b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 08:57:05 -0700
Subject: [PATCH 135/434] Allow file rendering to pass in a file permission
 when writing.

---
 cloudinit/templater.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/templater.py b/cloudinit/templater.py
index 41315adf..c4259fa0 100644
--- a/cloudinit/templater.py
+++ b/cloudinit/templater.py
@@ -29,9 +29,9 @@ def render_from_file(fn, params):
     return render_string(util.load_file(fn), params, name=fn)
 
 
-def render_to_file(fn, outfn, params):
+def render_to_file(fn, outfn, params, mode=0644):
     contents = render_from_file(fn, params)
-    util.write_file(outfn, contents)
+    util.write_file(outfn, contents, mode=mode)
 
 
 def render_string(content, params, name=None):

From ff74db9447da6e010e92ec0020d319f2319b6463 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 08:57:28 -0700
Subject: [PATCH 136/434] Clean up this log statement to be more useful.

---
 cloudinit/transforms/cc_apt_pipelining.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/transforms/cc_apt_pipelining.py b/cloudinit/transforms/cc_apt_pipelining.py
index 3c24d7c3..d8e574b9 100644
--- a/cloudinit/transforms/cc_apt_pipelining.py
+++ b/cloudinit/transforms/cc_apt_pipelining.py
@@ -57,4 +57,4 @@ def write_apt_snippet(setting, log, f_name=default_file):
 
     util.write_file(f_name, file_contents)
 
-    log.debug("Wrote %s with APT pipeline setting" % f_name)
+    log.debug("Wrote %s with apt pipeline depth setting %s", f_name, setting)

From 113e28f07b8bcc08dcbe73090d748a5fced59b76 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 08:58:08 -0700
Subject: [PATCH 137/434] 1. Add comment as to what http proxy setting means 2.
 Adjust so file contents will join with a string instead of appending to
 something that might not be a string

---
 cloudinit/transforms/cc_apt_update_upgrade.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/transforms/cc_apt_update_upgrade.py b/cloudinit/transforms/cc_apt_update_upgrade.py
index a4e058c6..d49d8bd2 100644
--- a/cloudinit/transforms/cc_apt_update_upgrade.py
+++ b/cloudinit/transforms/cc_apt_update_upgrade.py
@@ -49,6 +49,7 @@ def handle(_name, cfg, cloud, log, _args):
     proxy_filename = "/etc/apt/apt.conf.d/95cloud-init-proxy"
     if proxy:
         try:
+            # See http://linux.die.net/man/5/apt.conf
             contents = "Acquire::HTTP::Proxy \"%s\";\n"
             util.write_file(proxy_filename, contents % (proxy))
         except Exception as e:
@@ -186,7 +187,7 @@ def add_sources(srclist, template_params=None):
                 errorlist.append([source, "failed add key"])
 
         try:
-            util.write_file(ent['filename'], source + "\n", omode="ab")
+            util.write_file(ent['filename'], "%s\n" % (source), omode="ab")
         except:
             errorlist.append([source,
                              "failed write to file %s" % ent['filename']])

From 83c3f385b77b92cad04280aefdb810291d12d874 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 08:58:54 -0700
Subject: [PATCH 138/434] Have the ensure file function be able to take in a
 file permission.

---
 cloudinit/util.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 15444fed..ed12dada 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -1162,8 +1162,8 @@ def uptime():
     return uptime_str
 
 
-def ensure_file(path):
-    write_file(path, content='', omode="ab")
+def ensure_file(path, mode=0644):
+    write_file(path, content='', omode="ab", mode=mode)
 
 
 def chmod(path, mode):

From 5ec781a4cef3849ada44c61bd2459aa4e644d671 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 09:31:52 -0700
Subject: [PATCH 139/434] Rename to fixup transform/fixup handler/form
 transform name instead of form mod*

---
 cloudinit/stages.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 63b7cf12..9c772243 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -319,7 +319,7 @@ class Init(object):
         potential_handlers = util.find_modules(cdir)
         for (fname, modname) in potential_handlers.iteritems():
             try:
-                mod = ud.fixup_module(importer.import_module(modname))
+                mod = ud.fixup_handler(importer.import_module(modname))
                 types = c_handlers.register(mod)
                 LOG.debug("Added handler for %s from %s", types, fname)
             except:
@@ -445,7 +445,7 @@ class Transforms(object):
             raw_name = raw_mod['mod']
             freq = raw_mod.get('freq')
             run_args = raw_mod.get('args') or []
-            mod_name = transforms.form_module_name(raw_name)
+            mod_name = transforms.form_transform_name(raw_name)
             if not mod_name:
                 continue
             if freq and freq not in FREQUENCIES:
@@ -453,7 +453,7 @@ class Transforms(object):
                           " has an unknown frequency %s"), raw_name, freq)
                 # Reset it so when ran it will get set to a known value
                 freq = None
-            mod = transforms.fixup_module(importer.import_module(mod_name))
+            mod = transforms.fixup_transform(importer.import_module(mod_name))
             mostly_mods.append([mod, raw_name, freq, run_args])
         return mostly_mods
 

From 8da6397f2894aa52af1383968c32b59691275992 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 09:32:22 -0700
Subject: [PATCH 140/434] 1. Change to fixup transform/form transform name 2.
 Check lowercase name against .py instead of unknown case.

---
 cloudinit/transforms/__init__.py | 7 +++----
 1 file changed, 3 insertions(+), 4 deletions(-)

diff --git a/cloudinit/transforms/__init__.py b/cloudinit/transforms/__init__.py
index 40affc4b..2460f316 100644
--- a/cloudinit/transforms/__init__.py
+++ b/cloudinit/transforms/__init__.py
@@ -26,9 +26,9 @@ from cloudinit import log as logging
 LOG = logging.getLogger(__name__)
 
 
-def form_module_name(name):
+def form_transform_name(name):
     canon_name = name.replace("-", "_")
-    if canon_name.endswith(".py"):
+    if canon_name.lower().endswith(".py"):
         canon_name = canon_name[0:(len(canon_name) - 3)]
     canon_name = canon_name.strip()
     if not canon_name:
@@ -38,7 +38,7 @@ def form_module_name(name):
     return canon_name
 
 
-def fixup_module(mod, def_freq=PER_INSTANCE):
+def fixup_transform(mod, def_freq=PER_INSTANCE):
     if not hasattr(mod, 'frequency'):
         setattr(mod, 'frequency', def_freq)
     else:
@@ -49,7 +49,6 @@ def fixup_module(mod, def_freq=PER_INSTANCE):
         def empty_handle(_name, _cfg, _cloud, _log, _args):
             pass
         setattr(mod, 'handle', empty_handle)
-    # Used only for warning if possibly running on a not checked distro...
     if not hasattr(mod, 'distros'):
         setattr(mod, 'distros', None)
     return mod

From 90b382fd98fbd305e7681721beb0854f72521d92 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 09:33:27 -0700
Subject: [PATCH 141/434] 1. Change to fixup handler instead of fixup module 2.
 Add logging of unknown content types + separate payload logging detail
 message into a separate function.

---
 cloudinit/user_data.py | 36 ++++++++++++++++++++++++------------
 1 file changed, 24 insertions(+), 12 deletions(-)

diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index 866bf6de..f64a1707 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -250,7 +250,7 @@ class PartHandler(object):
         raise NotImplementedError()
 
 
-def fixup_module(mod, def_freq=PER_INSTANCE):
+def fixup_handler(mod, def_freq=PER_INSTANCE):
     if not hasattr(mod, "handler_version"):
         setattr(mod, "handler_version", 1)
     if not hasattr(mod, 'list_types'):
@@ -307,7 +307,7 @@ def walker_handle_handler(pdata, _ctype, _filename, payload):
     util.write_file(modfname, payload, 0600)
     handlers = pdata['handlers']
     try:
-        mod = fixup_module(importer.import_module(modname))
+        mod = fixup_handler(importer.import_module(modname))
         handlers.register(mod)
         call_begin(mod, pdata['data'], frequency)
         pdata['handlercount'] = curcount + 1
@@ -315,23 +315,35 @@ def walker_handle_handler(pdata, _ctype, _filename, payload):
         util.logexc(LOG, "Failed at registered python file: %s", modfname)
 
 
+def extract_first_or_bytes(blob, size):
+    # Extract the first line upto X bytes or X bytes from more than the
+    # first line if the first line does not contain enough bytes
+    first_line = blob.split("\n", 1)[0]
+    if len(first_line) >= size:
+        start = first_line[:size]
+    else:
+        start = blob[0:size]
+    return start
+
+
 def walker_callback(pdata, ctype, filename, payload):
     if ctype in PART_CONTENT_TYPES:
         walker_handle_handler(pdata, ctype, filename, payload)
         return
     handlers = pdata['handlers']
     if ctype not in handlers:
+        # Extract the first line or 24 bytes for displaying in the log
+        start = extract_first_or_bytes(payload, 24)
+        details = "'%s...'" % (start.encode("string-escape"))
         if ctype == NOT_MULTIPART_TYPE:
-            # Extract the first line or 24 bytes for displaying in the log
-            start = payload.split("\n", 1)[0][:24]
-            if start < payload:
-                details = "starting '%s...'" % start.encode("string-escape")
-            else:
-                details = repr(payload)
-            LOG.warning("Unhandled non-multipart userdata: %s", details)
-        return
-    run_part(handlers[ctype], pdata['data'], ctype, filename,
-             payload, pdata['frequency'])
+            LOG.warning("Unhandled non-multipart (%s) userdata: %s",
+                        ctype, details)
+        else:
+            LOG.warning("Unhandled unknown content-type (%s) userdata: %s",
+                        ctype, details)
+    else:
+        run_part(handlers[ctype], pdata['data'], ctype, filename,
+                 payload, pdata['frequency'])
 
 
 # Callback is a function that will be called with 

From e186f3d5187016664a6b04f7e80f7d472c4b6a3e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 09:39:12 -0700
Subject: [PATCH 142/434] 1. Add a constant for the "cc_" prefix, so that it
 can be easily changed if desired.

---
 cloudinit/transforms/__init__.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/cloudinit/transforms/__init__.py b/cloudinit/transforms/__init__.py
index 2460f316..391a916e 100644
--- a/cloudinit/transforms/__init__.py
+++ b/cloudinit/transforms/__init__.py
@@ -25,6 +25,9 @@ from cloudinit import log as logging
 
 LOG = logging.getLogger(__name__)
 
+# TODO remove this from being a prefix??
+TRANSFORM_PREFIX = "cc_"
+
 
 def form_transform_name(name):
     canon_name = name.replace("-", "_")
@@ -33,8 +36,8 @@ def form_transform_name(name):
     canon_name = canon_name.strip()
     if not canon_name:
         return None
-    if not canon_name.startswith("cc_"):
-        canon_name = 'cc_%s' % (canon_name)
+    if not canon_name.startswith(TRANSFORM_PREFIX):
+        canon_name = '%s%s' % (TRANSFORM_PREFIX, canon_name)
     return canon_name
 
 

From e2eb9bbc7efd79df5c2a0b381063d54bdc2e42d1 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 09:41:13 -0700
Subject: [PATCH 143/434] Unused import removed

---
 cloudinit/netinfo.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/cloudinit/netinfo.py b/cloudinit/netinfo.py
index 013f8178..a6b9116d 100644
--- a/cloudinit/netinfo.py
+++ b/cloudinit/netinfo.py
@@ -20,8 +20,6 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import os
-
 import cloudinit.util as util
 
 from prettytable import PrettyTable

From 433b4dba27283989487095240023b587985d3138 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 09:44:47 -0700
Subject: [PATCH 144/434] For the different base classes, ensure we are using
 the 'abc' module + appropriate annotations + metaclasses.

---
 cloudinit/sources/__init__.py | 5 +++++
 cloudinit/user_data.py        | 7 ++++++-
 2 files changed, 11 insertions(+), 1 deletion(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 55900119..46350255 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -20,6 +20,8 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+import abc
+
 from cloudinit import importer
 from cloudinit import log as logging
 from cloudinit import user_data as ud
@@ -37,6 +39,9 @@ class DataSourceNotFoundException(Exception):
 
 
 class DataSource(object):
+
+    __metaclass__ = abc.ABCMeta
+
     def __init__(self, sys_cfg, distro, paths):
         self.sys_cfg = sys_cfg
         self.distro = distro
diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index f64a1707..28c9f2ce 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -20,7 +20,7 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-
+import abc
 import os
 
 import email
@@ -233,6 +233,9 @@ class UserDataProcessor(object):
 
 
 class PartHandler(object):
+
+    __metaclass__ = abc.ABCMeta
+
     def __init__(self, frequency, version=2):
         self.handler_version = version
         self.frequency = frequency
@@ -240,12 +243,14 @@ class PartHandler(object):
     def __repr__(self):
         return "%s: [%s]" % (util.obj_name(self), self.list_types())
 
+    @abc.abstractmethod
     def list_types(self):
         raise NotImplementedError()
 
     def handle_part(self, data, ctype, filename, payload, frequency):
         return self._handle_part(data, ctype, filename, payload, frequency)
 
+    @abc.abstractmethod
     def _handle_part(self, data, ctype, filename, payload, frequency):
         raise NotImplementedError()
 

From a9538d6e203fc06422350f5f40d1e5a8bd6de58c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 09:51:45 -0700
Subject: [PATCH 145/434] ContentHandlers does not need the paths variable
 anymore, so remove it.

---
 cloudinit/helpers.py | 3 +--
 cloudinit/stages.py  | 2 +-
 2 files changed, 2 insertions(+), 3 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 5e47794b..76faa1d5 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -160,8 +160,7 @@ class Runners(object):
 
 class ContentHandlers(object):
 
-    def __init__(self, paths):
-        self.paths = paths
+    def __init__(self):
         self.registered = {}
 
     def __contains__(self, item):
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 9c772243..5dc289ea 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -313,7 +313,7 @@ class Init(object):
         ud_obj = self.datasource.get_userdata()
 
         # This keeps track of all the active handlers
-        c_handlers = helpers.ContentHandlers(paths=self.paths)
+        c_handlers = helpers.ContentHandlers()
 
         # Add handlers in cdir
         potential_handlers = util.find_modules(cdir)

From dd8d2f3ca4b2873c94413fd1f8995ee30f08ef7a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 10:56:08 -0700
Subject: [PATCH 146/434] Make the top level __init__ similar to the other top
 level __inits__ where just util functions and base classes are defined there.

---
 cloudinit/handlers/__init__.py     | 196 +++++++++++++++++++++++++++++
 cloudinit/handlers/boot_hook.py    |  21 ++--
 cloudinit/handlers/cloud_config.py |  28 +++--
 cloudinit/handlers/shell_script.py |  10 +-
 cloudinit/handlers/upstart_job.py  |  10 +-
 5 files changed, 235 insertions(+), 30 deletions(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index 09163abb..0ff80a9e 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -20,3 +20,199 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+import abc
+import os
+
+from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE, FREQUENCIES)
+
+from cloudinit import importer
+from cloudinit import log as logging
+from cloudinit import url_helper
+from cloudinit import util
+
+LOG = logging.getLogger(__name__)
+
+# Used as the content type when a message is not multipart
+# and it doesn't contain its own content-type
+NOT_MULTIPART_TYPE = "text/x-not-multipart"
+
+# When none is assigned this gets used
+OCTET_TYPE = 'application/octet-stream'
+
+# Special content types that signal the start and end of processing
+CONTENT_END = "__end__"
+CONTENT_START = "__begin__"
+CONTENT_SIGNALS = [CONTENT_START, CONTENT_END]
+
+# Used when a part-handler type is encountered
+# to allow for registration of new types.
+PART_CONTENT_TYPES = ["text/part-handler"]
+PART_HANDLER_FN_TMPL = 'part-handler-%03d'
+
+# For parts without filenames
+PART_FN_TPL = 'part-%03d'
+
+# Different file beginnings to there content type
+INCLUSION_TYPES_MAP = {
+    '#include': 'text/x-include-url',
+    '#include-once': 'text/x-include-once-url',
+    '#!': 'text/x-shellscript',
+    '#cloud-config': 'text/cloud-config',
+    '#upstart-job': 'text/upstart-job',
+    '#part-handler': 'text/part-handler',
+    '#cloud-boothook': 'text/cloud-boothook',
+    '#cloud-config-archive': 'text/cloud-config-archive',
+}
+
+# Sorted longest first
+INCLUSION_SRCH = sorted(list(INCLUSION_TYPES_MAP.keys()),
+                        key=(lambda e: 0 - len(e)))
+
+
+class Handler(object):
+
+    __metaclass__ = abc.ABCMeta
+
+    def __init__(self, frequency, version=2):
+        self.handler_version = version
+        self.frequency = frequency
+
+    def __repr__(self):
+        return "%s: [%s]" % (util.obj_name(self), self.list_types())
+
+    @abc.abstractmethod
+    def list_types(self):
+        raise NotImplementedError()
+
+    def handle_part(self, data, ctype, filename, payload, frequency):
+        return self._handle_part(data, ctype, filename, payload, frequency)
+
+    @abc.abstractmethod
+    def _handle_part(self, data, ctype, filename, payload, frequency):
+        raise NotImplementedError()
+
+
+def run_part(mod, data, ctype, filename, payload, frequency):
+    mod_freq = mod.frequency
+    if not (mod_freq == PER_ALWAYS or
+            (frequency == PER_INSTANCE and mod_freq == PER_INSTANCE)):
+        return
+    mod_ver = mod.handler_version
+    try:
+        if mod_ver == 1:
+            mod.handle_part(data, ctype, filename, payload)
+        else:
+            mod.handle_part(data, ctype, filename, payload, frequency)
+    except:
+        util.logexc(LOG, ("Failed calling mod %s (%s, %s, %s)"
+                         " with frequency %s"), 
+                    mod, ctype, filename,
+                    mod_ver, frequency)
+
+
+def call_begin(mod, data, frequency):
+    run_part(mod, data, CONTENT_START, None, None, frequency)
+
+
+def call_end(mod, data, frequency):
+    run_part(mod, data, CONTENT_END, None, None, frequency)
+
+
+def walker_handle_handler(pdata, _ctype, _filename, payload):
+    curcount = pdata['handlercount']
+    modname = PART_HANDLER_FN_TMPL % (curcount)
+    frequency = pdata['frequency']
+    modfname = os.path.join(pdata['handlerdir'], "%s" % (modname))
+    if not modfname.endswith(".py"):
+        modfname = "%s.py" % (modfname)
+    # TODO: Check if path exists??
+    util.write_file(modfname, payload, 0600)
+    handlers = pdata['handlers']
+    try:
+        mod = fixup_handler(importer.import_module(modname))
+        handlers.register(mod)
+        call_begin(mod, pdata['data'], frequency)
+        pdata['handlercount'] = curcount + 1
+    except:
+        util.logexc(LOG, "Failed at registered python file: %s", modfname)
+
+
+def _extract_first_or_bytes(blob, size):
+    # Extract the first line upto X bytes or X bytes from more than the
+    # first line if the first line does not contain enough bytes
+    first_line = blob.split("\n", 1)[0]
+    if len(first_line) >= size:
+        start = first_line[:size]
+    else:
+        start = blob[0:size]
+    return start
+
+
+def walker_callback(pdata, ctype, filename, payload):
+    if ctype in PART_CONTENT_TYPES:
+        walker_handle_handler(pdata, ctype, filename, payload)
+        return
+    handlers = pdata['handlers']
+    if ctype not in handlers:
+        # Extract the first line or 24 bytes for displaying in the log
+        start = _extract_first_or_bytes(payload, 24)
+        details = "'%s...'" % (start.encode("string-escape"))
+        if ctype == NOT_MULTIPART_TYPE:
+            LOG.warning("Unhandled non-multipart (%s) userdata: %s",
+                        ctype, details)
+        else:
+            LOG.warning("Unhandled unknown content-type (%s) userdata: %s",
+                        ctype, details)
+    else:
+        run_part(handlers[ctype], pdata['data'], ctype, filename,
+                 payload, pdata['frequency'])
+
+
+# Callback is a function that will be called with 
+# (data, content_type, filename, payload)
+def walk(msg, callback, data):
+    partnum = 0
+    for part in msg.walk():
+        # multipart/* are just containers
+        if part.get_content_maintype() == 'multipart':
+            continue
+
+        ctype = part.get_content_type()
+        if ctype is None:
+            ctype = OCTET_TYPE
+
+        filename = part.get_filename()
+        if not filename:
+            filename = PART_FN_TPL % (partnum)
+
+        callback(data, ctype, filename, part.get_payload(decode=True))
+        partnum = partnum + 1
+
+
+def fixup_handler(mod, def_freq=PER_INSTANCE):
+    if not hasattr(mod, "handler_version"):
+        setattr(mod, "handler_version", 1)
+    if not hasattr(mod, 'list_types'):
+        def empty_types():
+            return []
+        setattr(mod, 'list_types', empty_types)
+    if not hasattr(mod, 'frequency'):
+        setattr(mod, 'frequency', def_freq)
+    else:
+        freq = mod.frequency
+        if freq and freq not in FREQUENCIES:
+            LOG.warn("Handler %s has an unknown frequency %s", mod, freq)
+    if not hasattr(mod, 'handle_part'):
+        def empty_handler(_data, _ctype, _filename, _payload):
+            pass
+        setattr(mod, 'handle_part', empty_handler)
+    return mod
+
+
+def type_from_starts_with(payload, default=None):
+    for text in INCLUSION_SRCH:
+        if payload.startswith(text):
+            return INCLUSION_TYPES_MAP[text]
+    return default
+
+
diff --git a/cloudinit/handlers/boot_hook.py b/cloudinit/handlers/boot_hook.py
index b3aab366..10f60b8d 100644
--- a/cloudinit/handlers/boot_hook.py
+++ b/cloudinit/handlers/boot_hook.py
@@ -22,8 +22,8 @@
 
 import os
 
+from cloudinit import handlers
 from cloudinit import log as logging
-from cloudinit import user_data as ud
 from cloudinit import util
 
 from cloudinit.settings import (PER_ALWAYS)
@@ -31,31 +31,34 @@ from cloudinit.settings import (PER_ALWAYS)
 LOG = logging.getLogger(__name__)
 
 
-class BootHookPartHandler(ud.PartHandler):
+class BootHookPartHandler(handlers.Handler):
     def __init__(self, paths, instance_id, **_kwargs):
-        ud.PartHandler.__init__(self, PER_ALWAYS)
+        handlers.Handler.__init__(self, PER_ALWAYS)
         self.boothook_dir = paths.get_ipath("boothooks")
         self.instance_id = instance_id
 
     def list_types(self):
         return [
-            ud.type_from_starts_with("#cloud-boothook"),
+            handlers.type_from_starts_with("#cloud-boothook"),
         ]
 
-    def _handle_part(self, _data, ctype, filename, payload, _frequency):
-        if ctype in ud.CONTENT_SIGNALS:
-            return
-
+    def _write_part(self, payload, filename):
         filename = util.clean_filename(filename)
         payload = util.dos2unix(payload)
         prefix = "#cloud-boothook"
         start = 0
         if payload.startswith(prefix):
             start = len(prefix) + 1
-
         filepath = os.path.join(self.boothook_dir, filename)
         contents = payload[start:]
         util.write_file(filepath, contents, 0700)
+        return filepath
+
+    def _handle_part(self, _data, ctype, filename, payload, _frequency):
+        if ctype in handlers.CONTENT_SIGNALS:
+            return
+
+        filepath = self._write_part(payload, filename)
         try:
             env = os.environ.copy()
             if self.instance_id:
diff --git a/cloudinit/handlers/cloud_config.py b/cloudinit/handlers/cloud_config.py
index 12d1bd96..f6d95244 100644
--- a/cloudinit/handlers/cloud_config.py
+++ b/cloudinit/handlers/cloud_config.py
@@ -20,8 +20,8 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+from cloudinit import handlers
 from cloudinit import log as logging
-from cloudinit import user_data as ud
 from cloudinit import util
 
 from cloudinit.settings import (PER_ALWAYS)
@@ -29,28 +29,34 @@ from cloudinit.settings import (PER_ALWAYS)
 LOG = logging.getLogger(__name__)
 
 
-class CloudConfigPartHandler(ud.PartHandler):
+class CloudConfigPartHandler(handlers.Handler):
     def __init__(self, paths, **_kwargs):
-        ud.PartHandler.__init__(self, PER_ALWAYS)
+        handlers.Handler.__init__(self, PER_ALWAYS)
         self.cloud_buf = []
         self.cloud_fn = paths.get_ipath("cloud_config")
 
     def list_types(self):
         return [
-            ud.type_from_starts_with("#cloud-config"),
+            handlers.type_from_starts_with("#cloud-config"),
         ]
 
+    def _write_cloud_config(self, buf):
+        if not self.cloud_fn:
+            return
+        lines = [str(b) for b in buf]
+        payload = "\n".join(lines)
+        util.write_file(self.cloud_fn, payload, 0600)
+
     def _handle_part(self, _data, ctype, filename, payload, _frequency):
-        if ctype == ud.CONTENT_START:
+        if ctype == handlers.CONTENT_START:
             self.cloud_buf = []
             return
-
-        if ctype == ud.CONTENT_END:
-            payload = "\n".join(self.cloud_buf)
-            util.write_file(self.cloud_fn, payload, 0600)
+        if ctype == handlers.CONTENT_END:
+            self._write_cloud_config(self.cloud_buf)
             self.cloud_buf = []
             return
 
         filename = util.clean_filename(filename)
-        entry = "\n".join(["#%s" % (filename), str(payload)])
-        self.cloud_buf.append(entry)
+        if not filename:
+            filename = '??'
+        self.cloud_buf.extend(["#%s" % (filename), str(payload)])
diff --git a/cloudinit/handlers/shell_script.py b/cloudinit/handlers/shell_script.py
index f6e2ef16..a9d8e544 100644
--- a/cloudinit/handlers/shell_script.py
+++ b/cloudinit/handlers/shell_script.py
@@ -22,8 +22,8 @@
 
 import os
 
+from cloudinit import handlers
 from cloudinit import log as logging
-from cloudinit import user_data as ud
 from cloudinit import util
 
 from cloudinit.settings import (PER_ALWAYS)
@@ -31,18 +31,18 @@ from cloudinit.settings import (PER_ALWAYS)
 LOG = logging.getLogger(__name__)
 
 
-class ShellScriptPartHandler(ud.PartHandler):
+class ShellScriptPartHandler(handlers.Handler):
     def __init__(self, paths, **_kwargs):
-        ud.PartHandler.__init__(self, PER_ALWAYS)
+        handlers.Handler.__init__(self, PER_ALWAYS)
         self.script_dir = paths.get_ipath_cur('scripts')
 
     def list_types(self):
         return [
-            ud.type_from_starts_with("#!"),
+            handlers.type_from_starts_with("#!"),
         ]
 
     def _handle_part(self, _data, ctype, filename, payload, _frequency):
-        if ctype in ud.CONTENT_SIGNALS:
+        if ctype in handlers.CONTENT_SIGNALS:
             # TODO: maybe delete existing things here
             return
 
diff --git a/cloudinit/handlers/upstart_job.py b/cloudinit/handlers/upstart_job.py
index 059a4851..411a5d68 100644
--- a/cloudinit/handlers/upstart_job.py
+++ b/cloudinit/handlers/upstart_job.py
@@ -23,8 +23,8 @@
 
 import os
 
+from cloudinit import handlers
 from cloudinit import log as logging
-from cloudinit import user_data as ud
 from cloudinit import util
 
 from cloudinit.settings import (PER_INSTANCE)
@@ -32,18 +32,18 @@ from cloudinit.settings import (PER_INSTANCE)
 LOG = logging.getLogger(__name__)
 
 
-class UpstartJobPartHandler(ud.PartHandler):
+class UpstartJobPartHandler(handlers.Handler):
     def __init__(self, paths, **_kwargs):
-        ud.PartHandler.__init__(self, PER_INSTANCE)
+        handlers.Handler.__init__(self, PER_INSTANCE)
         self.upstart_dir = paths.upstart_conf_d
 
     def list_types(self):
         return [
-            ud.type_from_starts_with("#upstart-job"),
+            handlers.type_from_starts_with("#upstart-job"),
         ]
 
     def _handle_part(self, _data, ctype, filename, payload, frequency):
-        if ctype in ud.CONTENT_SIGNALS:
+        if ctype in handlers.CONTENT_SIGNALS:
             return
 
         if not self.upstart_dir:

From ba71b016b3e1972e0ef05f557c92ded52b79096e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 10:56:41 -0700
Subject: [PATCH 147/434] Move the helper functions for handlers to the handler
 __init__ instead of being in here.

This module will now just contain user data parsing, leaving the running of handlers to happen elsewhere.
---
 cloudinit/user_data.py | 196 +++--------------------------------------
 1 file changed, 10 insertions(+), 186 deletions(-)

diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index 28c9f2ce..2f01579a 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -20,7 +20,6 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import abc
 import os
 
 import email
@@ -28,56 +27,24 @@ from email.mime.multipart import MIMEMultipart
 from email.mime.text import MIMEText
 from email.mime.base import MIMEBase
 
-from cloudinit import importer
+from cloudinit import handlers
 from cloudinit import log as logging
 from cloudinit import url_helper
 from cloudinit import util
 
-from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE, FREQUENCIES)
-
 LOG = logging.getLogger(__name__)
 
-# Special content types that signal the start and end of processing
-CONTENT_END = "__end__"
-CONTENT_START = "__begin__"
-CONTENT_SIGNALS = [CONTENT_START, CONTENT_END]
+# Constants copied in from the handler module
+NOT_MULTIPART_TYPE = handlers.NOT_MULTIPART_TYPE
+PART_FN_TPL = handlers.PART_FN_TPL
+OCTET_TYPE = handlers.OCTET_TYPE
 
-# Used when a part-handler type is encountered
-# to allow for registration of new types.
-PART_CONTENT_TYPES = ["text/part-handler"]
-PART_HANDLER_FN_TMPL = 'part-handler-%03d'
-
-# For parts without filenames
-PART_FN_TPL = 'part-%03d'
-
-# Used as the content type when a message is not multipart
-# and it doesn't contain its own content-type
-NOT_MULTIPART_TYPE = "text/x-not-multipart"
-OCTET_TYPE = 'application/octet-stream'
-
-# Different file beginnings to there content type
-INCLUSION_TYPES_MAP = {
-    '#include': 'text/x-include-url',
-    '#include-once': 'text/x-include-once-url',
-    '#!': 'text/x-shellscript',
-    '#cloud-config': 'text/cloud-config',
-    '#upstart-job': 'text/upstart-job',
-    '#part-handler': 'text/part-handler',
-    '#cloud-boothook': 'text/cloud-boothook',
-    '#cloud-config-archive': 'text/cloud-config-archive',
-}
-
-# Sorted longest first
-INCLUSION_SRCH = sorted(list(INCLUSION_TYPES_MAP.keys()),
-                        key=(lambda e: 0 - len(e)))
-
-# Various special content types
+# Various special content types that cause special actions
 TYPE_NEEDED = ["text/plain", "text/x-not-multipart"]
 INCLUDE_TYPES = ['text/x-include-url', 'text/x-include-once-url']
 ARCHIVE_TYPES = ["text/cloud-config-archive"]
 UNDEF_TYPE = "text/plain"
 ARCHIVE_UNDEF_TYPE = "text/cloud-config"
-OCTET_TYPE = 'application/octet-stream'
 
 # Msg header used to track attachments
 ATTACHMENT_FIELD = 'Number-Attachments'
@@ -107,7 +74,7 @@ class UserDataProcessor(object):
                 ctype_orig = UNDEF_TYPE
     
             if ctype_orig in TYPE_NEEDED:
-                ctype = type_from_starts_with(payload)
+                ctype = handlers.type_from_starts_with(payload)
     
             if ctype is None:
                 ctype = ctype_orig
@@ -181,7 +148,8 @@ class UserDataProcessor(object):
             content = ent.get('content', '')
             mtype = ent.get('type')
             if not mtype:
-                mtype = type_from_starts_with(content, ARCHIVE_UNDEF_TYPE)
+                mtype = handlers.type_from_starts_with(content,
+                                                       ARCHIVE_UNDEF_TYPE)
 
             maintype, subtype = mtype.split('/', 1)
             if maintype == "text":
@@ -232,146 +200,6 @@ class UserDataProcessor(object):
         self._multi_part_count(outer_msg, cur + 1)
 
 
-class PartHandler(object):
-
-    __metaclass__ = abc.ABCMeta
-
-    def __init__(self, frequency, version=2):
-        self.handler_version = version
-        self.frequency = frequency
-
-    def __repr__(self):
-        return "%s: [%s]" % (util.obj_name(self), self.list_types())
-
-    @abc.abstractmethod
-    def list_types(self):
-        raise NotImplementedError()
-
-    def handle_part(self, data, ctype, filename, payload, frequency):
-        return self._handle_part(data, ctype, filename, payload, frequency)
-
-    @abc.abstractmethod
-    def _handle_part(self, data, ctype, filename, payload, frequency):
-        raise NotImplementedError()
-
-
-def fixup_handler(mod, def_freq=PER_INSTANCE):
-    if not hasattr(mod, "handler_version"):
-        setattr(mod, "handler_version", 1)
-    if not hasattr(mod, 'list_types'):
-        def empty_types():
-            return []
-        setattr(mod, 'list_types', empty_types)
-    if not hasattr(mod, 'frequency'):
-        setattr(mod, 'frequency', def_freq)
-    else:
-        freq = mod.frequency
-        if freq and freq not in FREQUENCIES:
-            LOG.warn("Module %s has an unknown frequency %s", mod, freq)
-    if not hasattr(mod, 'handle_part'):
-        def empty_handler(_data, _ctype, _filename, _payload):
-            pass
-        setattr(mod, 'handle_part', empty_handler)
-    return mod
-
-
-def run_part(mod, data, ctype, filename, payload, frequency):
-    mod_freq = mod.frequency
-    if not (mod_freq == PER_ALWAYS or
-            (frequency == PER_INSTANCE and mod_freq == PER_INSTANCE)):
-        return
-    mod_ver = mod.handler_version
-    try:
-        if mod_ver == 1:
-            mod.handle_part(data, ctype, filename, payload)
-        else:
-            mod.handle_part(data, ctype, filename, payload, frequency)
-    except:
-        util.logexc(LOG, ("Failed calling mod %s (%s, %s, %s)"
-                         " with frequency %s"), 
-                    mod, ctype, filename,
-                    mod_ver, frequency)
-
-
-def call_begin(mod, data, frequency):
-    run_part(mod, data, CONTENT_START, None, None, frequency)
-
-
-def call_end(mod, data, frequency):
-    run_part(mod, data, CONTENT_END, None, None, frequency)
-
-
-def walker_handle_handler(pdata, _ctype, _filename, payload):
-    curcount = pdata['handlercount']
-    modname = PART_HANDLER_FN_TMPL % (curcount)
-    frequency = pdata['frequency']
-    modfname = os.path.join(pdata['handlerdir'], "%s" % (modname))
-    if not modfname.endswith(".py"):
-        modfname = "%s.py" % (modfname)
-    # TODO: Check if path exists??
-    util.write_file(modfname, payload, 0600)
-    handlers = pdata['handlers']
-    try:
-        mod = fixup_handler(importer.import_module(modname))
-        handlers.register(mod)
-        call_begin(mod, pdata['data'], frequency)
-        pdata['handlercount'] = curcount + 1
-    except:
-        util.logexc(LOG, "Failed at registered python file: %s", modfname)
-
-
-def extract_first_or_bytes(blob, size):
-    # Extract the first line upto X bytes or X bytes from more than the
-    # first line if the first line does not contain enough bytes
-    first_line = blob.split("\n", 1)[0]
-    if len(first_line) >= size:
-        start = first_line[:size]
-    else:
-        start = blob[0:size]
-    return start
-
-
-def walker_callback(pdata, ctype, filename, payload):
-    if ctype in PART_CONTENT_TYPES:
-        walker_handle_handler(pdata, ctype, filename, payload)
-        return
-    handlers = pdata['handlers']
-    if ctype not in handlers:
-        # Extract the first line or 24 bytes for displaying in the log
-        start = extract_first_or_bytes(payload, 24)
-        details = "'%s...'" % (start.encode("string-escape"))
-        if ctype == NOT_MULTIPART_TYPE:
-            LOG.warning("Unhandled non-multipart (%s) userdata: %s",
-                        ctype, details)
-        else:
-            LOG.warning("Unhandled unknown content-type (%s) userdata: %s",
-                        ctype, details)
-    else:
-        run_part(handlers[ctype], pdata['data'], ctype, filename,
-                 payload, pdata['frequency'])
-
-
-# Callback is a function that will be called with 
-# (data, content_type, filename, payload)
-def walk(msg, callback, data):
-    partnum = 0
-    for part in msg.walk():
-        # multipart/* are just containers
-        if part.get_content_maintype() == 'multipart':
-            continue
-
-        ctype = part.get_content_type()
-        if ctype is None:
-            ctype = OCTET_TYPE
-
-        filename = part.get_filename()
-        if not filename:
-            filename = PART_FN_TPL % (partnum)
-
-        callback(data, ctype, filename, part.get_payload(decode=True))
-        partnum = partnum + 1
-
-
 # Coverts a raw string into a mime message
 def convert_string(raw_data, headers=None):
     if not raw_data:
@@ -394,9 +222,5 @@ def convert_string(raw_data, headers=None):
     return msg
 
 
-def type_from_starts_with(payload, default=None):
-    for text in INCLUSION_SRCH:
-        if payload.startswith(text):
-            return INCLUSION_TYPES_MAP[text]
-    return default
+
 

From 33ea9e3bb2344d304d668a4b238388f93c8cce66 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 10:57:28 -0700
Subject: [PATCH 148/434] Allow the user data processor to be passed in.

This could and should be useful for unit testing.
---
 cloudinit/sources/__init__.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 46350255..5842d41b 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -42,7 +42,7 @@ class DataSource(object):
 
     __metaclass__ = abc.ABCMeta
 
-    def __init__(self, sys_cfg, distro, paths):
+    def __init__(self, sys_cfg, distro, paths, ud_proc=None):
         self.sys_cfg = sys_cfg
         self.distro = distro
         self.paths = paths
@@ -54,11 +54,15 @@ class DataSource(object):
             name = name[DS_PREFIX:]
         self.ds_cfg = util.get_cfg_by_path(self.sys_cfg,
                                           ("datasource", name), {})
+        if not ud_proc:
+            self.ud_proc = ud.UserDataProcessor(self.paths)
+        else:
+            self.ud_proc = ud_proc
 
     def get_userdata(self):
         if self.userdata is None:
             raw_data = self.get_userdata_raw()
-            self.userdata = ud.UserDataProcessor(self.paths).process(raw_data)
+            self.userdata = self.ud_proc.process(raw_data)
         return self.userdata
 
     def get_userdata_raw(self):

From c075baf0c4ec72ec8fc77c4d82cebe55f2fffddd Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 10:57:52 -0700
Subject: [PATCH 149/434] Add a restricted set of characters which can be used
 in filenames when cleaning them.

---
 cloudinit/util.py | 10 +++++++++-
 1 file changed, 9 insertions(+), 1 deletion(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index ed12dada..6e8ce96e 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -64,6 +64,7 @@ LOG = logging.getLogger(__name__)
 FN_REPLACEMENTS = {
     os.sep: '_',
 }
+FN_ALLOWED = ('_-.()' + string.digits + string.ascii_letters)
 
 # Helper utils to see if running in a container
 CONTAINER_TESTS = ['running-in-container', 'lxc-is-container']
@@ -227,7 +228,14 @@ def read_conf(fname):
 def clean_filename(fn):
     for (k, v) in FN_REPLACEMENTS.iteritems():
         fn = fn.replace(k, v)
-    return fn.strip()
+    removals = []
+    for k in fn:
+        if k not in FN_ALLOWED:
+            removals.append(k)
+    for k in removals:
+        fn = fn.replace(k, '')
+    fn = fn.strip()
+    return fn
 
 
 def decomp_str(data):

From 67b5de190343776dc7f850042045485acc0e1f13 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 10:58:30 -0700
Subject: [PATCH 150/434] After moving items to handlers/__init__, update the
 references to them here.

---
 cloudinit/stages.py | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 5dc289ea..9d8ff2bb 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -34,6 +34,7 @@ except ImportError:
 from cloudinit.settings import (OLD_CLOUD_CONFIG)
 from cloudinit.settings import (PER_INSTANCE, FREQUENCIES)
 
+from cloudinit import handlers
 from cloudinit.handlers import boot_hook as bh_part
 from cloudinit.handlers import cloud_config as cc_part
 from cloudinit.handlers import shell_script as ss_part
@@ -46,7 +47,6 @@ from cloudinit import importer
 from cloudinit import log as logging
 from cloudinit import sources
 from cloudinit import transforms
-from cloudinit import user_data as ud
 from cloudinit import util
 
 LOG = logging.getLogger(__name__)
@@ -319,7 +319,7 @@ class Init(object):
         potential_handlers = util.find_modules(cdir)
         for (fname, modname) in potential_handlers.iteritems():
             try:
-                mod = ud.fixup_handler(importer.import_module(modname))
+                mod = handlers.fixup_handler(importer.import_module(modname))
                 types = c_handlers.register(mod)
                 LOG.debug("Added handler for %s from %s", types, fname)
             except:
@@ -338,7 +338,7 @@ class Init(object):
         for (_ctype, mod) in c_handlers.iteritems():
             if mod in called:
                 continue
-            ud.call_begin(mod, data, frequency)
+            handlers.call_begin(mod, data, frequency)
             called.append(mod)
 
         # Walk the user data
@@ -352,14 +352,14 @@ class Init(object):
             # names...
             'handlercount': 0,
         }
-        ud.walk(ud_obj, ud.walker_callback, data=part_data)
+        handlers.walk(ud_obj, handlers.walker_callback, data=part_data)
 
         # Give callbacks opportunity to finalize
         called = []
         for (_ctype, mod) in c_handlers.iteritems():
             if mod in called:
                 continue
-            ud.call_end(mod, data, frequency)
+            handlers.call_end(mod, data, frequency)
             called.append(mod)
 
 
@@ -481,7 +481,7 @@ class Transforms(object):
                 run_name = "config-%s" % (name)
                 c_cloud.run(run_name, mod.handle, func_args, freq=freq)
             except Exception as e:
-                util.logexc(LOG, "Running %s failed", mod)
+                util.logexc(LOG, "Running %s (%s) failed", name, mod)
                 failures.append((name, e))
         return failures
 

From 5ec7c412ed88f957e20b7f0d4ac82a03a8756a90 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 12:02:21 -0700
Subject: [PATCH 151/434] Correct the mount command to pass its options as a
 single comma-separated list (if any are provided/selected)

---
 cloudinit/util.py | 15 +++++++++++----
 1 file changed, 11 insertions(+), 4 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 6e8ce96e..38ca9573 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -1090,7 +1090,7 @@ def mounts():
     return mounted
 
 
-def mount_cb(device, callback, data=None, rw=False, mtype=None):
+def mount_cb(device, callback, data=None, rw=False, mtype=None, sync=True):
     """
     Mount the device, call method 'callback' passing the directory
     in which it was mounted, then unmount.  Return whatever 'callback'
@@ -1103,11 +1103,18 @@ def mount_cb(device, callback, data=None, rw=False, mtype=None):
             mountpoint = "%s/" % mounted[device]['mountpoint']
         else:
             try:
-                mountcmd = ['mount', "-o"]
+                mountcmd = ['mount']
+                mountopts = []
                 if rw:
-                    mountcmd.append('rw')
+                    mountopts.append('rw')
                 else:
-                    mountcmd.append('ro')
+                    mountopts.append('ro')
+                if sync:
+                    # This seems like the safe approach to do
+                    # (where this is on by default)
+                    mountopts.append("sync")
+                if mountopts:
+                    mountcmd.extend(["-o", ",".join(mountopts)])
                 if mtype:
                     mountcmd.extend(['-t', mtype])
                 mountcmd.append(device)

From 57fe8cadc1bdda5b0e5f4d61abce0996c3984373 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 12:14:54 -0700
Subject: [PATCH 152/434] Remove the need to have transforms start with "cc_".

1. Just let them have no prefix (ie blank) unless this isn't wanted later.
---
 cloudinit/transforms/__init__.py                                | 2 +-
 .../transforms/{cc_apt_pipelining.py => apt_pipelining.py}      | 0
 .../{cc_apt_update_upgrade.py => apt_update_upgrade.py}         | 0
 cloudinit/transforms/{cc_bootcmd.py => bootcmd.py}              | 0
 cloudinit/transforms/{cc_byobu.py => byobu.py}                  | 0
 cloudinit/transforms/{cc_ca_certs.py => ca_certs.py}            | 0
 cloudinit/transforms/{cc_chef.py => chef.py}                    | 0
 .../{cc_disable_ec2_metadata.py => disable_ec2_metadata.py}     | 0
 cloudinit/transforms/{cc_final_message.py => final_message.py}  | 0
 cloudinit/transforms/{cc_foo.py => foo.py}                      | 0
 cloudinit/transforms/{cc_grub_dpkg.py => grub_dpkg.py}          | 0
 .../transforms/{cc_keys_to_console.py => keys_to_console.py}    | 0
 cloudinit/transforms/{cc_landscape.py => landscape.py}          | 0
 cloudinit/transforms/{cc_locale.py => locale.py}                | 0
 cloudinit/transforms/{cc_mcollective.py => mcollective.py}      | 0
 cloudinit/transforms/{cc_mounts.py => mounts.py}                | 0
 cloudinit/transforms/{cc_phone_home.py => phone_home.py}        | 0
 cloudinit/transforms/{cc_puppet.py => puppet.py}                | 0
 cloudinit/transforms/{cc_resizefs.py => resizefs.py}            | 0
 .../{cc_rightscale_userdata.py => rightscale_userdata.py}       | 0
 cloudinit/transforms/{cc_rsyslog.py => rsyslog.py}              | 0
 cloudinit/transforms/{cc_runcmd.py => runcmd.py}                | 0
 cloudinit/transforms/{cc_salt_minion.py => salt_minion.py}      | 0
 .../transforms/{cc_scripts_per_boot.py => scripts_per_boot.py}  | 0
 .../{cc_scripts_per_instance.py => scripts_per_instance.py}     | 0
 .../transforms/{cc_scripts_per_once.py => scripts_per_once.py}  | 0
 cloudinit/transforms/{cc_scripts_user.py => scripts_user.py}    | 0
 cloudinit/transforms/{cc_set_hostname.py => set_hostname.py}    | 0
 cloudinit/transforms/{cc_set_passwords.py => set_passwords.py}  | 0
 cloudinit/transforms/{cc_ssh.py => ssh.py}                      | 0
 cloudinit/transforms/{cc_ssh_import_id.py => ssh_import_id.py}  | 0
 cloudinit/transforms/{cc_timezone.py => timezone.py}            | 0
 .../transforms/{cc_update_etc_hosts.py => update_etc_hosts.py}  | 0
 .../transforms/{cc_update_hostname.py => update_hostname.py}    | 0
 cloudinit/transforms/{cc_welcome.py => welcome.py}              | 0
 35 files changed, 1 insertion(+), 1 deletion(-)
 rename cloudinit/transforms/{cc_apt_pipelining.py => apt_pipelining.py} (100%)
 rename cloudinit/transforms/{cc_apt_update_upgrade.py => apt_update_upgrade.py} (100%)
 rename cloudinit/transforms/{cc_bootcmd.py => bootcmd.py} (100%)
 rename cloudinit/transforms/{cc_byobu.py => byobu.py} (100%)
 rename cloudinit/transforms/{cc_ca_certs.py => ca_certs.py} (100%)
 rename cloudinit/transforms/{cc_chef.py => chef.py} (100%)
 rename cloudinit/transforms/{cc_disable_ec2_metadata.py => disable_ec2_metadata.py} (100%)
 rename cloudinit/transforms/{cc_final_message.py => final_message.py} (100%)
 rename cloudinit/transforms/{cc_foo.py => foo.py} (100%)
 rename cloudinit/transforms/{cc_grub_dpkg.py => grub_dpkg.py} (100%)
 rename cloudinit/transforms/{cc_keys_to_console.py => keys_to_console.py} (100%)
 rename cloudinit/transforms/{cc_landscape.py => landscape.py} (100%)
 rename cloudinit/transforms/{cc_locale.py => locale.py} (100%)
 rename cloudinit/transforms/{cc_mcollective.py => mcollective.py} (100%)
 rename cloudinit/transforms/{cc_mounts.py => mounts.py} (100%)
 rename cloudinit/transforms/{cc_phone_home.py => phone_home.py} (100%)
 rename cloudinit/transforms/{cc_puppet.py => puppet.py} (100%)
 rename cloudinit/transforms/{cc_resizefs.py => resizefs.py} (100%)
 rename cloudinit/transforms/{cc_rightscale_userdata.py => rightscale_userdata.py} (100%)
 rename cloudinit/transforms/{cc_rsyslog.py => rsyslog.py} (100%)
 rename cloudinit/transforms/{cc_runcmd.py => runcmd.py} (100%)
 rename cloudinit/transforms/{cc_salt_minion.py => salt_minion.py} (100%)
 rename cloudinit/transforms/{cc_scripts_per_boot.py => scripts_per_boot.py} (100%)
 rename cloudinit/transforms/{cc_scripts_per_instance.py => scripts_per_instance.py} (100%)
 rename cloudinit/transforms/{cc_scripts_per_once.py => scripts_per_once.py} (100%)
 rename cloudinit/transforms/{cc_scripts_user.py => scripts_user.py} (100%)
 rename cloudinit/transforms/{cc_set_hostname.py => set_hostname.py} (100%)
 rename cloudinit/transforms/{cc_set_passwords.py => set_passwords.py} (100%)
 rename cloudinit/transforms/{cc_ssh.py => ssh.py} (100%)
 rename cloudinit/transforms/{cc_ssh_import_id.py => ssh_import_id.py} (100%)
 rename cloudinit/transforms/{cc_timezone.py => timezone.py} (100%)
 rename cloudinit/transforms/{cc_update_etc_hosts.py => update_etc_hosts.py} (100%)
 rename cloudinit/transforms/{cc_update_hostname.py => update_hostname.py} (100%)
 rename cloudinit/transforms/{cc_welcome.py => welcome.py} (100%)

diff --git a/cloudinit/transforms/__init__.py b/cloudinit/transforms/__init__.py
index 391a916e..925cf569 100644
--- a/cloudinit/transforms/__init__.py
+++ b/cloudinit/transforms/__init__.py
@@ -26,7 +26,7 @@ from cloudinit import log as logging
 LOG = logging.getLogger(__name__)
 
 # TODO remove this from being a prefix??
-TRANSFORM_PREFIX = "cc_"
+TRANSFORM_PREFIX = ''  # "cc_"
 
 
 def form_transform_name(name):
diff --git a/cloudinit/transforms/cc_apt_pipelining.py b/cloudinit/transforms/apt_pipelining.py
similarity index 100%
rename from cloudinit/transforms/cc_apt_pipelining.py
rename to cloudinit/transforms/apt_pipelining.py
diff --git a/cloudinit/transforms/cc_apt_update_upgrade.py b/cloudinit/transforms/apt_update_upgrade.py
similarity index 100%
rename from cloudinit/transforms/cc_apt_update_upgrade.py
rename to cloudinit/transforms/apt_update_upgrade.py
diff --git a/cloudinit/transforms/cc_bootcmd.py b/cloudinit/transforms/bootcmd.py
similarity index 100%
rename from cloudinit/transforms/cc_bootcmd.py
rename to cloudinit/transforms/bootcmd.py
diff --git a/cloudinit/transforms/cc_byobu.py b/cloudinit/transforms/byobu.py
similarity index 100%
rename from cloudinit/transforms/cc_byobu.py
rename to cloudinit/transforms/byobu.py
diff --git a/cloudinit/transforms/cc_ca_certs.py b/cloudinit/transforms/ca_certs.py
similarity index 100%
rename from cloudinit/transforms/cc_ca_certs.py
rename to cloudinit/transforms/ca_certs.py
diff --git a/cloudinit/transforms/cc_chef.py b/cloudinit/transforms/chef.py
similarity index 100%
rename from cloudinit/transforms/cc_chef.py
rename to cloudinit/transforms/chef.py
diff --git a/cloudinit/transforms/cc_disable_ec2_metadata.py b/cloudinit/transforms/disable_ec2_metadata.py
similarity index 100%
rename from cloudinit/transforms/cc_disable_ec2_metadata.py
rename to cloudinit/transforms/disable_ec2_metadata.py
diff --git a/cloudinit/transforms/cc_final_message.py b/cloudinit/transforms/final_message.py
similarity index 100%
rename from cloudinit/transforms/cc_final_message.py
rename to cloudinit/transforms/final_message.py
diff --git a/cloudinit/transforms/cc_foo.py b/cloudinit/transforms/foo.py
similarity index 100%
rename from cloudinit/transforms/cc_foo.py
rename to cloudinit/transforms/foo.py
diff --git a/cloudinit/transforms/cc_grub_dpkg.py b/cloudinit/transforms/grub_dpkg.py
similarity index 100%
rename from cloudinit/transforms/cc_grub_dpkg.py
rename to cloudinit/transforms/grub_dpkg.py
diff --git a/cloudinit/transforms/cc_keys_to_console.py b/cloudinit/transforms/keys_to_console.py
similarity index 100%
rename from cloudinit/transforms/cc_keys_to_console.py
rename to cloudinit/transforms/keys_to_console.py
diff --git a/cloudinit/transforms/cc_landscape.py b/cloudinit/transforms/landscape.py
similarity index 100%
rename from cloudinit/transforms/cc_landscape.py
rename to cloudinit/transforms/landscape.py
diff --git a/cloudinit/transforms/cc_locale.py b/cloudinit/transforms/locale.py
similarity index 100%
rename from cloudinit/transforms/cc_locale.py
rename to cloudinit/transforms/locale.py
diff --git a/cloudinit/transforms/cc_mcollective.py b/cloudinit/transforms/mcollective.py
similarity index 100%
rename from cloudinit/transforms/cc_mcollective.py
rename to cloudinit/transforms/mcollective.py
diff --git a/cloudinit/transforms/cc_mounts.py b/cloudinit/transforms/mounts.py
similarity index 100%
rename from cloudinit/transforms/cc_mounts.py
rename to cloudinit/transforms/mounts.py
diff --git a/cloudinit/transforms/cc_phone_home.py b/cloudinit/transforms/phone_home.py
similarity index 100%
rename from cloudinit/transforms/cc_phone_home.py
rename to cloudinit/transforms/phone_home.py
diff --git a/cloudinit/transforms/cc_puppet.py b/cloudinit/transforms/puppet.py
similarity index 100%
rename from cloudinit/transforms/cc_puppet.py
rename to cloudinit/transforms/puppet.py
diff --git a/cloudinit/transforms/cc_resizefs.py b/cloudinit/transforms/resizefs.py
similarity index 100%
rename from cloudinit/transforms/cc_resizefs.py
rename to cloudinit/transforms/resizefs.py
diff --git a/cloudinit/transforms/cc_rightscale_userdata.py b/cloudinit/transforms/rightscale_userdata.py
similarity index 100%
rename from cloudinit/transforms/cc_rightscale_userdata.py
rename to cloudinit/transforms/rightscale_userdata.py
diff --git a/cloudinit/transforms/cc_rsyslog.py b/cloudinit/transforms/rsyslog.py
similarity index 100%
rename from cloudinit/transforms/cc_rsyslog.py
rename to cloudinit/transforms/rsyslog.py
diff --git a/cloudinit/transforms/cc_runcmd.py b/cloudinit/transforms/runcmd.py
similarity index 100%
rename from cloudinit/transforms/cc_runcmd.py
rename to cloudinit/transforms/runcmd.py
diff --git a/cloudinit/transforms/cc_salt_minion.py b/cloudinit/transforms/salt_minion.py
similarity index 100%
rename from cloudinit/transforms/cc_salt_minion.py
rename to cloudinit/transforms/salt_minion.py
diff --git a/cloudinit/transforms/cc_scripts_per_boot.py b/cloudinit/transforms/scripts_per_boot.py
similarity index 100%
rename from cloudinit/transforms/cc_scripts_per_boot.py
rename to cloudinit/transforms/scripts_per_boot.py
diff --git a/cloudinit/transforms/cc_scripts_per_instance.py b/cloudinit/transforms/scripts_per_instance.py
similarity index 100%
rename from cloudinit/transforms/cc_scripts_per_instance.py
rename to cloudinit/transforms/scripts_per_instance.py
diff --git a/cloudinit/transforms/cc_scripts_per_once.py b/cloudinit/transforms/scripts_per_once.py
similarity index 100%
rename from cloudinit/transforms/cc_scripts_per_once.py
rename to cloudinit/transforms/scripts_per_once.py
diff --git a/cloudinit/transforms/cc_scripts_user.py b/cloudinit/transforms/scripts_user.py
similarity index 100%
rename from cloudinit/transforms/cc_scripts_user.py
rename to cloudinit/transforms/scripts_user.py
diff --git a/cloudinit/transforms/cc_set_hostname.py b/cloudinit/transforms/set_hostname.py
similarity index 100%
rename from cloudinit/transforms/cc_set_hostname.py
rename to cloudinit/transforms/set_hostname.py
diff --git a/cloudinit/transforms/cc_set_passwords.py b/cloudinit/transforms/set_passwords.py
similarity index 100%
rename from cloudinit/transforms/cc_set_passwords.py
rename to cloudinit/transforms/set_passwords.py
diff --git a/cloudinit/transforms/cc_ssh.py b/cloudinit/transforms/ssh.py
similarity index 100%
rename from cloudinit/transforms/cc_ssh.py
rename to cloudinit/transforms/ssh.py
diff --git a/cloudinit/transforms/cc_ssh_import_id.py b/cloudinit/transforms/ssh_import_id.py
similarity index 100%
rename from cloudinit/transforms/cc_ssh_import_id.py
rename to cloudinit/transforms/ssh_import_id.py
diff --git a/cloudinit/transforms/cc_timezone.py b/cloudinit/transforms/timezone.py
similarity index 100%
rename from cloudinit/transforms/cc_timezone.py
rename to cloudinit/transforms/timezone.py
diff --git a/cloudinit/transforms/cc_update_etc_hosts.py b/cloudinit/transforms/update_etc_hosts.py
similarity index 100%
rename from cloudinit/transforms/cc_update_etc_hosts.py
rename to cloudinit/transforms/update_etc_hosts.py
diff --git a/cloudinit/transforms/cc_update_hostname.py b/cloudinit/transforms/update_hostname.py
similarity index 100%
rename from cloudinit/transforms/cc_update_hostname.py
rename to cloudinit/transforms/update_hostname.py
diff --git a/cloudinit/transforms/cc_welcome.py b/cloudinit/transforms/welcome.py
similarity index 100%
rename from cloudinit/transforms/cc_welcome.py
rename to cloudinit/transforms/welcome.py

From 8346507b13a9ea9ecf171d22aaeda9b048a8257b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 12:33:31 -0700
Subject: [PATCH 153/434] Have the top level distro class take paths instead of
 a runner. This allows the following:

1. The ubuntu subclass can construct its own runner with those paths (since not every subclass may want one)

Adjust the base class + subclass to reflect this, adjust stages as well to reflect the constructor changes.
---
 cloudinit/distros/__init__.py |  4 ++--
 cloudinit/distros/ubuntu.py   |  8 ++++++++
 cloudinit/stages.py           | 12 +++++-------
 3 files changed, 15 insertions(+), 9 deletions(-)

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index e85e702e..0ee7f06b 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -42,8 +42,8 @@ class Distro(object):
 
     __metaclass__ = abc.ABCMeta
 
-    def __init__(self, name, cfg, runner):
-        self._runner = runner
+    def __init__(self, name, cfg, paths):
+        self._paths = paths
         self._cfg = cfg
         self.name = name
 
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index ad12400a..9b743b55 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -23,6 +23,7 @@
 import os
 
 from cloudinit import distros
+from cloudinit import helpers
 from cloudinit import log as logging
 from cloudinit import util
 
@@ -33,6 +34,13 @@ LOG = logging.getLogger(__name__)
 
 class Distro(distros.Distro):
 
+    def __init__(self, name, cfg, paths):
+        distros.Distro.__init__(self, name, cfg, paths)
+        # This will be used to restrict certain 
+        # calls from repeatly happening (when they
+        # should only happen say once per instance...)
+        self._runner = helpers.Runners(paths)
+    
     def install_packages(self, pkglist):
         self._update_package_sources()
         self._apt_get('install', pkglist)
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 9d8ff2bb..8fa9d6d3 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -77,13 +77,11 @@ class Init(object):
     def distro(self):
         if not self._distro:
             # Try to find the right class to use
-            d_cfg = self._extract_cfg('system')
-            distro_name = d_cfg.pop('distro', 'ubuntu')
-            distro_cls = distros.fetch(distro_name)
-            LOG.debug("Using distro class %s", distro_cls)
-            distro = distro_cls(distro_name, d_cfg,
-                                helpers.Runners(self.paths))
-            self._distro = distro
+            scfg = self._extract_cfg('system')
+            name = scfg.pop('distro', 'ubuntu')
+            cls = distros.fetch(name)
+            LOG.debug("Using distro class %s", cls)
+            self._distro = cls(name, scfg, self.paths)
         return self._distro
 
     @property

From 7e6fc978bc12fd67ea322de1d8ef0bd468c6a20a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 12:34:33 -0700
Subject: [PATCH 154/434] Add comment as to why we need to check for none/empty
 later when fetching an ipath.

---
 cloudinit/helpers.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 76faa1d5..e5c45632 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -128,6 +128,11 @@ class Runners(object):
             return None
         sem_path = None
         if freq == PER_INSTANCE:
+            # This may not exist,
+            # so thats why we still check for none
+            # below if say the paths object
+            # doesn't have a datasource that can
+            # provide this instance path...
             sem_path = self.paths.get_ipath("sem")
         elif freq == PER_ONCE:
             sem_path = self.paths.get_cpath("sem")

From 81c791d7c00476b1e5967ec5024f30c3a58365c7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 12:40:58 -0700
Subject: [PATCH 155/434] If bringing interfaces up, return the result of the
 bring-up action; otherwise return False.

---
 cloudinit/distros/__init__.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index 0ee7f06b..79d441ac 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -80,7 +80,8 @@ class Distro(object):
         self._write_network(settings)
         # Now try to bring them up
         if bring_up:
-            self._interface_action('up')
+            return self._interface_action('up')
+        return False
 
     @abc.abstractmethod
     def set_timezone(self, tz):

From 65f978c3246eff6f276be8de8b80533e75dbbfc6 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 12:51:43 -0700
Subject: [PATCH 156/434] Update the cloud init requirements with comments as
 to why they are needed.

Also:

1. Add in boto as a requirement (used for ec2 metadata calls)
2. Add in pyyaml as a requirement (used for all yaml processing)
3. Add in configobj as a requirement (only for old-style configs)
---
 Requires | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)

diff --git a/Requires b/Requires
index dbf64baf..e2ec8ff7 100644
--- a/Requires
+++ b/Requires
@@ -1,3 +1,25 @@
+# Pypi requirements for cloud-init to work
+
+# Used for templating any files or strings that are considered 
+# to be templates, not cheetah since it pulls in alot of extra libs.
+# This one is pretty dinky and does want we want (var substituion)
 Tempita>=0.4
+
+# This is used for any pretty printing of tabular data.
 PrettyTable>=0.4
+
+# This one is currently only used by the MAAS datasource. If that
+# datasource is removed, this is no longer needed
 oauth>=1.0
+
+# This is used to fetch the ec2 metadata into a easily
+# parseable format, instead of having to have cloud-init perform
+# those same fetchs and decodes and signing (...) that ec2 requires.
+boto>=2.4
+
+# This is only needed if you have old style configurations
+configobj>=4.6
+
+# All new style configurations are in the yaml format
+pyyaml>=3.0
+

From 987c06768c3c529bcfa81da1b4435fe63e0d9d6a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 12:58:30 -0700
Subject: [PATCH 157/434] They are handlers not mods ;)

---
 cloudinit/handlers/__init__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index 0ff80a9e..afa9ec3b 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -104,7 +104,7 @@ def run_part(mod, data, ctype, filename, payload, frequency):
         else:
             mod.handle_part(data, ctype, filename, payload, frequency)
     except:
-        util.logexc(LOG, ("Failed calling mod %s (%s, %s, %s)"
+        util.logexc(LOG, ("Failed calling handler %s (%s, %s, %s)"
                          " with frequency %s"), 
                     mod, ctype, filename,
                     mod_ver, frequency)

From 77864b2c43a8dd5095153d1f01f9cb4d2bc75407 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 13:06:02 -0700
Subject: [PATCH 158/434] When a handler version is set but to an unknown
 non-int convertible value, treat it as 1

---
 cloudinit/handlers/__init__.py | 13 ++++++++++---
 1 file changed, 10 insertions(+), 3 deletions(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index afa9ec3b..156e228d 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -98,11 +98,18 @@ def run_part(mod, data, ctype, filename, payload, frequency):
             (frequency == PER_INSTANCE and mod_freq == PER_INSTANCE)):
         return
     mod_ver = mod.handler_version
+    # Sanity checks on version (should be an int convertable)
     try:
-        if mod_ver == 1:
-            mod.handle_part(data, ctype, filename, payload)
-        else:
+        mod_ver = int(mod_ver)
+    except:
+        mod_ver = None
+    try:
+        if mod_ver and mod_ver >= 2:
+            # Treat as v. 2 which does get a frequency
             mod.handle_part(data, ctype, filename, payload, frequency)
+        else:
+            # Treat as v. 1 which gets no frequency
+            mod.handle_part(data, ctype, filename, payload)
     except:
         util.logexc(LOG, ("Failed calling handler %s (%s, %s, %s)"
                          " with frequency %s"), 

From 4cb2327ad002519e81618108337e234f36009d58 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 13:11:22 -0700
Subject: [PATCH 159/434] Pass in the datasource as an option, instead of the
 lower level instance id.

This allows others to use datasource functions if they wish, instead of being restricted to just the instance id.

+1 for future use ;)
---
 cloudinit/handlers/boot_hook.py | 6 ++++--
 cloudinit/stages.py             | 2 +-
 2 files changed, 5 insertions(+), 3 deletions(-)

diff --git a/cloudinit/handlers/boot_hook.py b/cloudinit/handlers/boot_hook.py
index 10f60b8d..fa675f09 100644
--- a/cloudinit/handlers/boot_hook.py
+++ b/cloudinit/handlers/boot_hook.py
@@ -32,10 +32,12 @@ LOG = logging.getLogger(__name__)
 
 
 class BootHookPartHandler(handlers.Handler):
-    def __init__(self, paths, instance_id, **_kwargs):
+    def __init__(self, paths, datasource, **_kwargs):
         handlers.Handler.__init__(self, PER_ALWAYS)
         self.boothook_dir = paths.get_ipath("boothooks")
-        self.instance_id = instance_id
+        self.instance_id = None
+        if datasource:
+            self.instance_id = datasource.get_instance_id()
 
     def list_types(self):
         return [
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 8fa9d6d3..2931830c 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -287,7 +287,7 @@ class Init(object):
     def _default_userdata_handlers(self):
         opts = {
             'paths': self.paths,
-            'instance_id': self.datasource.get_instance_id(),
+            'datasource': self.datasource,
         }
         # TODO Hmmm, should we dynamically import these??
         def_handlers = [

From e28ae97c0d47a04b6bfd72e3f57175facfc53893 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 13:15:34 -0700
Subject: [PATCH 160/434] Add comment as to why this cfg class is useful

---
 cloudinit/cfg.py | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/cloudinit/cfg.py b/cloudinit/cfg.py
index dd8f7baf..215ed855 100644
--- a/cloudinit/cfg.py
+++ b/cloudinit/cfg.py
@@ -20,6 +20,14 @@ import io
 
 from ConfigParser import (NoSectionError, NoOptionError, RawConfigParser)
 
+# This config parser will not throw when sections don't exist
+# and you are setting values on those sections which is useful
+# when writing to new options that may not have corresponding
+# sections. Also it can default other values when doing gets
+# so that if those sections/options do not exist you will
+# get a default instead of an error. Another useful case where
+# you can avoid catching exceptions that you typically don't
+# care about...
 
 class DefaultingConfigParser(RawConfigParser):
     DEF_INT = 0

From 4a7eb1f30040cc0d5f9ba4d39bef04655d9bb1aa Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 13:19:15 -0700
Subject: [PATCH 161/434] Add comment as to why the cloud object/wrapper is
 useful

---
 cloudinit/cloud.py | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index 8372d123..a2a5cfdb 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -27,6 +27,16 @@ from cloudinit import log as logging
 
 LOG = logging.getLogger(__name__)
 
+# This class is the high level wrapper that provides
+# access to cloud-init objects without exposing the stage objects
+# to handler and or transform manipulation. It allows for cloud
+# init to restrict what those types of user facing code may see
+# and or adjust (which helps avoid code messing with each other)
+#
+# It also provides util functions that avoid having to know
+# how to get a certain member from this submembers as well
+# as providing a backwards compatible object that can be maintained
+# while the stages/other objects can be worked on independently...
 
 class Cloud(object):
     def __init__(self, datasource, paths, cfg, distro, runners):

From b5086ec15c21da1e2e5f319aa9a7a9c7466d0a14 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 13:23:32 -0700
Subject: [PATCH 162/434] Check instance id against none, and not just
 empty/false/0/none since 0 or empty might be valid

---
 cloudinit/handlers/boot_hook.py | 2 +-
 cloudinit/stages.py             | 8 ++++----
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/cloudinit/handlers/boot_hook.py b/cloudinit/handlers/boot_hook.py
index fa675f09..456b8020 100644
--- a/cloudinit/handlers/boot_hook.py
+++ b/cloudinit/handlers/boot_hook.py
@@ -63,7 +63,7 @@ class BootHookPartHandler(handlers.Handler):
         filepath = self._write_part(payload, filename)
         try:
             env = os.environ.copy()
-            if self.instance_id:
+            if self.instance_id is not None:
                 env['INSTANCE_ID'] = str(self.instance_id)
             util.subp([filepath], env=env)
         except util.ProcessExecutionError:
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 2931830c..c2d78a78 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -233,13 +233,13 @@ class Init(object):
 
         # Write what the datasource was and is..
         ds = "%s: %s" % (util.obj_name(self.datasource), self.datasource)
-        previous_ds = ''
+        previous_ds = None
         ds_fn = os.path.join(idir, 'datasource')
         try:
             previous_ds = util.load_file(ds_fn).strip()
         except Exception:
             pass
-        if not previous_ds:
+        if previous_ds is None:
             # TODO: ?? is this right
             previous_ds = ds
         util.write_file(ds_fn, "%s\n" % ds)
@@ -248,14 +248,14 @@ class Init(object):
 
         # What the instance id was and is...
         iid = self.datasource.get_instance_id()
-        previous_iid = ''
+        previous_iid = None
         p_iid_fn = os.path.join(dp, 'previous-instance-id')
         c_iid_fn = os.path.join(dp, 'instance-id')
         try:
             previous_iid = util.load_file(p_iid_fn).strip()
         except Exception:
             pass
-        if not previous_iid:
+        if previous_iid is None:
             # TODO: ?? is this right
             previous_iid = iid
         util.write_file(c_iid_fn, "%s\n" % iid)

From b795faf73d5f933904706fe884836e7277ba0cb8 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 13:25:15 -0700
Subject: [PATCH 163/434] Revert that last change for this file, it should be a
 string that is non-empty so checking against that is fine

---
 cloudinit/stages.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index c2d78a78..05b59852 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -239,7 +239,7 @@ class Init(object):
             previous_ds = util.load_file(ds_fn).strip()
         except Exception:
             pass
-        if previous_ds is None:
+        if not previous_ds:
             # TODO: ?? is this right
             previous_ds = ds
         util.write_file(ds_fn, "%s\n" % ds)
@@ -255,7 +255,7 @@ class Init(object):
             previous_iid = util.load_file(p_iid_fn).strip()
         except Exception:
             pass
-        if previous_iid is None:
+        if not previous_iid:
             # TODO: ?? is this right
             previous_iid = iid
         util.write_file(c_iid_fn, "%s\n" % iid)

From f0559348d8e904c7ee90c2e285ff6c576bc28912 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 13:27:10 -0700
Subject: [PATCH 164/434] Should be loaded not loading

---
 cloudinit/stages.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 05b59852..b0eef928 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -92,7 +92,7 @@ class Init(object):
         # None check so that we don't keep on re-loading if empty
         if self._cfg is None:
             self._cfg = self._read_cfg()
-            LOG.debug("Loading init config %s", self._cfg)
+            LOG.debug("Loaded init config %s", self._cfg)
         # Nobody gets the real config
         ocfg = copy.deepcopy(self._cfg)
         if restriction == 'restricted':

From bd39c490adb3f361c6014c86f29030f2ae37ea82 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 13:31:48 -0700
Subject: [PATCH 165/434] Fix logic issue with reading previous file for
 previous instance id, when the current file should be looked at instead

---
 cloudinit/stages.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index b0eef928..ddac2ac2 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -249,17 +249,17 @@ class Init(object):
         # What the instance id was and is...
         iid = self.datasource.get_instance_id()
         previous_iid = None
-        p_iid_fn = os.path.join(dp, 'previous-instance-id')
         c_iid_fn = os.path.join(dp, 'instance-id')
         try:
-            previous_iid = util.load_file(p_iid_fn).strip()
+            previous_iid = util.load_file(c_iid_fn).strip()
         except Exception:
             pass
         if not previous_iid:
             # TODO: ?? is this right
             previous_iid = iid
         util.write_file(c_iid_fn, "%s\n" % iid)
-        util.write_file(p_iid_fn, "%s\n" % previous_iid)
+        util.write_file(os.path.join(dp, 'previous-instance-id'),
+                        "%s\n" % previous_iid)
         return iid
 
     def fetch(self):

From e97959c5a7d714c1f4f2760e32d3d736a669df3e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 13:33:06 -0700
Subject: [PATCH 166/434] Comments about checking if this is right, no longer
 needed

---
 cloudinit/stages.py | 10 ++++------
 1 file changed, 4 insertions(+), 6 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index ddac2ac2..5a00eae3 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -240,7 +240,6 @@ class Init(object):
         except Exception:
             pass
         if not previous_ds:
-            # TODO: ?? is this right
             previous_ds = ds
         util.write_file(ds_fn, "%s\n" % ds)
         util.write_file(os.path.join(dp, 'previous-datasource'),
@@ -249,17 +248,16 @@ class Init(object):
         # What the instance id was and is...
         iid = self.datasource.get_instance_id()
         previous_iid = None
-        c_iid_fn = os.path.join(dp, 'instance-id')
+        iid_fn = os.path.join(dp, 'instance-id')
         try:
-            previous_iid = util.load_file(c_iid_fn).strip()
+            previous_iid = util.load_file(iid_fn).strip()
         except Exception:
             pass
         if not previous_iid:
-            # TODO: ?? is this right
             previous_iid = iid
-        util.write_file(c_iid_fn, "%s\n" % iid)
+        util.write_file(iid_fn, "%s\n" % iid)
         util.write_file(os.path.join(dp, 'previous-instance-id'),
-                        "%s\n" % previous_iid)
+                        "%s\n" % (previous_iid))
         return iid
 
     def fetch(self):

From 4eef02db6d9a9597687e7aee16f2ee1b58ffa9b3 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 13:43:31 -0700
Subject: [PATCH 167/434] Comments as to why we are using a csv parser and do
 some of the logic checks that are done for option extraction

---
 cloudinit/ssh_util.py | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index f6941a29..ba252e7f 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -79,12 +79,22 @@ class AuthKeyEntry(object):
     
         options = ent[0:i]
         options_lst = []
+        
+        # Now use a csv parser to pull the options
+        # out of the above string that we just found an endpoint for.
+        #
+        # No quoting so we don't mess up any of the quoting that
+        # is already there.
         reader = csv.reader(StringIO(options), quoting=csv.QUOTE_NONE)
         for row in reader:
             for e in row:
+                # Only keep non-empty csv options
                 e = e.strip()
                 if e:
                     options_lst.append(e)
+
+        # Now take the rest of the items before the string
+        # as long as there is room to do this...
         toks = []
         if i + 1 < len(ent):
             toks = ent[i + 1:].split(None, 3)

From 56367832967a870515ade2056c7699a617c52ea8 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 19:18:29 -0700
Subject: [PATCH 168/434] Update ssh_util to have a parser class and a line
 entry class. Also have a method that will parse the authorized key file.

This allows:

1. Testing of parsing separate from testing of entry construction.
1. Testing of authorized key file parsing, separate from updating.
---
 cloudinit/ssh_util.py | 118 +++++++++++++++++++++++++-----------------
 1 file changed, 71 insertions(+), 47 deletions(-)

diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index ba252e7f..663afd92 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -32,7 +32,38 @@ LOG = logging.getLogger(__name__)
 DEF_SSHD_CFG = "/etc/ssh/sshd_config"
 
 
-class AuthKeyEntry(object):
+class AuthKeyLine(object):
+    def __init__(self, source, keytype=None, base64=None,
+                 comment=None, options=None):
+        self.base64 = base64
+        self.comment = comment
+        self.options = options
+        self.keytype = keytype
+        self.source = source
+
+    def empty(self):
+        if (not self.base64 and
+            not self.comment and not self.keytype and not self.options):
+            return True
+        return False
+
+    def __str__(self):
+        toks = []
+        if self.options:
+            toks.append(self.options)
+        if self.keytype:
+            toks.append(self.keytype)
+        if self.base64:
+            toks.append(self.base64)
+        if self.comment:
+            toks.append(self.comment)
+        if not toks:
+            return self.source
+        else:
+            return ' '.join(toks)
+
+
+class AuthKeyLineParser(object):
     """
     AUTHORIZED_KEYS FILE FORMAT
      AuthorizedKeysFile specifies the file containing public keys for public
@@ -52,10 +83,6 @@ class AuthKeyEntry(object):
      case-insensitive):
     """
 
-    def __init__(self, line, def_opt=None):
-        self.line = str(line)
-        (self.value, self.components) = self._parse(self.line, def_opt)
-
     def _extract_options(self, ent):
         """
         The options (if present) consist of comma-separated option specifica-
@@ -97,10 +124,11 @@ class AuthKeyEntry(object):
         # as long as there is room to do this...
         toks = []
         if i + 1 < len(ent):
-            toks = ent[i + 1:].split(None, 3)
+            rest = ent[i + 1:]
+            toks = rest.split(None, 2)
         return (options_lst, toks)
 
-    def _form_components(self, toks):
+    def _form_components(self, line, toks, options=None):
         components = {}
         if len(toks) == 1:
             components['base64'] = toks[0]
@@ -111,50 +139,31 @@ class AuthKeyEntry(object):
             components['keytype'] = toks[0]
             components['base64'] = toks[1]
             components['comment'] = toks[2]
-        return components
+        components['options'] = options
+        if not components:
+            return AuthKeyLine(line)
+        else:
+            return AuthKeyLine(line, **components)
 
-    def get(self, piece):
-        return self.components.get(piece)
-
-    def _parse(self, in_line, def_opt):
+    def parse(self, in_line, def_opt=None):
         line = in_line.rstrip("\r\n")
         if line.startswith("#") or line.strip() == '':
-            return (False, {})
+            return AuthKeyLine(source=line)
         else:
             ent = line.strip()
             toks = ent.split(None, 3)
-            tmp_components = {}
-            if def_opt:
-                tmp_components['options'] = def_opt
             if len(toks) < 4:
-                tmp_components.update(self._form_components(toks))
+                return self._form_components(line, toks, def_opt)
             else:
                 (options, toks) = self._extract_options(ent)
                 if options:
-                    tmp_components['options'] = ",".join(options)
-                tmp_components.update(self._form_components(toks))
-            # We got some useful value!
-            return (True, tmp_components)
-
-    def __str__(self):
-        if not self.value:
-            return self.line
-        else:
-            toks = []
-            if 'options' in self.components:
-                toks.append(self.components['options'])
-            if 'keytype' in self.components:
-                toks.append(self.components['keytype'])
-            if 'base64' in self.components:
-                toks.append(self.components['base64'])
-            if 'comment' in self.components:
-                toks.append(self.components['comment'])
-            if not toks:
-                return ''
-            return ' '.join(toks)
+                    options = ",".join(options)
+                else:
+                    options = def_opt
+                return self._form_components(line, toks, options)
 
 
-def update_authorized_keys(fname, keys):
+def parse_authorized_keys(fname):
     lines = []
     try:
         if os.path.isfile(fname):
@@ -163,25 +172,38 @@ def update_authorized_keys(fname, keys):
         util.logexc(LOG, "Error reading lines from %s", fname)
         lines = []
 
+    parser = AuthKeyLineParser()
+    contents = []
+    for line in lines:
+        contents.append(parser.parse(line))
+    return contents
+
+
+def update_authorized_keys(fname, keys):
+    entries = parse_authorized_keys(fname)
     to_add = list(keys)
-    for i in range(0, len(lines)):
-        ent = AuthKeyEntry(lines[i])
-        if not ent.value:
+
+    for i in range(0, len(entries)):
+        ent = entries[i]
+        if ent.empty() or not ent.base64:
             continue
         # Replace those with the same base64
         for k in keys:
-            if not k.value:
+            if k.empty() or not k.base64:
                 continue
-            if k.get('base64') == ent.get('base64'):
+            if k.base64 == ent.base64:
                 # Replace it with our better one
                 ent = k
                 # Don't add it later
                 to_add.remove(k)
-        lines[i] = str(ent)
+        entries[i] = ent
 
     # Now append any entries we did not match above
     for key in to_add:
-        lines.append(str(key))
+        entries.append(key)
+
+    # Now format them back to strings...
+    lines = [str(b) for b in entries]
 
     # Ensure it ends with a newline
     lines.append('')
@@ -198,9 +220,11 @@ def setup_user_keys(keys, user, key_prefix, sshd_config_fn=None):
         util.ensure_dir(ssh_dir, mode=0700)
         util.chownbyid(ssh_dir, pwent.pw_uid, pwent.pw_gid)
 
+    # Turn the keys given into actual entries
+    parser = AuthKeyLineParser()
     key_entries = []
     for k in keys:
-        key_entries.append(AuthKeyEntry(k, def_opt=key_prefix))
+        key_entries.append(parser.parse(str(k), def_opt=key_prefix))
 
     with util.SeLinuxGuard(ssh_dir, recursive=True):
         try:

From 38b20db28a1850caa83aeb5a563d74ab49ea92ce Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 19:24:30 -0700
Subject: [PATCH 169/434] Send in src line instead of stripped line.

---
 cloudinit/ssh_util.py | 16 ++++++++--------
 1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index 663afd92..d58707d0 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -128,7 +128,7 @@ class AuthKeyLineParser(object):
             toks = rest.split(None, 2)
         return (options_lst, toks)
 
-    def _form_components(self, line, toks, options=None):
+    def _form_components(self, src_line, toks, options=None):
         components = {}
         if len(toks) == 1:
             components['base64'] = toks[0]
@@ -141,26 +141,26 @@ class AuthKeyLineParser(object):
             components['comment'] = toks[2]
         components['options'] = options
         if not components:
-            return AuthKeyLine(line)
+            return AuthKeyLine(src_line)
         else:
-            return AuthKeyLine(line, **components)
+            return AuthKeyLine(src_line, **components)
 
-    def parse(self, in_line, def_opt=None):
-        line = in_line.rstrip("\r\n")
+    def parse(self, src_line, def_opt=None):
+        line = src_line.rstrip("\r\n")
         if line.startswith("#") or line.strip() == '':
-            return AuthKeyLine(source=line)
+            return AuthKeyLine(src_line)
         else:
             ent = line.strip()
             toks = ent.split(None, 3)
             if len(toks) < 4:
-                return self._form_components(line, toks, def_opt)
+                return self._form_components(src_line, toks, def_opt)
             else:
                 (options, toks) = self._extract_options(ent)
                 if options:
                     options = ",".join(options)
                 else:
                     options = def_opt
-                return self._form_components(line, toks, options)
+                return self._form_components(src_line, toks, options)
 
 
 def parse_authorized_keys(fname):

From 1fc29a2cd8a7442d65830377906b90782195dd9d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 19:38:41 -0700
Subject: [PATCH 170/434] Capture the exceptions and just re-throw the last one
 on errors

---
 cloudinit/url_helper.py | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 7ae0226a..18686686 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -60,7 +60,7 @@ def readurl(url, data=None, timeout=None,
     retries = max(retries, 0)
     attempts = retries + 1
 
-    last_excp = Exception("??")
+    excepts = []
     LOG.info(("Attempting to read from %s with %s attempts"
                 " (%s retries) to be performed"), url, attempts, retries)
     open_args = {}
@@ -78,16 +78,16 @@ def readurl(url, data=None, timeout=None,
                          url, status, len(content), (i + 1))
                 return (content, status)
         except urllib2.HTTPError as e:
-            last_excp = e
+            excepts.append(e)
         except urllib2.URLError as e:
             # This can be a message string or
             # another exception instance 
             # (socket.error for remote URLs, OSError for local URLs).
             if (isinstance(e.reason, (OSError)) and
                 e.reason.errno == errno.ENOENT):
-                last_excp = e.reason
+                excepts.append(e.reason)
             else:
-                last_excp = e
+                excepts.append(e)
         if i + 1 < attempts:
             LOG.debug("Please wait %s seconds while we wait to try again",
                      sec_between)
@@ -95,7 +95,11 @@ def readurl(url, data=None, timeout=None,
 
     # Didn't work out
     LOG.warn("Failed reading from %s after %s attempts", url, attempts)
-    raise last_excp
+    
+    # It must of errored at least once for code
+    # to get here so re-raise the last error
+    LOG.debug("%s errors occured, re-raising the last one", len(excepts))
+    raise excepts[-1]
 
 
 def wait_for_url(urls, max_wait=None, timeout=None,

From 25ba996edc4822a9106779719b998b8694db96dc Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 19:43:42 -0700
Subject: [PATCH 171/434] Let read_file_or_url util function have good defaults

---
 cloudinit/util.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 38ca9573..11986447 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -553,7 +553,7 @@ def read_optional_seed(fill, base="", ext="", timeout=5):
         raise
 
 
-def read_file_or_url(url, timeout, retries, file_retries):
+def read_file_or_url(url, timeout=5, retries=10, file_retries=0):
     if url.startswith("/"):
         url = "file://%s" % url
     if url.startswith("file://"):

From 4b258a4593a5e348284c0146dc040e7ddf4995eb Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 19:45:48 -0700
Subject: [PATCH 172/434] Allow url fetching to catch any other type of
 exceptions that occur

---
 cloudinit/url_helper.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 18686686..95de9c7a 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -88,6 +88,8 @@ def readurl(url, data=None, timeout=None,
                 excepts.append(e.reason)
             else:
                 excepts.append(e)
+        except Exception as e:
+            excepts.append(e)
         if i + 1 < attempts:
             LOG.debug("Please wait %s seconds while we wait to try again",
                      sec_between)

From 6811734ccebb1649e1e95327d08b120632d80f43 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 19:57:01 -0700
Subject: [PATCH 173/434] Remove default since it will never be called that way
 and apply default since it's not currently being called that way

---
 cloudinit/ssh_util.py       | 5 +----
 cloudinit/transforms/ssh.py | 3 +--
 2 files changed, 2 insertions(+), 6 deletions(-)

diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index d58707d0..13adbb09 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -210,10 +210,7 @@ def update_authorized_keys(fname, keys):
     return '\n'.join(lines)
 
 
-def setup_user_keys(keys, user, key_prefix, sshd_config_fn=None):
-    if not sshd_config_fn:
-        sshd_config_fn = DEF_SSHD_CFG
-
+def setup_user_keys(keys, user, key_prefix, sshd_config_fn=DEF_SSHD_CFG):
     pwent = pwd.getpwnam(user)
     ssh_dir = os.path.join(pwent.pw_dir, '.ssh')
     if not os.path.exists(ssh_dir):
diff --git a/cloudinit/transforms/ssh.py b/cloudinit/transforms/ssh.py
index f5c22e28..b1f2ce89 100644
--- a/cloudinit/transforms/ssh.py
+++ b/cloudinit/transforms/ssh.py
@@ -112,8 +112,7 @@ def handle(_name, cfg, cloud, log, _args):
         util.logexc(log, "Applying ssh credentials failed!")
 
 
-def apply_credentials(keys, user, disable_root,
-                      disable_root_opts=DISABLE_ROOT_OPTS):
+def apply_credentials(keys, user, disable_root, disable_root_opts):
 
     keys = set(keys)
     if user:

From 5b453631ff1d02ee67f566106e67fe92ea47f65f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 20:03:38 -0700
Subject: [PATCH 174/434] Match the transform named final_msg by adding a _msg
 to the transform name.

---
 cloudinit/transforms/{welcome.py => welcome_msg.py} | 0
 config/cloud.cfg                                    | 2 +-
 2 files changed, 1 insertion(+), 1 deletion(-)
 rename cloudinit/transforms/{welcome.py => welcome_msg.py} (100%)

diff --git a/cloudinit/transforms/welcome.py b/cloudinit/transforms/welcome_msg.py
similarity index 100%
rename from cloudinit/transforms/welcome.py
rename to cloudinit/transforms/welcome_msg.py
diff --git a/config/cloud.cfg b/config/cloud.cfg
index f1c43f2f..147e0500 100644
--- a/config/cloud.cfg
+++ b/config/cloud.cfg
@@ -20,7 +20,7 @@ preserve_hostname: false
 
 # The transform modules that run in the 'init' stage
 cloud_init_modules:
- - welcome
+ - welcome_msg
  - bootcmd
  - resizefs
  - set_hostname

From 99a0001c621c4646f6a3deaac12aea00292a02fb Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 20:04:13 -0700
Subject: [PATCH 175/434] Not config anymore, now a transform

---
 cloudinit/stages.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 5a00eae3..24a4d23f 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -474,7 +474,7 @@ class Transforms(object):
                 func_args = [name, copy.deepcopy(self.cfg),
                              c_cloud, transforms.LOG, args]
                 # This name will affect the semaphore name created
-                run_name = "config-%s" % (name)
+                run_name = "transform-%s" % (name)
                 c_cloud.run(run_name, mod.handle, func_args, freq=freq)
             except Exception as e:
                 util.logexc(LOG, "Running %s (%s) failed", name, mod)

From 835ac9de92abf4697a9dbe7537678e70ae4c716a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 20:16:19 -0700
Subject: [PATCH 176/434] Rename user data obj, which is really a user data
 message object and add comments as to what the data items are used for

---
 cloudinit/stages.py | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 24a4d23f..70f2bcc9 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -306,7 +306,7 @@ class Init(object):
         sys.path.insert(0, idir)
 
         # Ensure datasource fetched before activation (just incase)
-        ud_obj = self.datasource.get_userdata()
+        user_data_msg = self.datasource.get_userdata()
 
         # This keeps track of all the active handlers
         c_handlers = helpers.ContentHandlers()
@@ -340,15 +340,17 @@ class Init(object):
         # Walk the user data
         part_data = {
             'handlers': c_handlers,
+            # Any new handlers that are encountered get writen here
             'handlerdir': idir,
-            'data': data, 
+            'data': data,
+            # The default frequency if handlers don't have one
             'frequency': frequency,
             # This will be used when new handlers are found
             # to help write there contents to files with numbered
             # names...
             'handlercount': 0,
         }
-        handlers.walk(ud_obj, handlers.walker_callback, data=part_data)
+        handlers.walk(user_data_msg, handlers.walker_callback, data=part_data)
 
         # Give callbacks opportunity to finalize
         called = []

From cd8fd732b81a981875a04a3e773bdd6035954360 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 20:16:26 -0700
Subject: [PATCH 177/434] 1. Ensure that when a bad version is found, it
 gets set to 1. 2. Increment part handler count even if it doesn't get
 registered (this shouldn't cause any problems)

---
 cloudinit/handlers/__init__.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index 156e228d..0ef704f7 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -102,7 +102,7 @@ def run_part(mod, data, ctype, filename, payload, frequency):
     try:
         mod_ver = int(mod_ver)
     except:
-        mod_ver = None
+        mod_ver = 1
     try:
         if mod_ver and mod_ver >= 2:
             # Treat as v. 2 which does get a frequency
@@ -134,12 +134,12 @@ def walker_handle_handler(pdata, _ctype, _filename, payload):
         modfname = "%s.py" % (modfname)
     # TODO: Check if path exists??
     util.write_file(modfname, payload, 0600)
+    pdata['handlercount'] = curcount + 1
     handlers = pdata['handlers']
     try:
         mod = fixup_handler(importer.import_module(modname))
         handlers.register(mod)
         call_begin(mod, pdata['data'], frequency)
-        pdata['handlercount'] = curcount + 1
     except:
         util.logexc(LOG, "Failed at registered python file: %s", modfname)
 

From 6b52f5af635359d60b296744ec73110e858e1636 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 20:22:16 -0700
Subject: [PATCH 178/434] Update error messaging for when importing/registering
 a part-handler fails

---
 cloudinit/handlers/__init__.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index 0ef704f7..3944c661 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -141,7 +141,8 @@ def walker_handle_handler(pdata, _ctype, _filename, payload):
         handlers.register(mod)
         call_begin(mod, pdata['data'], frequency)
     except:
-        util.logexc(LOG, "Failed at registered python file: %s", modfname)
+        util.logexc(LOG, ("Failed at registering python file: %s"
+                          " (part handler %s)"), modfname, curcount)
 
 
 def _extract_first_or_bytes(blob, size):

From 8597dbbb8a1923240ea5ad0b4cdef3c812b99623 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 20:44:58 -0700
Subject: [PATCH 179/434] 1. Fix the welcome_msg name to welcome_message (oops)
 2. Adjust that name in the cloud.cfg 3. Add in the ability to specify a
 dictionary that is the transform instead of a list    which makes the config
 look nicer when users have custom transforms with arguments and such.

---
 cloudinit/stages.py                                  | 12 ++++++++++++
 .../{welcome_msg.py => welcome_message.py}           |  0
 config/cloud.cfg                                     | 12 ++++++++----
 3 files changed, 20 insertions(+), 4 deletions(-)
 rename cloudinit/transforms/{welcome_msg.py => welcome_message.py} (100%)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 70f2bcc9..ba6cb915 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -431,6 +431,18 @@ class Transforms(object):
                     contents['args'] = item[2:]
                 if contents:
                     module_list.append(contents)
+            elif isinstance(item, (dict)):
+                contents = {}
+                valid = False
+                if 'name' in item:
+                    contents['mod'] = item['name'].strip()
+                    valid = True
+                if 'frequency' in item:
+                    contents['freq'] = item['frequency'].strip()
+                if 'args' in item:
+                    contents['args'] = item['args'] or []
+                if contents and valid:
+                    module_list.append(contents)
             else:
                 raise TypeError(("Failed to read '%s' item in config,"
                                  " unknown type %s") %
diff --git a/cloudinit/transforms/welcome_msg.py b/cloudinit/transforms/welcome_message.py
similarity index 100%
rename from cloudinit/transforms/welcome_msg.py
rename to cloudinit/transforms/welcome_message.py
diff --git a/config/cloud.cfg b/config/cloud.cfg
index 147e0500..0e431962 100644
--- a/config/cloud.cfg
+++ b/config/cloud.cfg
@@ -18,9 +18,13 @@ preserve_hostname: false
 #      timeout: 5 # (defaults to 50 seconds)
 #      max_wait: 10 # (defaults to 120 seconds)
 
-# The transform modules that run in the 'init' stage
+# The transform that run in the 'init' stage
 cloud_init_modules:
- - welcome_msg
+# This is the hash way of specifying a transform
+ - name: welcome_message
+# This argument list will get passed to the transform when activated
+   args:
+    - init
  - bootcmd
  - resizefs
  - set_hostname
@@ -30,7 +34,7 @@ cloud_init_modules:
  - rsyslog
  - ssh
 
- # The transform modules that run in the 'config' stage
+ # The transforms that run in the 'config' stage
 cloud_config_modules:
  - mounts
  - ssh-import-id
@@ -49,7 +53,7 @@ cloud_config_modules:
  - runcmd
  - byobu
 
-# The transform modules that run in the 'final' stage
+# The transforms that run in the 'final' stage
 cloud_final_modules:
  - rightscale_userdata
  - scripts-per-once

From 66ccc2353e02df3c088da341af99cb1b196d4e26 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 20:48:30 -0700
Subject: [PATCH 180/434] Consistently use dashes instead of underscores for
 the transform names

---
 config/cloud.cfg | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/config/cloud.cfg b/config/cloud.cfg
index 0e431962..7a6bf243 100644
--- a/config/cloud.cfg
+++ b/config/cloud.cfg
@@ -21,15 +21,15 @@ preserve_hostname: false
 # The transform that run in the 'init' stage
 cloud_init_modules:
 # This is the hash way of specifying a transform
- - name: welcome_message
+ - name: welcome-message
 # This argument list will get passed to the transform when activated
    args:
     - init
  - bootcmd
  - resizefs
- - set_hostname
- - update_hostname
- - update_etc_hosts
+ - set-hostname
+ - update-hostname
+ - update-etc-hosts
  - ca-certs
  - rsyslog
  - ssh
@@ -55,7 +55,7 @@ cloud_config_modules:
 
 # The transforms that run in the 'final' stage
 cloud_final_modules:
- - rightscale_userdata
+ - rightscale-userdata
  - scripts-per-once
  - scripts-per-boot
  - scripts-per-instance

From b5c554e8a3628db95f102fee7aebab6848e0ed7c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 23:12:21 -0700
Subject: [PATCH 181/434] Fix include on enabling, simplify statements around
 include skipping, allow for case insensitive include statements to be used

---
 cloudinit/user_data.py | 28 ++++++++++++++++------------
 1 file changed, 16 insertions(+), 12 deletions(-)

diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index 2f01579a..7a79cc02 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -100,16 +100,18 @@ class UserDataProcessor(object):
                             'urlcache', entry_fn)
 
     def _do_include(self, content, append_msg):
-        # is just a list of urls, one per line
+        # Inlude a list of urls, one per line
         # also support '#include <url here>'
+        # or #include-once '<url here>'
+        include_once_on = False
         for line in content.splitlines():
-            includeonce = False
-            if line in ("#include", "#include-once"):
-                continue
-            if line.startswith("#include-once"):
+            lc_line = line.lower()
+            if lc_line.startswith("#include-once"):
                 line = line[len("#include-once"):].lstrip()
-                includeonce = True
-            elif line.startswith("#include"):
+                # Every following include will now 
+                # not be refetched....
+                include_once_on = True
+            elif lc_line.startswith("#include"):
                 line = line[len("#include"):].lstrip()
             if line.startswith("#"):
                 continue
@@ -117,13 +119,15 @@ class UserDataProcessor(object):
             if not include_url:
                 continue
 
-            includeonce_filename = self._get_include_once_filename(include_url)
-            if includeonce and os.path.isfile(includeonce_filename):
-                content = util.load_file(includeonce_filename)
+            include_once_fn = None
+            if include_once_on:
+                include_once_fn = self._get_include_once_filename(include_url)
+            if include_once_on and os.path.isfile(include_once_fn):
+                content = util.load_file(include_once_fn)
             else:
                 (content, st) = url_helper.readurl(include_url)
-                if includeonce and url_helper.ok_http_code(st):
-                    util.write_file(includeonce_filename, content, mode=0600)
+                if include_once_on and url_helper.ok_http_code(st):
+                    util.write_file(include_once_fn, content, mode=0600)
                 if not url_helper.ok_http_code(st):
                     content = ''
 

From ea767f14185c6f80e5265c4c06c45732c6e81577 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 23:15:05 -0700
Subject: [PATCH 182/434] 1. Allow for checking against lower case include
 types. 2. Perform lstrip on the payload, just incase people put
 spaces/whitespace before the type.

---
 cloudinit/handlers/__init__.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index 3944c661..d3374666 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -218,8 +218,10 @@ def fixup_handler(mod, def_freq=PER_INSTANCE):
 
 
 def type_from_starts_with(payload, default=None):
+    payload_lc = payload.lower()
+    payload_lc = payload_lc.lstrip()
     for text in INCLUSION_SRCH:
-        if payload.startswith(text):
+        if payload_lc.startswith(text):
             return INCLUSION_TYPES_MAP[text]
     return default
 

From 6bace7c07c374e33c7375f7042867121696d50b7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sat, 16 Jun 2012 23:19:02 -0700
Subject: [PATCH 183/434] Add todo to see if we should turn back off include
 once

---
 cloudinit/user_data.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index 7a79cc02..663f7cda 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -113,6 +113,7 @@ class UserDataProcessor(object):
                 include_once_on = True
             elif lc_line.startswith("#include"):
                 line = line[len("#include"):].lstrip()
+                # TODO: Should we turn back off include once here???
             if line.startswith("#"):
                 continue
             include_url = line.strip()

From aeaecdd9ceaf8dd19bff344b967ea0f0f03bd075 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sun, 17 Jun 2012 00:15:04 -0700
Subject: [PATCH 184/434] Log handler + info that is about to be called

---
 cloudinit/handlers/__init__.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index d3374666..c6f2119c 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -104,7 +104,9 @@ def run_part(mod, data, ctype, filename, payload, frequency):
     except:
         mod_ver = 1
     try:
-        if mod_ver and mod_ver >= 2:
+        LOG.debug("Calling handler %s (%s, %s, %s) with frequency %s", 
+                  mod, ctype, filename, mod_ver, frequency)
+        if mod_ver >= 2:
             # Treat as v. 2 which does get a frequency
             mod.handle_part(data, ctype, filename, payload, frequency)
         else:

From 19202ba958eb5eb1c7318890a3909a1d62489406 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sun, 17 Jun 2012 13:37:49 -0700
Subject: [PATCH 185/434] 1. Remove rhel sysconfig for timezone, now have a
 rhel distro subclass 2. Remove private apt_get function, since it can just be
 the package_command public one.

---
 cloudinit/distros/ubuntu.py | 19 ++++++-------------
 1 file changed, 6 insertions(+), 13 deletions(-)

diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index 9b743b55..ec4d6b5b 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -43,14 +43,11 @@ class Distro(distros.Distro):
     
     def install_packages(self, pkglist):
         self._update_package_sources()
-        self._apt_get('install', pkglist)
+        self.package_command('install', pkglist)
 
     def _write_network(self, settings):
         util.write_file("/etc/network/interfaces", settings)
 
-    def package_command(self, command, args=None):
-        self._apt_get(command, args)
-
     def set_hostname(self, hostname):
         contents = "%s\n" % (hostname)
         util.write_file("/etc/hostname", contents, 0644)
@@ -103,24 +100,20 @@ class Distro(distros.Distro):
                              " no file found at %s") % (tz, tz_file))
         tz_contents = "%s\n" % tz
         util.write_file("/etc/timezone", tz_contents)
-        # TODO, this should be in a rhel distro subclass??
-        if os.path.exists("/etc/sysconfig/clock"):
-            tz_contents = '"%s"\n' % tz
-            util.write_file("/etc/sysconfig/clock", tz_contents)
-        # This ensures that the correct tz will be used for the system
         util.copy(tz_file, "/etc/localtime")
 
-    # apt_get top level command (install, update...), and args to pass it
-    def _apt_get(self, tlc, args=None):
+    def package_command(self, command, args=None):
         e = os.environ.copy()
+        # See: http://tiny.cc/kg91fw
+        # Or: http://tiny.cc/mh91fw
         e['DEBIAN_FRONTEND'] = 'noninteractive'
         cmd = ['apt-get', '--option', 'Dpkg::Options::=--force-confold',
-               '--assume-yes', tlc]
+               '--assume-yes', command]
         if args:
             cmd.extend(args)
         # Allow the output of this to flow outwards (ie not be captured)
         util.subp(cmd, env=e, capture=False)
 
     def _update_package_sources(self):
-        self._runner.run("update-sources", self._apt_get,
+        self._runner.run("update-sources", self.package_command,
                          ["update"], freq=PER_INSTANCE)
\ No newline at end of file

From c636a8780327bb1f00689e2c2ee85b4f766e8449 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sun, 17 Jun 2012 13:38:58 -0700
Subject: [PATCH 186/434] Added a new rhel distro that does the following.

1. Translate (some of) the ubuntu network format to the rhel format (until we have python netcf active) and
   then write the different ifcfg files to /etc/sysconfig/network-scripts as needed to bring the network online
2. Apply the hostname to the /etc/sysconfig/network file (appending to it or adjusting that file if it exists)
3. Write to the /etc/sysconfig/clock file to adjust the timezone (or adjust that file instead of appending)
4. Runs yum commands (to match the packaging commands in the apt-get flavor)
5. Update the hostname in /etc/sysconfig/network (or a previous file) for the update hostname transform
---
 cloudinit/distros/rhel.py | 294 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 294 insertions(+)
 create mode 100644 cloudinit/distros/rhel.py

diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
new file mode 100644
index 00000000..85283b23
--- /dev/null
+++ b/cloudinit/distros/rhel.py
@@ -0,0 +1,294 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+import os
+
+from cloudinit import distros
+from cloudinit import log as logging
+from cloudinit import util
+
+LOG = logging.getLogger(__name__)
+
+NETWORK_FN_TPL = '/etc/sysconfig/network-scripts/ifcfg-%s'
+
+
+class Distro(distros.Distro):
+
+    def __init__(self, name, cfg, paths):
+        distros.Distro.__init__(self, name, cfg, paths)
+    
+    def install_packages(self, pkglist):
+        self.package_command('install', pkglist)
+
+    def _write_network(self, settings):
+        # TODO fix this... since this is the ubuntu format
+        entries = translate_network(settings)
+        LOG.debug("Translated ubuntu style network settings %s into %s",
+                  settings, entries)
+        # Make the intermediate format as the rhel format...
+        for (dev, info) in entries.iteritems():
+            lines = []
+            lines.append("DEVICE=%s" % (dev))
+            boot_proto = info.get('bootproto')
+            if boot_proto:
+                lines.append("BOOTPROTO=%s" % (boot_proto))
+            net_mask = info.get('netmask')
+            if net_mask:
+                lines.append("NETMASK=%s" % (net_mask))
+            addr = info.get('address')
+            if addr:
+                lines.append("IPADDR=%s" % (addr))
+            if info.get('auto'):
+                lines.append("ONBOOT=yes")
+            else:
+                lines.append("ONBOOT=no")
+            gtway = info.get('gateway')
+            if gtway:
+                lines.append("GATEWAY=%s" % (gtway))
+            bcast = info.get('broadcast')
+            if bcast:
+                lines.append("BROADCAST=%s" % (bcast))
+            mac_addr = info.get('hwaddress')
+            if mac_addr:
+                lines.append("MACADDR=%s" % (mac_addr))
+            contents = "\n".join(lines)
+            net_fn = NETWORK_FN_TPL % (dev)
+            util.write_file(net_fn, contents, 0644)
+
+    def set_hostname(self, hostname):
+        self._write_hostname(hostname, "/etc/sysconfig/network")
+        LOG.debug("Setting hostname to %s", hostname)
+        util.subp(['hostname', hostname])
+
+    def _write_hostname(self, hostname, out_fn):
+        old_contents = []
+        if os.path.isfile(out_fn):
+            old_contents = self._read_conf(out_fn)
+        # Update the 'HOSTNAME' if it exists instead of appending
+        new_contents = []
+        adjusted = False
+        for entry in old_contents:
+            if not entry:
+                continue
+            if len(entry) == 1:
+                new_contents.append(entry[0])
+                continue
+            (cmd, args) = entry
+            cmd_c = cmd.strip().lower()
+            if cmd_c == 'hostname':
+                args = "%s" % (hostname)
+                adjusted = True
+            new_contents.append("=".join([cmd, args]))
+        # Guess not found, append it
+        if not adjusted:
+            new_contents.append("HOSTNAME=%s" % (hostname))
+        contents = "\n".join(new_contents)
+        util.write_file(out_fn, contents, 0644)
+
+    def update_hostname(self, hostname, prev_file):
+        hostname_prev = self._read_hostname(prev_file)
+        hostname_in_sys = self._read_hostname("/etc/sysconfig/network")
+        update_files = []
+        if not hostname_prev or hostname_prev != hostname:
+            update_files.append(prev_file)
+        if (not hostname_in_sys or
+           (hostname_in_sys == hostname_prev and hostname_in_sys != hostname)):
+            update_files.append("/etc/sysconfig/network")
+        for fn in update_files:
+            try:
+                self._write_hostname(hostname, fn)
+            except:
+                util.logexc(LOG, "Failed to write hostname %s to %s",
+                            hostname, fn)
+        if (hostname_in_sys and hostname_prev and
+            hostname_in_sys != hostname_prev):
+            LOG.debug(("%s differs from /etc/sysconfig/network."
+                        " Assuming user maintained hostname."), prev_file)
+        if "/etc/sysconfig/network" in update_files:
+            LOG.debug("Setting hostname to %s", hostname)
+            util.subp(['hostname', hostname])
+
+    def _read_hostname(self, filename, default=None):
+        contents = self._read_conf(filename)
+        for c in contents:
+            if len(c) != 2:
+                continue
+            (cmd, args) = c
+            cmd_c = cmd.lower().strip()
+            if cmd_c == 'hostname':
+                args_c = args.strip()
+                if args_c:
+                    return args_c
+        return default
+
+    def _read_conf(self, filename):
+        contents = util.load_file(filename, quiet=True)
+        conf_lines = []
+        for line in contents.splitlines():
+            c_line = line.strip()
+            if not c_line or c_line.startswith("#"):
+                conf_lines.append([line])
+                continue
+            # Handle inline comments
+            c_pos = c_line.find("#")
+            if c_pos != -1:
+                c_line = c_line[0:c_pos].strip()
+            if not c_line:
+                conf_lines.append([line])
+                continue
+            # Format should be CMD=ARG1 ARG2...
+            pieces = c_line.split("=", 1)
+            if not pieces or len(pieces) == 1:
+                conf_lines.append([line])
+                continue
+            (cmd, args) = pieces
+            cmd = cmd.strip()
+            conf_lines.append([cmd, args])
+        return conf_lines
+
+    def set_timezone(self, tz):
+        tz_file = os.path.join("/usr/share/zoneinfo", tz)
+        if not os.path.isfile(tz_file):
+            raise Exception(("Invalid timezone %s,"
+                             " no file found at %s") % (tz, tz_file))
+        # Adjust the sysconfig clock zone setting
+        old_contents = self._read_conf("/etc/sysconfig/clock")
+        new_contents = []
+        zone_added = False
+        # Update the 'ZONE' if it exists instead of appending
+        for entry in old_contents:
+            if not entry:
+                continue
+            if len(entry) == 1:
+                new_contents.append(entry[0])
+                continue
+            (cmd, args) = entry
+            cmd_c = cmd.lower().strip()
+            if cmd_c == 'zone':
+                args = '"%s"' % (tz)
+                zone_added = True
+            new_contents.append("=".join([cmd, args]))
+        # Guess not found, append it
+        if not zone_added:
+            new_contents.append('ZONE="%s"' % (tz))
+        tz_contents = "\n".join(new_contents)
+        util.write_file("/etc/sysconfig/clock", tz_contents)
+        # This ensures that the correct tz will be used for the system
+        util.copy(tz_file, "/etc/localtime")
+
+    def package_command(self, command, args=None):
+        cmd = ['yum']
+        # If enabled, then yum will be tolerant of errors on the command line
+        # with regard to packages. 
+        # For example: if you request to install foo, bar and baz and baz is 
+        # installed; yum won't error out complaining that baz is already
+        # installed. 
+        cmd.append("-t")
+        # Determines whether or not yum prompts for confirmation 
+        # of critical actions. We don't want to prompt...
+        cmd.append("-y")
+        cmd.append(command)
+        if args:
+            cmd.extend(args)
+        # Allow the output of this to flow outwards (ie not be captured)
+        util.subp(cmd, capture=False)
+        
+        
+# This is a util function to translate a ubuntu /etc/network/interfaces 'blob'
+# to a rhel equiv. that can then be written to /etc/sysconfig/network-scripts/
+# TODO remove when we have python-netcf active...
+def translate_network(settings):
+    # Get the standard cmd, args from the ubuntu format
+    entries = []
+    for line in settings.splitlines():
+        line = line.strip()
+        if not line or line.startswith("#"):
+            continue
+        split_up = line.split(None, 1)
+        if len(split_up) <= 1:
+            continue
+        entries.append(split_up)
+    # Figure out where each iface section is
+    ifaces = []
+    consume = {}
+    for (cmd, args) in entries:
+        if cmd == 'iface':
+            if consume:
+                ifaces.append(consume)
+                consume = {}
+            consume[cmd] = args
+        else:
+            consume[cmd] = args
+    # Check if anything left over to consume
+    absorb = False
+    for (cmd, args) in consume.iteritems():
+        if cmd == 'iface':
+            absorb = True
+    if absorb:
+        ifaces.append(consume)
+    # Now translate
+    real_ifaces = {}
+    for info in ifaces:
+        if 'iface' not in info:
+            continue
+        iface_details = info['iface'].split(None)
+        dev_name = None
+        if len(iface_details) >= 1:
+            dev = iface_details[0].strip().lower()
+            if dev:
+                dev_name = dev
+        if not dev_name:
+            continue
+        iface_info = {}
+        if len(iface_details) >= 3:
+            proto_type = iface_details[2].strip().lower()
+            # Seems like this can be 'loopback' which we don't
+            # really care about
+            if proto_type in ['dhcp', 'static']:
+                iface_info['bootproto'] = proto_type
+        # These can just be copied over
+        for k in ['netmask', 'address', 'gateway', 'broadcast']:
+            if k in info:
+                val = info[k].strip().lower()
+                if val:
+                    iface_info[k] = val
+        # Is any mac address spoofing going on??
+        if 'hwaddress' in info:
+            hw_info = info['hwaddress'].lower().strip()
+            hw_split = hw_info.split(None, 1)
+            if len(hw_split) == 2 and hw_split[0].startswith('ether'):
+                hw_addr = hw_split[1]
+                if hw_addr:
+                    iface_info['hwaddress'] = hw_addr
+        real_ifaces[dev_name] = iface_info
+    # Check for those that should be started on boot via 'auto'
+    for (cmd, args) in entries:
+        if cmd == 'auto':
+            # Seems like auto can be like 'auto eth0 eth0:1' so just get the
+            # first part out as the device name
+            args = args.split(None)
+            if not args:
+                continue
+            dev_name = args[0].strip().lower()
+            if dev_name in real_ifaces:
+                real_ifaces[dev_name]['auto'] = True
+    return real_ifaces

From f23f4a075dd58d1f7bc0bf7149d4d07d4acaac4d Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sun, 17 Jun 2012 13:48:53 -0700
Subject: [PATCH 187/434] 1. Adjust the ubuntu network hostname writing to go
 through a standard write function 2. Add comment as to why we search for "#"
 when reading

---
 cloudinit/distros/ubuntu.py | 17 ++++++++++-------
 1 file changed, 10 insertions(+), 7 deletions(-)

diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index ec4d6b5b..786974ad 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -49,11 +49,14 @@ class Distro(distros.Distro):
         util.write_file("/etc/network/interfaces", settings)
 
     def set_hostname(self, hostname):
-        contents = "%s\n" % (hostname)
-        util.write_file("/etc/hostname", contents, 0644)
+        self._write_hostname(hostname, "/etc/hostname")
         LOG.debug("Setting hostname to %s", hostname)
         util.subp(['hostname', hostname])
 
+    def _write_hostname(self, hostname, out_fn):
+        contents = "%s\n" % (hostname)
+        util.write_file(out_fn, contents, 0644)
+
     def update_hostname(self, hostname, prev_file):
         hostname_prev = self._read_hostname(prev_file)
         hostname_in_etc = self._read_hostname("/etc/hostname")
@@ -65,8 +68,7 @@ class Distro(distros.Distro):
             update_files.append("/etc/hostname")
         for fn in update_files:
             try:
-                contents = "%s\n" % (hostname)
-                util.write_file(fn, contents, 0644)
+                self._write_hostname(hostname, fn)
             except:
                 util.logexc(LOG, "Failed to write hostname %s to %s",
                             hostname, fn)
@@ -82,11 +84,12 @@ class Distro(distros.Distro):
         contents = util.load_file(filename, quiet=True)
         for line in contents.splitlines():
             hpos = line.find("#")
+            # Handle inline comments
             if hpos != -1:
                 line = line[0:hpos]
-            line = line.rstrip()
-            if line:
-                return line
+            line_c = line.strip()
+            if line_c:
+                return line_c
         return default
 
     def _get_localhost_ip(self):

From 90a0658805acb8e7cd1cfe2b17e4bbe3ade67f9b Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sun, 17 Jun 2012 18:21:30 -0700
Subject: [PATCH 188/434] Update the variable for comment positioning to be
 'c_pos' (comment position) instead of 'hpos' (??)

---
 cloudinit/distros/ubuntu.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index 786974ad..c0345c1d 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -83,10 +83,10 @@ class Distro(distros.Distro):
     def _read_hostname(self, filename, default=None):
         contents = util.load_file(filename, quiet=True)
         for line in contents.splitlines():
-            hpos = line.find("#")
+            c_pos = line.find("#")
             # Handle inline comments
-            if hpos != -1:
-                line = line[0:hpos]
+            if c_pos != -1:
+                line = line[0:c_pos]
             line_c = line.strip()
             if line_c:
                 return line_c

From 0fc2ab95244ef7c7edfc9e88ff869f0102a33719 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sun, 17 Jun 2012 18:23:24 -0700
Subject: [PATCH 189/434] 1. Add a url response class that urlreading now
 returns (instead of a tuple).    a. This allows for more properties to be
 added as needed in the future, instead of being very restrictive. 2. Fix up
 all uses of the url reading to now use this new response object. 3. Also
 fixup user data including, such that if no response actually occurs the url
 content is not further processed.

---
 cloudinit/sources/DataSourceMAAS.py         |  9 ++--
 cloudinit/transforms/rightscale_userdata.py |  6 +--
 cloudinit/url_helper.py                     | 49 ++++++++++++++++-----
 cloudinit/user_data.py                      | 20 ++++++---
 cloudinit/util.py                           | 16 ++++---
 5 files changed, 69 insertions(+), 31 deletions(-)

diff --git a/cloudinit/sources/DataSourceMAAS.py b/cloudinit/sources/DataSourceMAAS.py
index 40ace947..bb8fbac1 100644
--- a/cloudinit/sources/DataSourceMAAS.py
+++ b/cloudinit/sources/DataSourceMAAS.py
@@ -185,9 +185,12 @@ def read_maas_seed_url(seed_url, header_cb=None, timeout=None,
         else:
             headers = {}
         try:
-            (resp, sc) = uhelp.readurl(url, headers=headers, timeout=timeout)
-            if uhelp.ok_http_code(sc):
-                md[name] = resp
+            resp = uhelp.readurl(url, headers=headers, timeout=timeout)
+            if resp.ok():
+                md[name] = str(resp)
+            else:
+                LOG.warn(("Fetching from %s resulted in"
+                          " an invalid http code %s"), url, resp.code)
         except urllib2.HTTPError as e:
             if e.code != 404:
                 raise
diff --git a/cloudinit/transforms/rightscale_userdata.py b/cloudinit/transforms/rightscale_userdata.py
index 40d76c89..8dfd845f 100644
--- a/cloudinit/transforms/rightscale_userdata.py
+++ b/cloudinit/transforms/rightscale_userdata.py
@@ -79,10 +79,10 @@ def handle(name, _cfg, cloud, log, _args):
     for (i, url) in enumerate(urls):
         fname = os.path.join(scripts_d, "rightscale-%02i" % (i))
         try:
-            (content, st) = uhelp.readurl(url)
+            resp = uhelp.readurl(url)
             # Ensure its a valid http response (and something gotten)
-            if uhelp.ok_http_code(st) and content:
-                util.write_file(fname, content, mode=0700)
+            if resp.ok() and resp.contents:
+                util.write_file(fname, str(resp), mode=0700)
                 wrote_fns.append(fname)
         except Exception as e:
             captured_excps.append(e)
diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 95de9c7a..56649c1b 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -34,11 +34,35 @@ from cloudinit import version
 LOG = logging.getLogger(__name__)
 
 
-def ok_http_code(st, redirects_ok=False):
-    if redirects_ok:
-        return st in xrange(200, 400)
-    else:
-        return st in xrange(200, 300)
+class UrlResponse(object):
+    def __init__(self, status_code, contents=None, headers=None):
+        self._status_code = status_code
+        self._contents = contents
+        self._headers = headers
+
+    @property
+    def code(self):
+        return self._status_code
+
+    @property
+    def contents(self):
+        return self._contents
+    
+    @property
+    def headers(self):
+        return self._headers
+    
+    def __str__(self):
+        if not self.contents:
+            return ''
+        else:
+            return str(self.contents)
+
+    def ok(self, redirects_ok=False):
+        if redirects_ok:
+            return self.code in xrange(200, 400)
+        else:
+            return self.code in xrange(200, 300)
 
 
 def readurl(url, data=None, timeout=None,
@@ -74,9 +98,12 @@ def readurl(url, data=None, timeout=None,
                 if status is None:
                     # This seems to happen when files are read...
                     status = 200
+                headers = {}
+                if rh.headers:
+                    headers = dict(rh.headers)
                 LOG.info("Read from %s (%s, %sb) after %s attempts",
                          url, status, len(content), (i + 1))
-                return (content, status)
+                return UrlResponse(status, content, headers)
         except urllib2.HTTPError as e:
             excepts.append(e)
         except urllib2.URLError as e:
@@ -162,11 +189,11 @@ def wait_for_url(urls, max_wait=None, timeout=None,
                 else:
                     headers = {}
 
-                (resp, sc) = readurl(url, headers=headers, timeout=timeout)
-                if not resp:
-                    reason = "empty response [%s]" % sc
-                elif not ok_http_code(sc):
-                    reason = "bad status code [%s]" % sc
+                resp = readurl(url, headers=headers, timeout=timeout)
+                if not resp.contents:
+                    reason = "empty response [%s]" % (resp.code)
+                elif not resp.ok():
+                    reason = "bad status code [%s]" % (resp.code)
                 else:
                     return url
             except urllib2.HTTPError as e:
diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index 663f7cda..bf34943d 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -121,19 +121,25 @@ class UserDataProcessor(object):
                 continue
 
             include_once_fn = None
+            content = None
             if include_once_on:
                 include_once_fn = self._get_include_once_filename(include_url)
             if include_once_on and os.path.isfile(include_once_fn):
                 content = util.load_file(include_once_fn)
             else:
-                (content, st) = url_helper.readurl(include_url)
-                if include_once_on and url_helper.ok_http_code(st):
-                    util.write_file(include_once_fn, content, mode=0600)
-                if not url_helper.ok_http_code(st):
-                    content = ''
+                resp = url_helper.readurl(include_url)
+                if include_once_on and resp.ok():
+                    util.write_file(include_once_fn, str(resp), mode=0600)
+                if resp.ok():
+                    content = str(resp)
+                else:
+                    LOG.warn(("Fetching from %s resulted in"
+                              " a invalid http code of %s"),
+                             include_url, resp.code)
 
-            new_msg = convert_string(content)
-            self._process_msg(new_msg, append_msg)
+            if content is not None:
+                new_msg = convert_string(content)
+                self._process_msg(new_msg, append_msg)
 
     def _explode_archive(self, archive, append_msg):
         entries = util.load_yaml(archive, default=[], allowed=[list, set])
diff --git a/cloudinit/util.py b/cloudinit/util.py
index 11986447..b6fa959b 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -595,14 +595,16 @@ def read_seeded(base="", ext="", timeout=5, retries=10, file_retries=0):
         ud_url = "%s%s%s" % (base, "user-data", ext)
         md_url = "%s%s%s" % (base, "meta-data", ext)
 
-    (md_str, msc) = read_file_or_url(md_url, timeout, retries, file_retries)
+    md_resp = read_file_or_url(md_url, timeout, retries, file_retries)
     md = None
-    if md_str and uhelp.ok_http_code(msc):
+    if md_resp.ok():
+        md_str = str(md_resp)
         md = load_yaml(md_str, default={})
 
-    (ud_str, usc) = read_file_or_url(ud_url, timeout, retries, file_retries)
+    ud_resp = read_file_or_url(ud_url, timeout, retries, file_retries)
     ud = None
-    if ud_str and uhelp.ok_http_code(usc):
+    if ud_resp.ok():
+        ud_str = str(ud_resp)
         ud = ud_str
 
     return (md, ud)
@@ -769,9 +771,9 @@ def get_cmdline_url(names=None, starts=None, cmdline=None):
     if not url:
         return (None, None, None)
 
-    (contents, sc) = uhelp.readurl(url)
-    if contents.startswith(starts) and uhelp.ok_http_code(sc):
-        return (key, url, contents)
+    resp = uhelp.readurl(url)
+    if resp.contents.startswith(starts) and resp.ok():
+        return (key, url, str(resp))
 
     return (key, url, None)
 

From 3d5497a25252c26c7bb2ef3dc7c088cb43c826a2 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:21:15 -0700
Subject: [PATCH 190/434] 1. Add in a clean section that will remove the
 /var/lib/cloud dir and the cloud.log file (helpful for testing)

---
 Makefile | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/Makefile b/Makefile
index 783ebd76..683475fd 100644
--- a/Makefile
+++ b/Makefile
@@ -15,5 +15,9 @@ test:
 2to3:
 	2to3 $(PY_FILES)
 
-.PHONY: test pylint pyflakes 2to3
+clean:
+	rm -rf /var/log/cloud-init.log \
+		   /var/lib/cloud/
+
+.PHONY: test pylint pyflakes 2to3 clean
 

From 2526d1e27b34901dd3140783602e579ae3f25ee0 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:22:01 -0700
Subject: [PATCH 191/434] 1. Decreasing of logging in piping routine 2. Fixup
 of merge dict after found out that it depends on the src return for non dict
 types 3. Only merge kernel config if there was any kernel config

---
 cloudinit/util.py | 34 ++++++++++++++--------------------
 1 file changed, 14 insertions(+), 20 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index b6fa959b..aaeaa5fc 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -275,15 +275,20 @@ def is_ipv4(instr):
 
 def merge_base_cfg(cfgfile, cfg_builtin=None):
     syscfg = read_conf_with_confd(cfgfile)
-
+    
     kern_contents = read_cc_from_cmdline()
     kerncfg = {}
     if kern_contents:
         kerncfg = load_yaml(kern_contents, default={})
 
-    # kernel parameters override system config
-    combined = mergedict(kerncfg, syscfg)
+    # Kernel parameters override system config
+    if kerncfg:
+        combined = mergedict(kerncfg, syscfg)
+    else:
+        combined = syscfg
+
     if cfg_builtin:
+        # Combined over-ride anything builtin
         fin = mergedict(combined, cfg_builtin)
     else:
         fin = combined
@@ -450,18 +455,11 @@ def mergedict(src, cand):
     Nested dictionaries are merged recursively.
     """
     if isinstance(src, dict) and isinstance(cand, dict):
-        for k, v in cand.iteritems():
+        for (k, v) in cand.iteritems():
             if k not in src:
                 src[k] = v
             else:
                 src[k] = mergedict(src[k], v)
-    else:
-        if not isinstance(src, dict):
-            raise TypeError(("Attempting to merge a non dictionary "
-                             "source type: %s") % (obj_name(src)))
-        if not isinstance(cand, dict):
-            raise TypeError(("Attempting to merge a non dictionary "
-                             "candidate type: %s") % (obj_name(cand)))
     return src
 
 
@@ -616,7 +614,7 @@ def read_conf_d(confd):
 
     # remove anything not ending in '.cfg'
     confs = [f for f in confs if f.endswith(".cfg")]
-
+    
     # remove anything not a file
     confs = [f for f in confs if os.path.isfile(os.path.join(confd, f))]
 
@@ -646,7 +644,8 @@ def read_conf_with_confd(cfgfile):
     if not confd or not os.path.isdir(confd):
         return cfg
 
-    return mergedict(read_conf_d(confd), cfg)
+    cfg = mergedict(read_conf_d(confd), cfg)
+    return cfg
 
 
 def read_cc_from_cmdline(cmdline=None):
@@ -752,13 +751,10 @@ def get_fqdn_from_hosts(hostname, filename="/etc/hosts"):
     return fqdn
 
 
-def get_cmdline_url(names=None, starts=None, cmdline=None):
+def get_cmdline_url(names=('cloud-config-url', 'url'),
+                    starts="#cloud-config", cmdline=None):
     if cmdline is None:
         cmdline = get_cmdline()
-    if not names:
-        names = ('cloud-config-url', 'url')
-    if not starts:
-        starts = "#cloud-config"
 
     data = keyval_str_to_dict(cmdline)
     url = None
@@ -895,8 +891,6 @@ def get_cmdline():
 
 def pipe_in_out(in_fh, out_fh, chunk_size=1024, chunk_cb=None):
     bytes_piped = 0
-    LOG.debug(("Transferring the contents of %s "
-             "to %s in chunks of size %sb"), in_fh, out_fh, chunk_size)
     while True:
         data = in_fh.read(chunk_size)
         if data == '':

From 6d10b8d89d7f8f1bb8507e536b66ebadbe20ede8 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:23:49 -0700
Subject: [PATCH 192/434] Adjust log message to say "open" instead of 'read'
 since this function can also post data...

---
 cloudinit/url_helper.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 56649c1b..5b5b41e2 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -85,7 +85,7 @@ def readurl(url, data=None, timeout=None,
     attempts = retries + 1
 
     excepts = []
-    LOG.info(("Attempting to read from %s with %s attempts"
+    LOG.info(("Attempting to open %s with %s attempts"
                 " (%s retries) to be performed"), url, attempts, retries)
     open_args = {}
     if timeout is not None:

From 53c44a81ce801ce5f41b79b4c71d6949cf251de7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:24:32 -0700
Subject: [PATCH 193/434] Include link to netcf library in the comment.

---
 cloudinit/distros/__init__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index 79d441ac..483642f3 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -53,7 +53,7 @@ class Distro(object):
 
     @abc.abstractmethod
     def _write_network(self, settings):
-        # In the future use the python-netcf
+        # In the future use the http://fedorahosted.org/netcf/
         # to write this blob out in a distro format
         raise NotImplementedError()
 

From 2df7700507a0449ace3d461751097fc5e4ad756a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:25:10 -0700
Subject: [PATCH 194/434] Add created by or added by cloud-init lines when we
 modify or create files.

---
 cloudinit/distros/rhel.py   | 3 +++
 cloudinit/distros/ubuntu.py | 5 ++++-
 2 files changed, 7 insertions(+), 1 deletion(-)

diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index 85283b23..e0ca5909 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -70,6 +70,7 @@ class Distro(distros.Distro):
             mac_addr = info.get('hwaddress')
             if mac_addr:
                 lines.append("MACADDR=%s" % (mac_addr))
+            lines.insert(0, '# Created by cloud-init')
             contents = "\n".join(lines)
             net_fn = NETWORK_FN_TPL % (dev)
             util.write_file(net_fn, contents, 0644)
@@ -100,6 +101,7 @@ class Distro(distros.Distro):
             new_contents.append("=".join([cmd, args]))
         # Guess not found, append it
         if not adjusted:
+            new_contents.append("# Added by cloud-init")
             new_contents.append("HOSTNAME=%s" % (hostname))
         contents = "\n".join(new_contents)
         util.write_file(out_fn, contents, 0644)
@@ -189,6 +191,7 @@ class Distro(distros.Distro):
             new_contents.append("=".join([cmd, args]))
         # Guess not found, append it
         if not zone_added:
+            new_contents.append("# Added by cloud-init")
             new_contents.append('ZONE="%s"' % (tz))
         tz_contents = "\n".join(new_contents)
         util.write_file("/etc/sysconfig/clock", tz_contents)
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index c0345c1d..24724d83 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -54,7 +54,10 @@ class Distro(distros.Distro):
         util.subp(['hostname', hostname])
 
     def _write_hostname(self, hostname, out_fn):
-        contents = "%s\n" % (hostname)
+        lines = []
+        lines.append("# Created by cloud-init")
+        lines.append(str(hostname))
+        contents = "\n".join(lines)
         util.write_file(out_fn, contents, 0644)
 
     def update_hostname(self, hostname, prev_file):

From e17f702dfeecf00eab8f2cc8bf79874acfb144b3 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:26:16 -0700
Subject: [PATCH 195/434] 1. Simplify basic logging (which will not always be
 turned on in the new cloud init main entrypoint) 2. Have the ability to reset
 the logging handlers  a. This seems needed when we initially have basic
 logging turned on, then later we come in and change the logging.     It seems
 required for some odd reason to go in and reset the handlers for the
 root/cloudinit loggers (needs some more investigation).

---
 cloudinit/log.py | 44 ++++++++++++++++++++++++++------------------
 1 file changed, 26 insertions(+), 18 deletions(-)

diff --git a/cloudinit/log.py b/cloudinit/log.py
index 5fcb77ef..478946f8 100644
--- a/cloudinit/log.py
+++ b/cloudinit/log.py
@@ -46,24 +46,14 @@ DEF_CON_FORMAT = '%(asctime)s - %(filename)s[%(levelname)s]: %(message)s'
 
 def setupBasicLogging():
     root = logging.getLogger()
-    # Warnings go to the console
     console = logging.StreamHandler(sys.stderr)
     console.setFormatter(logging.Formatter(DEF_CON_FORMAT))
-    console.setLevel(WARNING)
+    console.setLevel(DEBUG)
     root.addHandler(console)
-    # Everything else goes to this file (if we can)
-    try:
-        cfile = logging.FileHandler('/var/log/cloud-init.log')
-        cfile.setFormatter(logging.Formatter(DEF_CON_FORMAT))
-        cfile.setLevel(DEBUG)
-        root.addHandler(cfile)
-    except (IOError, OSError):
-        # Likely that u can't write to that file...
-        # Make console now have DEBUG??
-        console.setLevel(DEBUG)
     root.setLevel(DEBUG)
 
 
+
 def setupLogging(cfg=None):
     # See if the config provides any logging conf...
     if not cfg:
@@ -86,7 +76,7 @@ def setupLogging(cfg=None):
     # See if any of them actually load...
     am_tried = 0
     am_worked = 0
-    for log_cfg in log_cfgs:
+    for i, log_cfg in enumerate(log_cfgs):
         try:
             am_tried += 1
             # Assume its just a string if not a filename
@@ -97,13 +87,14 @@ def setupLogging(cfg=None):
             # Attempt to load its config
             logging.config.fileConfig(log_cfg)
             am_worked += 1
-        except Exception:
-            pass
+        except Exception as e:
+            sys.stderr.write(("WARN: Setup of logging config %s"
+                              " failed due to: %s\n") % (i + 1, e))
 
     # If it didn't work, at least setup a basic logger (if desired)
     basic_enabled = cfg.get('log_basic', True)
     if not am_worked:
-        sys.stderr.write(("Warning, no logging configured!"
+        sys.stderr.write(("WARN: no logging configured!"
                           " (tried %s configs)\n") % (am_tried))
         if basic_enabled:
             sys.stderr.write("Setting up basic logging...\n")
@@ -123,5 +114,22 @@ except ImportError:
         def emit(self, record):
             pass
 
-logger = logging.getLogger()
-logger.addHandler(NullHandler())
+
+def _resetLogger(log):
+    if not log:
+        return
+    handlers = list(log.handlers)
+    for h in handlers:
+        h.flush()
+        h.close()
+        log.removeHandler(h)
+    log.setLevel(NOTSET)
+    log.addHandler(NullHandler())
+
+
+def resetLogging():
+    _resetLogger(logging.getLogger())
+    _resetLogger(getLogger())
+
+
+resetLogging()

From 8e43f12b1bf5c42a5a985639926657b37afa83a6 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:28:25 -0700
Subject: [PATCH 196/434] When logging is 'cycled' ensure that we call the
 logging reset routine first.

---
 cloudinit/cloud.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index a2a5cfdb..90679202 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -50,6 +50,7 @@ class Cloud(object):
     # it is typically useful to cause the logging to be
     # setup again.
     def cycle_logging(self):
+        logging.resetLogging()
         logging.setupLogging(self.cfg)
 
     @property

From d5ba0f66d70ae672a5bd9b9d7db0e70dcc35df09 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:29:16 -0700
Subject: [PATCH 197/434] Fix include once always staying on, only turn it on
 until an include says to turn it back off, if one of those is encountered

---
 cloudinit/user_data.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index bf34943d..b7902d44 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -100,7 +100,7 @@ class UserDataProcessor(object):
                             'urlcache', entry_fn)
 
     def _do_include(self, content, append_msg):
-        # Inlude a list of urls, one per line
+        # Include a list of urls, one per line
         # also support '#include <url here>'
         # or #include-once '<url here>'
         include_once_on = False
@@ -109,11 +109,14 @@ class UserDataProcessor(object):
             if lc_line.startswith("#include-once"):
                 line = line[len("#include-once"):].lstrip()
                 # Every following include will now 
-                # not be refetched....
+                # not be refetched.... but will be 
+                # re-read from a local urlcache (if it worked)
                 include_once_on = True
             elif lc_line.startswith("#include"):
                 line = line[len("#include"):].lstrip()
-                # TODO: Should we turn back off include once here???
+                # Disable the include once if it was on
+                # if it wasn't, then this has no effect.
+                include_once_on = False
             if line.startswith("#"):
                 continue
             include_url = line.strip()

From 4ac6031c487354cd0092cf0fe531df70e285b240 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:30:21 -0700
Subject: [PATCH 198/434] Add comments as to what the special reference
 sections mean in log_cfgs

---
 config/cloud.cfg.d/05_logging.cfg | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/config/cloud.cfg.d/05_logging.cfg b/config/cloud.cfg.d/05_logging.cfg
index 2e7ac2ed..410a0650 100644
--- a/config/cloud.cfg.d/05_logging.cfg
+++ b/config/cloud.cfg.d/05_logging.cfg
@@ -1,4 +1,4 @@
-## this yaml formated config file handles setting
+## This yaml formated config file handles setting
 ## logger information.  The values that are necessary to be set
 ## are seen at the bottom.  The top '_log' are only used to remove
 ## redundency in a syslog and fallback-to-file case.
@@ -53,5 +53,9 @@ _log:
    args=("/dev/log", handlers.SysLogHandler.LOG_USER)
 
 log_cfgs:
+# These will be joined into a string that defines the configuration
  - [ *log_base, *log_syslog ]
+# These will be joined into a string that defines the configuration
  - [ *log_base, *log_file ]
+# A file path can also be used
+# - /etc/log.conf

From 542c92ee801caa88c1264d7b9b8ec5c76d67680d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:32:03 -0700
Subject: [PATCH 199/434] 1. Revert the 'transform-' template back to 'config-'
 template for now. 2. Make the init class have a public 'read_cfg' which can
 be used to force cfg loading to occur (instead of having to go through the
 cfg property)    a. This is a more 'public' way of forcing config to load,
 without exposing the config itself.

---
 cloudinit/stages.py | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index ba6cb915..a713bd1f 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -89,10 +89,8 @@ class Init(object):
         return self._extract_cfg('restricted')
 
     def _extract_cfg(self, restriction):
-        # None check so that we don't keep on re-loading if empty
-        if self._cfg is None:
-            self._cfg = self._read_cfg()
-            LOG.debug("Loaded init config %s", self._cfg)
+        # Ensure actually read
+        self.read_cfg()
         # Nobody gets the real config
         ocfg = copy.deepcopy(self._cfg)
         if restriction == 'restricted':
@@ -154,6 +152,12 @@ class Init(object):
                     g = None
                 util.chownbyname(log_file, u, g)
 
+    def read_cfg(self):
+        # None check so that we don't keep on re-loading if empty
+        if self._cfg is None:
+            self._cfg = self._read_cfg()
+            LOG.debug("Loaded init config %s", self._cfg)
+
     def _read_cfg(self):
         b_config = util.get_builtin_cfg()
         try:
@@ -488,7 +492,7 @@ class Transforms(object):
                 func_args = [name, copy.deepcopy(self.cfg),
                              c_cloud, transforms.LOG, args]
                 # This name will affect the semaphore name created
-                run_name = "transform-%s" % (name)
+                run_name = "config-%s" % (name)
                 c_cloud.run(run_name, mod.handle, func_args, freq=freq)
             except Exception as e:
                 util.logexc(LOG, "Running %s (%s) failed", name, mod)

From 62b27e436f7d2521dde508cbcf155ca93c9b5183 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 17:33:36 -0700
Subject: [PATCH 200/434] 1. Initial work on a unified program that will call
 into the new libraries.

Main features:

1. Use of argparse + subcommands to handle 'action' specific actions
  a. Actions being 'query', 'init', 'final', 'config'

!WIP!
---
 bin/cloud-init2.py | 183 +++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 183 insertions(+)
 create mode 100755 bin/cloud-init2.py

diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
new file mode 100755
index 00000000..6663379f
--- /dev/null
+++ b/bin/cloud-init2.py
@@ -0,0 +1,183 @@
+#!/usr/bin/python
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+import argparse
+import os
+import traceback
+import sys
+
+# This is more just for running from the bin folder
+possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
+        sys.argv[0]), os.pardir, os.pardir))
+if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
+    sys.path.insert(0, possible_topdir)
+
+
+from cloudinit import log as logging
+from cloudinit import netinfo
+from cloudinit import settings
+from cloudinit import sources
+from cloudinit import stages
+from cloudinit import util
+from cloudinit import version
+
+
+# Things u can query on
+QUERY_DATA_TYPES = [
+    'data',
+    'data_raw',
+    'instance_id',
+]
+
+LOG = logging.getLogger(__name__)
+
+
+def read_write_cmdline_url(target_fn):
+    if not os.path.exists(target_fn):
+        try:
+            (key, url, content) = util.get_cmdline_url()
+        except:
+            util.logexc(LOG, "Failed fetching command line url")
+            return
+        try:
+            if key and content:
+                util.write_file(target_fn, content, mode=0600)
+                LOG.info(("Wrote to %s with contents of command line"
+                          " url %s (len=%s)"), target_fn, url, len(content))
+            elif key and not content:
+                LOG.info(("Command line key %s with url"
+                          " %s had no contents"), key, url)
+        except:
+            util.logexc(LOG, "Failed writing url content to %s", target_fn)
+
+
+def main_init(args):
+    deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
+    if args.local:
+        deps = [sources.DEP_FILESYSTEM]
+
+    cfg_path = None
+    if args.file:
+        # Already opened so lets just pass that along
+        # since it would of broke if it couldn't have
+        # read that file
+        cfg_path = str(args.file.name)
+
+    if not args.local:
+        # What is this for??
+        root_name = "%s.d" % (settings.CLOUD_CONFIG)
+        target_fn = os.path.join(root_name, "91_kernel_cmdline_url.cfg")
+        read_write_cmdline_url(target_fn)
+    
+    # Cloud-init 'init' stage is broken up into the following stages
+    # 1. Ensure that the init object fetches its config without errors
+    # 2. Setup logging/output redirections with resultant config (if any)
+    # 3. Initialize the cloud-init filesystem
+    # 4. Check if we can stop early by looking for various files
+    # 5. Fetch the datasource
+    # 6. Consume the userdata (handlers get activated here)
+    # 7. Adjust any subsequent logging/output redirections
+    # 8. Run the transforms for the 'init' stage
+    # 9. Done!
+    now = util.time_rfc2822()
+    uptime = util.uptime()
+    init = stages.Init(deps)
+    # Stage 1
+    init.read_cfg()
+    # Stage 2
+    try:
+        util.fixup_output(init.cfg, 'init')
+    except:
+        util.logexc(LOG, "Failed to setup output redirection")
+    if args.debug:
+        # Reset so that all the debug handlers are closed out
+        LOG.debug("Logging being reset, this logger may no longer be active shortly")
+        logging.resetLogging()
+    logging.setupLogging(init.cfg)
+    # Stage 3
+    try:
+        init.initialize()
+    except Exception as e:
+        util.logexc(LOG, "Failed to initialize, likely bad things to come: %s", e)
+    # Stage 4
+    path_helper = init.paths
+    if not args.local:
+        nonet_path = "%s/%s" % (cloudinit.get_cpath("data"), "no-net")
+
+def main_config(args):
+    pass
+
+
+def main_final(args):
+    pass
+
+
+def main():
+    parser = argparse.ArgumentParser()
+    parser.add_argument('--version', '-v', action='version', 
+                        version='%(prog)s ' + (version.version_string()))
+    parser.add_argument('--file', '-f', action='store', 
+                        help='additional configuration file to include',
+                        type=argparse.FileType('rb'))
+    parser.add_argument('--debug', '-d', action='store_true', 
+                        help='show additional pre-action logging',
+                        default=False)
+    subparsers = parser.add_subparsers()
+
+    # Each action and its suboptions (if any)
+    parser_init = subparsers.add_parser('init', help='initializes cloud-init and performs \'init\' transforms')
+    parser_init.add_argument("--local", '-l', action='store_true',
+                             help="start in local mode", default=False)
+    parser_init.set_defaults(action='init')  # This is used so that we can know which action is selected
+
+    parser_config = subparsers.add_parser('config', help='performs cloud-init \'config\' transforms')
+    parser_config.set_defaults(action='config')
+
+    parser_final = subparsers.add_parser('final', help='performs cloud-init \'final\' transforms')
+    parser_final.set_defaults(action='final')
+
+    parser_query = subparsers.add_parser('query', help='query information stored in cloud-init')
+    parser_query.add_argument("--name", action="store",
+                              help="item name to query on",
+                              required=True,
+                              choices=QUERY_DATA_TYPES)
+    parser_query.set_defaults(action='query')
+    args = parser.parse_args()
+    
+    # Setup basic logging to start (until reinitialized)
+    if args.debug:
+        logging.setupBasicLogging()
+
+    stage_name = args.action
+    stage_mp = {
+        'init': main_init,
+        'config': main_config,
+        'final': main_final,
+    }
+    func = stage_mp.get(stage_name)
+    return func(args)
+
+
+if __name__ == '__main__':
+    sys.exit(main())
+

From 13bc46ee976796a107c15c8fc45bacb244daa194 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 21:05:57 -0700
Subject: [PATCH 201/434] 1. Removed the welcome message for now :-)

---
 config/cloud.cfg           |  6 ++----
 templates/welcome_msg.tmpl | 15 ---------------
 2 files changed, 2 insertions(+), 19 deletions(-)
 delete mode 100644 templates/welcome_msg.tmpl

diff --git a/config/cloud.cfg b/config/cloud.cfg
index 7a6bf243..b11b5aa5 100644
--- a/config/cloud.cfg
+++ b/config/cloud.cfg
@@ -21,10 +21,8 @@ preserve_hostname: false
 # The transform that run in the 'init' stage
 cloud_init_modules:
 # This is the hash way of specifying a transform
- - name: welcome-message
-# This argument list will get passed to the transform when activated
-   args:
-    - init
+ - name: bootcmd
+# This is the string way of specifying a transform
  - bootcmd
  - resizefs
  - set-hostname
diff --git a/templates/welcome_msg.tmpl b/templates/welcome_msg.tmpl
deleted file mode 100644
index 999202cc..00000000
--- a/templates/welcome_msg.tmpl
+++ /dev/null
@@ -1,15 +0,0 @@
-             _
-           _( )_
-          (     )
-         (_______)
-    _     \ \ \ \
-  _( )_        _
- (     )     _( )_
-(_______)   (     )
- \ \ \ \   (_______)
-            \ \ \ \
-
-Cloud-init v. {{version}}
-Starting stage: {{stage}} on {{timestamp}}
-System uptime: {{uptime}} seconds
---

From ef4d1bbc52a2cd74202a1d0cf2320f3b0fca768d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 21:06:24 -0700
Subject: [PATCH 202/434] Fixed the constructor params

---
 cloudinit/sources/DataSourceConfigDrive.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/sources/DataSourceConfigDrive.py b/cloudinit/sources/DataSourceConfigDrive.py
index 7450572f..5da1ffea 100644
--- a/cloudinit/sources/DataSourceConfigDrive.py
+++ b/cloudinit/sources/DataSourceConfigDrive.py
@@ -116,8 +116,8 @@ class DataSourceConfigDrive(sources.DataSource):
 
 
 class DataSourceConfigDriveNet(DataSourceConfigDrive):
-    def __init__(self, sys_cfg, paths):
-        DataSourceConfigDrive.__init__(self, sys_cfg, paths)
+    def __init__(self, sys_cfg, distro, paths):
+        DataSourceConfigDrive.__init__(self, sys_cfg, distro, paths)
         self.dsmode = 'net'
 
 

From 9d32b78f6e8feae6b8c922e853d82a61dbe5d28f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 21:07:17 -0700
Subject: [PATCH 203/434] 1. Fixed datasource construction (switched param
 order) 2. Fixed up importing of modules to handle the failure case better   
 a. Also realized that using the import class we don't have to reimport a
 module via getattr, so removed that.

---
 cloudinit/sources/__init__.py | 12 +++++-------
 1 file changed, 5 insertions(+), 7 deletions(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 5842d41b..831f97ea 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -51,7 +51,7 @@ class DataSource(object):
         self.userdata_raw = None
         name = util.obj_name(self)
         if name.startswith(DS_PREFIX):
-            name = name[DS_PREFIX:]
+            name = name[len(DS_PREFIX):]
         self.ds_cfg = util.get_cfg_by_path(self.sys_cfg,
                                           ("datasource", name), {})
         if not ud_proc:
@@ -171,7 +171,7 @@ def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
     for cls in ds_list:
         ds = util.obj_name(cls)
         try:
-            s = cls(distro, sys_cfg, paths)
+            s = cls(sys_cfg, distro, paths)
             if s.get_data():
                 return (s, ds)
         except Exception:
@@ -198,15 +198,13 @@ def list_sources(cfg_list, depends, pkg_list):
             if pkg:
                 pkg_name.append(str(pkg))
             pkg_name.append(ds_name)
-            mod = importer.import_module(".".join(pkg_name))
-            if pkg:
-                mod = getattr(mod, ds_name, None)
-            if not mod:
+            try:
+                mod = importer.import_module(".".join(pkg_name))
+            except RuntimeError:
                 continue
             lister = getattr(mod, "get_datasource_list", None)
             if not lister:
                 continue
-            LOG.debug("Seeing if %s matches using function %s", mod, lister)
             cls_matches = lister(depends)
             if not cls_matches:
                 continue

From 0b0bc2bcbe45791507116c31a7e11f25ed7b6225 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 21:08:00 -0700
Subject: [PATCH 204/434] Show the timeout (useful to see this when debugging)

---
 cloudinit/url_helper.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 5b5b41e2..0376450f 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -85,8 +85,8 @@ def readurl(url, data=None, timeout=None,
     attempts = retries + 1
 
     excepts = []
-    LOG.info(("Attempting to open %s with %s attempts"
-                " (%s retries) to be performed"), url, attempts, retries)
+    LOG.info(("Attempting to open '%s' with %s attempts"
+                " (%s retries, timeout=%s) to be performed"), url, attempts, retries, timeout)
     open_args = {}
     if timeout is not None:
         open_args['timeout'] = int(timeout)

From a9649b9417269fe8d11255333724ea38818828ac Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 21:08:21 -0700
Subject: [PATCH 205/434] 1. Rename the purge_cache 'rmcur' argument so its
 name better describes what it removes 2. When reading the config, allow
 passing in extra config files that override the existing configs (useful for testing...)

---
 cloudinit/stages.py | 31 ++++++++++++++++++-------------
 1 file changed, 18 insertions(+), 13 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index a713bd1f..2c610ce5 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -126,14 +126,14 @@ class Init(object):
         ]
         return initial_dirs
 
-    def purge_cache(self, rmcur=True):
-        rmlist = []
+    def purge_cache(self, rm_instance_lnk=True):
+        rm_list = []
         rmlist.append(self.paths.boot_finished)
-        if rmcur:
-            rmlist.append(self.paths.instance_link)
-        for f in rmlist:
+        if rm_instance_lnk:
+            rm_list.append(self.paths.instance_link)
+        for f in rm_list:
             util.del_file(f)
-        return len(rmlist)
+        return len(rm_list)
 
     def initialize(self):
         self._initialize_filesystem()
@@ -152,19 +152,24 @@ class Init(object):
                     g = None
                 util.chownbyname(log_file, u, g)
 
-    def read_cfg(self):
+    def read_cfg(self, extra_fns=None):
         # None check so that we don't keep on re-loading if empty
         if self._cfg is None:
-            self._cfg = self._read_cfg()
+            self._cfg = self._read_cfg(extra_fns)
             LOG.debug("Loaded init config %s", self._cfg)
 
-    def _read_cfg(self):
-        b_config = util.get_builtin_cfg()
+    def _read_cfg(self, extra_fns):
+        builtin_cfg = util.get_builtin_cfg()
         try:
-            conf = util.get_base_cfg()
+            conf = util.get_base_cfg(builtin=builtin_cfg)
         except Exception:
-            conf = b_config
-        return util.mergedict(conf, self._read_cfg_old())
+            conf = builtin_cfg
+        m_cfg = util.mergedict(conf, self._read_cfg_old())
+        if extra_fns:
+            for fn in extra_fns:
+                # Any extras over-ride the existing configs
+                m_cfg = util.mergedict(util.read_conf(fn), m_cfg)
+        return m_cfg
 
     def _restore_from_cache(self):
         pickled_fn = self.paths.get_ipath_cur('obj_pkl')

From e7aa88cbf0ba0a657d3a4ed9d512e99c1229f828 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 21:09:11 -0700
Subject: [PATCH 206/434] 1. Allow the built-in config to be passed in when
 getting the base config 2. Move the cloudinit util function that writes the
 command line url to a file to here.

---
 cloudinit/util.py | 25 +++++++++++++++++++++++--
 1 file changed, 23 insertions(+), 2 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index aaeaa5fc..164bcea8 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -1021,6 +1021,25 @@ def ensure_dirs(dirlist, mode=0755):
         ensure_dir(d, mode)
 
 
+def read_write_cmdline_url(target_fn):
+    if not os.path.exists(target_fn):
+        try:
+            (key, url, content) = get_cmdline_url()
+        except:
+            logexc(LOG, "Failed fetching command line url")
+            return
+        try:
+            if key and content:
+                write_file(target_fn, content, mode=0600)
+                LOG.debug(("Wrote to %s with contents of command line"
+                          " url %s (len=%s)"), target_fn, url, len(content))
+            elif key and not content:
+                LOG.debug(("Command line key %s with url"
+                          " %s had no contents"), key, url)
+        except:
+            logexc(LOG, "Failed writing url content to %s", target_fn)
+
+
 def yaml_dumps(obj):
     formatted = yaml.dump(obj,
                     line_break="\n",
@@ -1045,10 +1064,12 @@ def ensure_dir(path, mode=None):
         chmod(path, mode)
 
 
-def get_base_cfg(cfg_path=None):
+def get_base_cfg(cfg_path=None, builtin=None):
     if not cfg_path:
         cfg_path = CLOUD_CONFIG
-    return merge_base_cfg(cfg_path, get_builtin_cfg())
+    if not builtin:
+        builtin = get_builtin_cfg()
+    return merge_base_cfg(cfg_path, builtin)
 
 
 @contextlib.contextmanager

From 0e3ebd3c6ac67d0c4ead66a5491e3ca26d90bdce Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 18 Jun 2012 21:10:47 -0700
Subject: [PATCH 207/434] Removed this for now.

---
 cloudinit/transforms/welcome_message.py | 64 -------------------------
 1 file changed, 64 deletions(-)
 delete mode 100644 cloudinit/transforms/welcome_message.py

diff --git a/cloudinit/transforms/welcome_message.py b/cloudinit/transforms/welcome_message.py
deleted file mode 100644
index 04691d21..00000000
--- a/cloudinit/transforms/welcome_message.py
+++ /dev/null
@@ -1,64 +0,0 @@
-# vi: ts=4 expandtab
-#
-#    Copyright (C) 2012 Canonical Ltd.
-#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
-#    Copyright (C) 2012 Yahoo! Inc.
-#
-#    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
-#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
-#
-#    This program is free software: you can redistribute it and/or modify
-#    it under the terms of the GNU General Public License version 3, as
-#    published by the Free Software Foundation.
-#
-#    This program is distributed in the hope that it will be useful,
-#    but WITHOUT ANY WARRANTY; without even the implied warranty of
-#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-#    GNU General Public License for more details.
-#
-#    You should have received a copy of the GNU General Public License
-#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-from cloudinit.settings import PER_ALWAYS
-
-from cloudinit import templater
-from cloudinit import util
-from cloudinit import version
-
-import sys
-
-welcome_message_def = ("Cloud-init v. {{version}} starting stage {{stage}} at "
-                       "{{timestamp}}. Up {{uptime}} seconds.")
-
-
-frequency = PER_ALWAYS
-
-
-def handle(_name, cfg, cloud, log, args):
-
-    welcome_msg = util.get_cfg_option_str(cfg, "welcome_msg")
-    if not welcome_msg:
-        tpl_fn = cloud.get_template_filename("welcome_msg")
-        if tpl_fn:
-            welcome_msg = util.load_file(tpl_fn)
-
-    if not welcome_msg:
-        welcome_msg = welcome_message_def
-
-    stage = "??"
-    if args:
-        stage = args[0]
-
-    tpl_params = {
-        'stage': stage,
-        'version': version.version_string(),
-        'uptime': util.uptime(),
-        'timestamp': util.time_rfc2822(),
-    }
-    try:
-        contents = templater.render_string(welcome_msg, tpl_params)
-        # TODO use log or sys.stderr??
-        sys.stderr.write("%s\n" % (contents))
-    except:
-        util.logexc(log, "Failed to render welcome message template")

From fc7413233646dffc9a87cfcf8c0de55c8ecd2a5a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 11:04:42 -0700
Subject: [PATCH 208/434] 1. When running, return the function results as well
 as a boolean that states whether it ran.

---
 cloudinit/helpers.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index e5c45632..3fd819b3 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -150,7 +150,7 @@ class Runners(object):
             args = []
         if sem.has_run(name, freq):
             LOG.info("%s already ran (freq=%s)", name, freq)
-            return None
+            return (False, None)
         with sem.lock(name, freq, clear_on_fail) as lk:
             if not lk:
                 raise LockFailure("Failed to acquire lock for %s" % name)
@@ -158,9 +158,10 @@ class Runners(object):
                 LOG.debug("Running %s with args %s using lock %s",
                           functor, args, lk)
                 if isinstance(args, (dict)):
-                    return functor(**args)
+                    results = functor(**args)
                 else:
-                    return functor(*args)
+                    results = functor(*args)
+                return (True, results)
 
 
 class ContentHandlers(object):

From 36638c72f19bfbfb0356cbea87e8bf8468b458bb Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 11:05:11 -0700
Subject: [PATCH 209/434] Add the ability to check if the metadata service is
 up before actually using it.

1. This is very useful for testing (until we have boto timeout in a more sane manner)
---
 cloudinit/sources/DataSourceCloudStack.py | 51 +++++++++++++++++++++--
 1 file changed, 48 insertions(+), 3 deletions(-)

diff --git a/cloudinit/sources/DataSourceCloudStack.py b/cloudinit/sources/DataSourceCloudStack.py
index 27217e65..b1817654 100644
--- a/cloudinit/sources/DataSourceCloudStack.py
+++ b/cloudinit/sources/DataSourceCloudStack.py
@@ -30,6 +30,7 @@ import boto.utils as boto_utils
 
 from cloudinit import log as logging
 from cloudinit import sources
+from cloudinit import url_helper as uhelp
 from cloudinit import util
 
 LOG = logging.getLogger(__name__)
@@ -63,6 +64,48 @@ class DataSourceCloudStack(sources.DataSource):
     def __str__(self):
         return util.obj_name(self)
 
+    def _get_url_settings(self):
+        mcfg = self.ds_cfg
+        if not mcfg:
+            mcfg = {}
+        max_wait = 120
+        try:
+            max_wait = int(mcfg.get("max_wait", max_wait))
+        except Exception:
+            util.logexc(LOG, "Failed to get max wait. using %s", max_wait)
+
+        if max_wait == 0:
+            return False
+
+        timeout = 50
+        try:
+            timeout = int(mcfg.get("timeout", timeout))
+        except Exception:
+            util.logexc(LOG, "Failed to get timeout, using %s", timeout)
+
+        return (max_wait, timeout)
+
+    def wait_for_metadata_service(self):
+        mcfg = self.ds_cfg
+        if not mcfg:
+            mcfg = {}
+
+        (max_wait, timeout) = self._get_url_settings()
+
+        urls = [self.metadata_address]
+        start_time = time.time()
+        url = uhelp.wait_for_url(urls=urls, max_wait=max_wait,
+                                timeout=timeout, status_cb=LOG.warn)
+
+        if url:
+            LOG.info("Using metadata source: '%s'", url)
+        else:
+            LOG.critical(("Giving up on waiting for the metadata from %s"
+                          " after %s seconds"),
+                          urls, int(time.time() - start_time))
+
+        return bool(url)
+
     def get_data(self):
         seed_ret = {}
         if util.read_optional_seed(seed_ret, base=(self.seed_dir + "/")):
@@ -71,13 +114,15 @@ class DataSourceCloudStack(sources.DataSource):
             LOG.debug("Using seeded cloudstack data from: %s", self.seed_dir)
             return True
         try:
-            start = time.time()
+            if not self.wait_for_metadata_service():
+                return False
+            start_time = time.time()
             self.userdata_raw = boto_utils.get_instance_userdata(self.api_ver,
                 None, self.metadata_address)
             self.metadata = boto_utils.get_instance_metadata(self.api_ver,
                 self.metadata_address)
-            tot_time = (time.time() - start)
-            LOG.debug("Crawl of metadata service took %s", int(tot_time))
+            LOG.debug("Crawl of metadata service took %s seconds", 
+                      int(time.time() - start_time))
             return True
         except Exception:
             util.logexc(LOG, ('Failed fetching from metadata '

From b37af29192c8d2a14dca5c858deb6d4778928256 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 11:05:54 -0700
Subject: [PATCH 210/434] Syntax + comment cleanups.

---
 cloudinit/sources/DataSourceEc2.py | 20 ++++++++++++++------
 1 file changed, 14 insertions(+), 6 deletions(-)

diff --git a/cloudinit/sources/DataSourceEc2.py b/cloudinit/sources/DataSourceEc2.py
index c2c3b9b7..55447102 100644
--- a/cloudinit/sources/DataSourceEc2.py
+++ b/cloudinit/sources/DataSourceEc2.py
@@ -31,8 +31,15 @@ from cloudinit import url_helper as uhelp
 from cloudinit import util
 
 LOG = logging.getLogger(__name__)
+
 DEF_MD_URL = "http://169.254.169.254"
+
+# Which version we are requesting of the ec2 metadata apis
 DEF_MD_VERSION = '2009-04-04'
+
+# Default metadata urls that will be used if none are provided
+# They will be checked for 'resolveability' and some of the 
+# following may be discarded if they do not resolve
 DEF_MD_URLS = [DEF_MD_URL, "http://instance-data:8773"]
 
 
@@ -57,13 +64,13 @@ class DataSourceEc2(sources.DataSource):
         try:
             if not self.wait_for_metadata_service():
                 return False
-            start = time.time()
+            start_time = time.time()
             self.userdata_raw = boto_utils.get_instance_userdata(self.api_ver,
                 None, self.metadata_address)
             self.metadata = boto_utils.get_instance_metadata(self.api_ver,
                 self.metadata_address)
-            tot_time = int(time.time() - start)
-            LOG.debug("Crawl of metadata service took %s", tot_time)
+            LOG.debug("Crawl of metadata service took %s seconds", 
+                       int(time.time() - start_time))
             return True
         except Exception:
             util.logexc(LOG, "Failed reading from metadata address %s",
@@ -126,6 +133,7 @@ class DataSourceEc2(sources.DataSource):
             timeout = int(mcfg.get("timeout", timeout))
         except Exception:
             util.logexc(LOG, "Failed to get timeout, using %s", timeout)
+
         return (max_wait, timeout)
 
     def wait_for_metadata_service(self):
@@ -156,15 +164,15 @@ class DataSourceEc2(sources.DataSource):
             urls.append(cur)
             url2base[cur] = url
 
-        starttime = time.time()
+        start_time = time.time()
         url = uhelp.wait_for_url(urls=urls, max_wait=max_wait,
                                 timeout=timeout, status_cb=LOG.warn)
 
         if url:
             LOG.info("Using metadata source: '%s'", url2base[url])
         else:
-            LOG.critical("Giving up on md from %s after %i seconds",
-                            urls, int(time.time() - starttime))
+            LOG.critical("Giving up on md from %s after %s seconds",
+                            urls, int(time.time() - start_time))
 
         self.metadata_address = url2base.get(url)
         return bool(url)

From 5ae507a6a7fa5c33ff70b4428f4851fc4aa5a331 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 11:06:14 -0700
Subject: [PATCH 211/434] Clean up some of the logging (it's a little too
 verbose).

---
 cloudinit/sources/__init__.py | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 831f97ea..a227e050 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -169,13 +169,13 @@ def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
     LOG.info("Searching for data source in: %s", ds_names)
 
     for cls in ds_list:
-        ds = util.obj_name(cls)
         try:
+            LOG.debug("Seeing if we can get any data from %s", cls)
             s = cls(sys_cfg, distro, paths)
             if s.get_data():
-                return (s, ds)
+                return (s, util.obj_name(cls))
         except Exception:
-            util.logexc(LOG, "Getting data from %s failed", ds)
+            util.logexc(LOG, "Getting data from %s failed", cls)
 
     msg = "Did not find any data source, searched classes: %s" % (ds_names)
     raise DataSourceNotFoundException(msg)
@@ -188,7 +188,7 @@ def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
 def list_sources(cfg_list, depends, pkg_list):
     src_list = []
     LOG.info(("Looking for for data source in: %s,"
-              " %s that matches %s"), cfg_list, pkg_list, depends)
+              " via packages %s that matches dependencies %s"), cfg_list, pkg_list, depends)
     for ds_coll in cfg_list:
         ds_name = str(ds_coll)
         if not ds_name.startswith(DS_PREFIX):
@@ -209,8 +209,8 @@ def list_sources(cfg_list, depends, pkg_list):
             if not cls_matches:
                 continue
             src_list.extend(cls_matches)
-            LOG.debug(("Found a match for data source %s"
-                       " in %s with matches %s"), ds_name, mod, cls_matches)
+            LOG.debug(("Found a match"
+                       " in %s with matches %s"), mod, cls_matches)
             break
     return src_list
 

From 4bea73e8fba5f29df4a03ce28dcaa396406ae647 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 11:06:32 -0700
Subject: [PATCH 212/434] Fix pylint error about the rmlist variable name being
 mis-named.

---
 cloudinit/stages.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 2c610ce5..6eb211db 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -128,7 +128,7 @@ class Init(object):
 
     def purge_cache(self, rm_instance_lnk=True):
         rm_list = []
-        rmlist.append(self.paths.boot_finished)
+        rm_list.append(self.paths.boot_finished)
         if rm_instance_lnk:
             rm_list.append(self.paths.instance_link)
         for f in rm_list:

From 5d59fe0e6767694741b37e4dd2225e1380ce077d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 11:06:49 -0700
Subject: [PATCH 213/434] Cleanup pylint warning about line length.

---
 cloudinit/url_helper.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 0376450f..c69da1bb 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -86,7 +86,8 @@ def readurl(url, data=None, timeout=None,
 
     excepts = []
     LOG.info(("Attempting to open '%s' with %s attempts"
-                " (%s retries, timeout=%s) to be performed"), url, attempts, retries, timeout)
+                " (%s retries, timeout=%s) to be performed"), 
+             url, attempts, retries, timeout)
     open_args = {}
     if timeout is not None:
         open_args['timeout'] = int(timeout)

From 1d39ae0d94d0c72ab3c18b3d3ee4afc79078704f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 11:07:05 -0700
Subject: [PATCH 214/434] 1. Continue working on main 'init' method 2. Add the
 ability to take in multiple extra config files (mainly for debugging) 3. Move
 'simple' welcome message to this file 4. Only setup initial basic logging if
 '-d' option is provided.

---
 bin/cloud-init2.py | 134 ++++++++++++++++++++++++++++++++-------------
 1 file changed, 96 insertions(+), 38 deletions(-)

diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
index 6663379f..0e6a75da 100755
--- a/bin/cloud-init2.py
+++ b/bin/cloud-init2.py
@@ -32,12 +32,12 @@ possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
 if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
     sys.path.insert(0, possible_topdir)
 
-
 from cloudinit import log as logging
 from cloudinit import netinfo
 from cloudinit import settings
 from cloudinit import sources
 from cloudinit import stages
+from cloudinit import templater
 from cloudinit import util
 from cloudinit import version
 
@@ -49,58 +49,58 @@ QUERY_DATA_TYPES = [
     'instance_id',
 ]
 
-LOG = logging.getLogger(__name__)
+LOG = logging.getLogger()
 
 
-def read_write_cmdline_url(target_fn):
-    if not os.path.exists(target_fn):
-        try:
-            (key, url, content) = util.get_cmdline_url()
-        except:
-            util.logexc(LOG, "Failed fetching command line url")
-            return
-        try:
-            if key and content:
-                util.write_file(target_fn, content, mode=0600)
-                LOG.info(("Wrote to %s with contents of command line"
-                          " url %s (len=%s)"), target_fn, url, len(content))
-            elif key and not content:
-                LOG.info(("Command line key %s with url"
-                          " %s had no contents"), key, url)
-        except:
-            util.logexc(LOG, "Failed writing url content to %s", target_fn)
+def warn(wstr):
+    sys.stderr.write("WARN: %s\n" % (wstr))
 
 
-def main_init(args):
+def welcome(action):
+    msg = ("Cloud-init v. {{version}} running '{{action}}' at "
+           "{{timestamp}}. Up {{uptime}} seconds.")
+    tpl_params = {
+        'version': version.version_string(),
+        'uptime': util.uptime(),
+        'timestamp': util.time_rfc2822(),
+        'action': action,
+    }
+    welcome_msg = "%s" % (templater.render_string(msg, tpl_params))
+    sys.stderr.write("%s\n" % (welcome_msg))
+    sys.stderr.flush()
+    LOG.info(welcome_msg)
+
+
+def main_init(name, args):
     deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
     if args.local:
         deps = [sources.DEP_FILESYSTEM]
 
-    cfg_path = None
-    if args.file:
+    cfg_extra_paths = []
+    if args.files:
         # Already opened so lets just pass that along
         # since it would of broke if it couldn't have
         # read that file
-        cfg_path = str(args.file.name)
+        for f in args.files:
+            cfg_extra_paths.append(f.name)
 
     if not args.local:
-        # What is this for??
+        # TODO: What is this for??
         root_name = "%s.d" % (settings.CLOUD_CONFIG)
         target_fn = os.path.join(root_name, "91_kernel_cmdline_url.cfg")
-        read_write_cmdline_url(target_fn)
-    
-    # Cloud-init 'init' stage is broken up into the following stages
+        util.read_write_cmdline_url(target_fn)
+
+    # Cloud-init 'init' stage is broken up into the following sub-stages
     # 1. Ensure that the init object fetches its config without errors
     # 2. Setup logging/output redirections with resultant config (if any)
     # 3. Initialize the cloud-init filesystem
     # 4. Check if we can stop early by looking for various files
     # 5. Fetch the datasource
-    # 6. Consume the userdata (handlers get activated here)
-    # 7. Adjust any subsequent logging/output redirections
-    # 8. Run the transforms for the 'init' stage
-    # 9. Done!
-    now = util.time_rfc2822()
-    uptime = util.uptime()
+    # 6. Connect to the current instance location + update the cache
+    # 7. Consume the userdata (handlers get activated here)
+    # 8. Adjust any subsequent logging/output redirections
+    # 9. Run the transforms for the 'init' stage
+    # 10. Done!
     init = stages.Init(deps)
     # Stage 1
     init.read_cfg()
@@ -122,13 +122,70 @@ def main_init(args):
     # Stage 4
     path_helper = init.paths
     if not args.local:
-        nonet_path = "%s/%s" % (cloudinit.get_cpath("data"), "no-net")
+        sys.stderr.write("%s\n" % (netinfo.debug_info()))
+        LOG.debug(("Checking to see if files that we need already"
+                   " exist from a previous run that would allow us"
+                   " to stop early."))
+        stop_files = [
+            os.path.join(path_helper.get_cpath("data"), "no-net"),
+            path_helper.get_ipath_cur("obj_pkl"),
+        ]
+        existing_files = []
+        for fn in stop_files:
+            try:
+                c = util.load_file(fn)
+                if len(c):
+                    existing_files.append((fn, len(c)))
+            except Exception as e:
+                pass
+        if existing_files:
+            LOG.debug("Exiting early due to the existence of %s", existing_files)
+            return 0
+    else:
+        # The cache is not instance specific, so it has to be purged
+        # but we want 'start' to benefit from a cache if
+        # a previous start-local populated one...
+        manual_clean = util.get_cfg_option_bool(init.cfg,
+                                                'manual_cache_clean', False)
+        if manual_clean:
+            LOG.debug("Not purging instance link, manual cleaning enabled")
+            init.purge_cache(False)
+        else:
+            init.purge_cache()
+        # Delete the non-net file as well
+        util.del_fie(os.path.join(path_helper.get_cpath("data"), "no-net"))
+    # Stage 5
+    welcome(name)
+    try:
+        init.fetch()
+    except sources.DataSourceNotFoundException as e:
+        util.logexc(LOG, "No instance datasource found")
+        warn("No instance datasource found: %s" % (e))
+        # TODO: Return 0 or 1??
+        return 1
+    # Stage 6
+    iid = init.instancify()
+    LOG.debug("%s will now be targeting instance id: %s", name, iid)
+    init.update()
+    # Stage 7
+    try:
+        (ran, _results) = init.cloudify().run('consume_userdata',
+                                             init.consume,
+                                             args=[settings.PER_INSTANCE],
+                                             freq=settings.PER_INSTANCE)
+        if not ran:
+            init.consume(settings.ALWAYS)
+    except Exception as e:
+        warn("Consuming user data failed: %s" % (e))
+        raise
+    # Stage 8
+    
 
-def main_config(args):
+def main_config(name, args):
     pass
 
 
-def main_final(args):
+def main_final(name, args):
     pass
 
 
@@ -136,7 +193,8 @@ def main():
     parser = argparse.ArgumentParser()
     parser.add_argument('--version', '-v', action='version', 
                         version='%(prog)s ' + (version.version_string()))
-    parser.add_argument('--file', '-f', action='store', 
+    parser.add_argument('--file', '-f', action='append', 
+                        dest='files',
                         help='additional configuration file to include',
                         type=argparse.FileType('rb'))
     parser.add_argument('--debug', '-d', action='store_true', 
@@ -175,7 +233,7 @@ def main():
         'final': main_final,
     }
     func = stage_mp.get(stage_name)
-    return func(args)
+    return func(stage_name, args)
 
 
 if __name__ == '__main__':

From 60240524195d865c872b10d20f923f0b55b7c777 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 11:17:08 -0700
Subject: [PATCH 215/434] Passed along the extra config paths

---
 bin/cloud-init2.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
index 0e6a75da..e1757af4 100755
--- a/bin/cloud-init2.py
+++ b/bin/cloud-init2.py
@@ -103,7 +103,7 @@ def main_init(name, args):
     # 10. Done!
     init = stages.Init(deps)
     # Stage 1
-    init.read_cfg()
+    init.read_cfg(cfg_extra_paths)
     # Stage 2
     try:
         util.fixup_output(init.cfg, 'init')

From 11224afb2a99706f4c6a872212656d0c47205247 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 11:24:21 -0700
Subject: [PATCH 216/434] Add a mock ec2 metadata server that can be used for
 testing

---
 tools/mock-meta.py | 327 +++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 327 insertions(+)
 create mode 100755 tools/mock-meta.py

diff --git a/tools/mock-meta.py b/tools/mock-meta.py
new file mode 100755
index 00000000..019a24f2
--- /dev/null
+++ b/tools/mock-meta.py
@@ -0,0 +1,327 @@
+#!/usr/bin/python
+
+# Provides a somewhat random, somewhat compat, somewhat useful mock version of
+#
+# http://docs.amazonwebservices.com/AWSEC2/2007-08-29/DeveloperGuide/AESDG-chapter-instancedata.html
+
+import functools
+import httplib
+import logging
+import sys
+import string
+import random
+import yaml
+
+from optparse import OptionParser
+
+from BaseHTTPServer import (HTTPServer, BaseHTTPRequestHandler)
+
+log = logging.getLogger('meta-server')
+
+# Constants
+EC2_VERSIONS = [
+    '1.0',
+    '2007-01-19',
+    '2007-03-01',
+    '2007-08-29',
+    '2007-10-10',
+    '2007-12-15',
+    '2008-02-01',
+    '2008-09-01',
+    '2009-04-04',
+    'latest',
+]
+
+BLOCK_DEVS = [
+    'ami',
+    'root',
+    'ephemeral0',
+]
+
+DEV_PREFIX = 'v'
+DEV_MAPPINGS = {
+    'ephemeral0': '%sda2' % (DEV_PREFIX),
+    'root': '/dev/%sda1' % (DEV_PREFIX),
+    'ami': '%sda1' % (DEV_PREFIX),
+    'swap': '%sda3' % (DEV_PREFIX),
+}
+
+META_CAPABILITIES = [
+    'aki-id',
+    'ami-id',
+    'ami-launch-index',
+    'ami-manifest-path',
+    'ari-id',
+    'block-device-mapping/',
+    'hostname',
+    'instance-action',
+    'instance-id',
+    'instance-type',
+    'local-hostname',
+    'local-ipv4',
+    'placement/',
+    'product-codes',
+    'public-hostname',
+    'public-ipv4',
+    'reservation-id',
+    'security-groups'
+]
+
+INSTANCE_TYPES = [
+    'm1.small',
+    'm1.medium',
+    'm1.large',
+    'm1.xlarge',
+]
+
+AVAILABILITY_ZONES = [
+    "us-east-1a",
+    "us-east-1b",
+    "us-east-1c",
+    'us-west-1',
+    "us-east-1d",
+    'eu-west-1a',
+    'eu-west-1b',
+]
+
+PLACEMENT_CAPABILITIES = {
+    'availability-zone': AVAILABILITY_ZONES,
+}
+
+
+class WebException(Exception):
+    def __init__(self, code, msg):
+        Exception.__init__(self, msg)
+        self.code = code
+
+
+def yamlify(data):
+    formatted = yaml.dump(data,
+        line_break="\n",
+        indent=4,
+        explicit_start=True,
+        explicit_end=True,
+        default_flow_style=False)
+    return formatted
+
+
+def format_text(text):
+    if not len(text):
+        return "<<"
+    lines = text.splitlines()
+    nlines = []
+    for line in lines:
+        nlines.append("<< %s" % line)
+    return "\n".join(nlines)
+
+
+ID_CHARS = [c for c in (string.ascii_uppercase + string.digits)]
+def id_generator(size=6, lower=False):
+    txt = ''.join(random.choice(ID_CHARS) for x in range(size))
+    if lower:
+        return txt.lower()
+    else:
+        return txt
+
+
+class MetaDataHandler(object):
+
+    def __init__(self, opts):
+        self.opts = opts
+        self.instances = {}
+
+    def get_data(self, params, who, **kwargs):
+        if not params:
+            caps = sorted(META_CAPABILITIES)
+            return "\n".join(caps)
+        action = params[0]
+        action = action.lower()
+        if action == 'instance-id':
+            return 'i-%s' % (id_generator(lower=True))
+        elif action == 'ami-launch-index':
+            return "%s" % random.choice([0,1,2,3])
+        elif action == 'aki-id':
+            return 'aki-%s' % (id_generator(lower=True))
+        elif action == 'ami-id':
+            return 'ami-%s' % (id_generator(lower=True))
+        elif action == 'ari-id':
+            return 'ari-%s' % (id_generator(lower=True))
+        elif action == 'block-device-mapping':
+            nparams = params[1:]
+            if not nparams:
+                devs = sorted(BLOCK_DEVS)
+                return "\n".join(devs)
+            else:
+                return "%s" % (DEV_MAPPINGS.get(nparams[0].strip(), ''))
+        elif action in ['hostname', 'local-hostname', 'public-hostname']:
+            return "%s" % (who)
+        elif action == 'instance-type':
+            return random.choice(INSTANCE_TYPES)
+        elif action == 'ami-manifest-path':
+            return 'my-amis/spamd-image.manifest.xml'
+        elif action == 'security-groups':
+            return 'default'
+        elif action in ['local-ipv4', 'public-ipv4']:
+            there_ip = kwargs.get('client_ip', '10.0.0.1')
+            return "%s" % (there_ip)
+        elif action == 'reservation-id':
+            return "r-%s" % (id_generator(lower=True))
+        elif action == 'product-codes':
+            return "%s" % (id_generator(size=8))
+        elif action == 'placement':
+            nparams = params[1:]
+            if not nparams:
+                pcaps = sorted(PLACEMENT_CAPABILITIES.keys())
+                return "\n".join(pcaps)
+            else:
+                pentry = nparams[0].strip().lower()
+                if pentry == 'availability-zone':
+                    zones = PLACEMENT_CAPABILITIES[pentry]
+                    return "%s" % random.choice(zones)
+                else:
+                    return "%s" % (PLACEMENT_CAPABILITIES.get(pentry, ''))
+        else:
+            return ''
+
+class UserDataHandler(object):
+
+    def __init__(self, opts):
+        self.opts = opts
+
+    def _get_user_blob(self, **kwargs):
+        blob_mp = {}
+        blob_mp['hostname'] = kwargs.get('who', '')
+        lines = []
+        lines.append("#cloud-config")
+        lines.append(yamlify(blob_mp))
+        blob = "\n".join(lines)
+        return blob.strip()
+
+    def get_data(self, params, who, **kwargs):
+        if not params:
+            return self._get_user_blob(who=who)
+        return ''
+
+
+# Seem to need to use globals since can't pass 
+# data into the request handlers instances...
+# Puke!
+meta_fetcher = None
+user_fetcher = None
+
+
+class Ec2Handler(BaseHTTPRequestHandler):
+
+    def _get_versions(self):
+        versions = []
+        for v in EC2_VERSIONS:
+            if v == 'latest':
+                continue
+            else:
+                versions.append(v)
+        versions = sorted(versions)
+        return "\n".join(versions)
+
+    def log_message(self, format, *args):
+        msg = "%s - %s" % (self.address_string(), format % (args))
+        log.info(msg)
+
+    def _find_method(self, path):
+        # Puke! (globals)
+        global meta_fetcher
+        global user_fetcher
+        func_mapping = {
+            'user-data': user_fetcher.get_data,
+            'meta-data': meta_fetcher.get_data,
+        }
+        segments = [piece for piece in path.split('/') if len(piece)]
+        if not segments:
+            return self._get_versions
+        date = segments[0].strip().lower()
+        if date not in EC2_VERSIONS:
+            raise WebException(httplib.BAD_REQUEST, "Unknown date format %r" % date)
+        if len(segments) < 2:
+            raise WebException(httplib.BAD_REQUEST, "No action provided")
+        look_name = segments[1].lower()
+        if look_name not in func_mapping:
+            raise WebException(httplib.BAD_REQUEST, "Unknown requested data %r" % look_name)
+        base_func = func_mapping[look_name]
+        who = self.address_string()
+        kwargs = {
+            'params': list(segments[2:]),
+            'who': self.address_string(),
+            'client_ip': self.client_address[0],
+        }
+        return functools.partial(base_func, **kwargs)
+
+    def _do_response(self):
+        who = self.client_address
+        log.info("Got a call from %s for path %s", who, self.path)
+        try:
+            func = self._find_method(self.path)
+            log.info("Calling into func %s to get your data.", func)
+            data = func()
+            if not data:
+                data = ''
+            self.send_response(httplib.OK)
+            self.send_header("Content-Type", "binary/octet-stream")
+            self.send_header("Content-Length", len(data))
+            log.info("Sending data (len=%s):\n%s", len(data), format_text(data))
+            self.end_headers()
+            self.wfile.write(data)
+        except RuntimeError as e:
+            log.exception("Error somewhere in the server.")
+            self.send_error(httplib.INTERNAL_SERVER_ERROR, message=str(e))
+        except WebException as e:
+            code = e.code
+            log.exception(str(e))
+            self.send_error(code, message=str(e))
+
+    def do_GET(self):
+        self._do_response()
+
+    def do_POST(self):
+        self._do_response()
+
+
+def setup_logging(log_level, format='%(levelname)s: @%(name)s : %(message)s'):
+    root_logger = logging.getLogger()
+    console_logger = logging.StreamHandler(sys.stdout)
+    console_logger.setFormatter(logging.Formatter(format))
+    root_logger.addHandler(console_logger)
+    root_logger.setLevel(log_level)
+
+
+def extract_opts():
+    parser = OptionParser()
+    parser.add_option("-p", "--port", dest="port", action="store", type=int, default=80,
+                  help="port from which to serve traffic (default: %default)", metavar="PORT")
+    (options, args) = parser.parse_args()
+    out = dict()
+    out['extra'] = args
+    out['port'] = options.port
+    return out
+
+
+def setup_fetchers(opts):
+    global meta_fetcher
+    global user_fetcher
+    meta_fetcher = MetaDataHandler(opts)
+    user_fetcher = UserDataHandler(opts)
+
+
+def run_server():
+    # Using global here since it doesn't seem like we 
+    # can pass opts into a request handler constructor...
+    opts = extract_opts()
+    setup_logging(logging.DEBUG)
+    setup_fetchers(opts)
+    log.info("CLI opts: %s", opts)
+    server = HTTPServer(('0.0.0.0', opts['port']), Ec2Handler)
+    sa = server.socket.getsockname()
+    log.info("Serving server on %s using port %s ...", sa[0], sa[1])
+    server.serve_forever()
+
+
+if __name__ == '__main__':
+    run_server()

From a15bf4a716a9f0c644f67b2b9325f0086b54130c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 12:16:51 -0700
Subject: [PATCH 217/434] Small logging changes.

---
 bin/cloud-init2.py | 13 ++++++-------
 1 file changed, 6 insertions(+), 7 deletions(-)

diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
index e1757af4..d80ee1ec 100755
--- a/bin/cloud-init2.py
+++ b/bin/cloud-init2.py
@@ -106,9 +106,9 @@ def main_init(name, args):
     init.read_cfg(cfg_extra_paths)
     # Stage 2
     try:
-        util.fixup_output(init.cfg, 'init')
+        util.fixup_output(init.cfg, name)
     except:
-        util.logexc(LOG, "Failed to setup output redirection")
+        util.logexc(LOG, "Failed to setup output redirection!")
     if args.debug:
         # Reset so that all the debug handlers are closed out
         LOG.debug("Logging being reset, this logger may no longer be active shortly")
@@ -118,7 +118,7 @@ def main_init(name, args):
     try:
         init.initialize()
     except Exception as e:
-        util.logexc(LOG, "Failed to initialize, likely bad things to come: %s", e)
+        util.logexc(LOG, "Failed to initialize, likely bad things to come!")
     # Stage 4
     path_helper = init.paths
     if not args.local:
@@ -159,8 +159,7 @@ def main_init(name, args):
     try:
         init.fetch()
     except sources.DataSourceNotFoundException as e:
-        util.logexc(LOG, "No instance datasource found")
-        warn("No instance datasource found: %s" % (e))
+        util.logexc(LOG, "No instance datasource found!")
         # TODO: Return 0 or 1??
         return 1
     # Stage 6
@@ -176,8 +175,8 @@ def main_init(name, args):
         if not ran:
             init.consume(settings.ALWAYS)
     except Exception as e:
-        warn("Consuming user data failed: %s" % (e))
-        raise
+        util.logexc(LOG, "Consuming user data failed!")
+        return 1
     # Stage 8
     
 

From f237072a416c77193e4e6ea40272f44cd2fc9c5a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 12:17:06 -0700
Subject: [PATCH 218/434] Cleanup no datasource exception to use cleaner csv
 list.

---
 cloudinit/sources/__init__.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index a227e050..128d4aad 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -177,7 +177,8 @@ def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
         except Exception:
             util.logexc(LOG, "Getting data from %s failed", cls)
 
-    msg = "Did not find any data source, searched classes: %s" % (ds_names)
+    msg = ("Did not find any data source,"
+           " searched classes: (%s)") % (", ".join(ds_names))
     raise DataSourceNotFoundException(msg)
 
 

From aebe5cc3165f1bc48bbfbbfe3d0821c3271a8e70 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 15:39:01 -0700
Subject: [PATCH 219/434] Fix pylint line length issues.

---
 cloudinit/sources/__init__.py | 9 +++++----
 1 file changed, 5 insertions(+), 4 deletions(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 128d4aad..35fc01df 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -182,14 +182,15 @@ def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
     raise DataSourceNotFoundException(msg)
 
 
-# return a list of classes that have the same depends as 'depends'
-# iterate through cfg_list, loading "DataSourceCollections" modules
+# Return a list of classes that have the same depends as 'depends'
+# iterate through cfg_list, loading "DataSource*" modules
 # and calling their "get_datasource_list".
-# return an ordered list of classes that match
+# Return an ordered list of classes that match (if any)
 def list_sources(cfg_list, depends, pkg_list):
     src_list = []
     LOG.info(("Looking for for data source in: %s,"
-              " via packages %s that matches dependencies %s"), cfg_list, pkg_list, depends)
+              " via packages %s that matches dependencies %s"),
+             cfg_list, pkg_list, depends)
     for ds_coll in cfg_list:
         ds_name = str(ds_coll)
         if not ds_name.startswith(DS_PREFIX):

From df98d0b50a411a2d14b9e55518c8e6ff6886c808 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 15:39:54 -0700
Subject: [PATCH 220/434] 1. Cleanup variable names to match more of the
 pythonic underscore pattern 2. Separate config loading from the actual final
 'merging' process.    a. A util function will now merge multiple config
 dictionaries after they have all been loaded instead of       loading and
 merging at the same time, which can get confusing to follow.

---
 cloudinit/stages.py | 85 ++++++++++++++++++++++++---------------------
 cloudinit/util.py   | 11 ++++++
 2 files changed, 57 insertions(+), 39 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 6eb211db..558de035 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -156,20 +156,27 @@ class Init(object):
         # None check so that we don't keep on re-loading if empty
         if self._cfg is None:
             self._cfg = self._read_cfg(extra_fns)
-            LOG.debug("Loaded init config %s", self._cfg)
+            LOG.debug("Loaded %s config %s", util.obj_name(self), self._cfg)
 
     def _read_cfg(self, extra_fns):
-        builtin_cfg = util.get_builtin_cfg()
-        try:
-            conf = util.get_base_cfg(builtin=builtin_cfg)
-        except Exception:
-            conf = builtin_cfg
-        m_cfg = util.mergedict(conf, self._read_cfg_old())
+        # Read extra files provided (if any)
+        i_cfgs = []
         if extra_fns:
             for fn in extra_fns:
-                # Any extras over-ride the existing configs
-                m_cfg = util.mergedict(util.read_conf(fn), m_cfg)
-        return m_cfg
+                try:
+                    fn_cfg = util.read_conf(fn)
+                    i_cfgs.append(fn_cfg)
+                except:
+                    util.logexc(LOG, ("Failed loading of additional"
+                                      " configuration from %s"), fn)
+        # Now read in the built-in + base + old
+        try:
+            conf = util.get_base_cfg(builtin=util.get_builtin_cfg())
+        except Exception:
+            conf = util.get_builtin_cfg()
+        i_cfgs.append(conf)
+        i_cfgs.append(self._read_cfg_old())
+        return util.mergemanydict(i_cfgs)
 
     def _restore_from_cache(self):
         pickled_fn = self.paths.get_ipath_cur('obj_pkl')
@@ -371,46 +378,46 @@ class Init(object):
 
 
 class Transforms(object):
-    def __init__(self, init, cfgfile=None):
+    def __init__(self, init, cfg_files=None):
         self.datasource = init.fetch()
-        self.cfgfile = cfgfile
-        self.basecfg = copy.deepcopy(init.cfg)
+        self.cfg_files = cfg_files
+        self.base_cfg = copy.deepcopy(init.cfg)
         self.init = init
         # Created on first use
-        self._cachedcfg = None
+        self._cached_cfg = None
 
     @property
     def cfg(self):
-        if self._cachedcfg is None:
-            self._cachedcfg = self._get_config(self.cfgfile)
-            LOG.debug("Loading module config %s", self._cachedcfg)
-        return self._cachedcfg
+        # None check to avoid empty case
+        if self._cached_cfg is None:
+            self._cached_cfg = self._get_config()
+            LOG.debug("Loading %s config %s",
+                      util.obj_name(self), self._cached_cfg)
+        return self._cached_cfg
 
-    def _get_config(self, cfgfile):
-        mcfg = None
+    def _get_config(self):
+        t_cfgs = []
+        if self.cfg_files:
+            for fn in self.cfg_files:
+                try:
+                    t_cfgs.append(util.read_conf(fn))
+                except:
+                    util.logexc(LOG, ("Failed loading of configuration"
+                                       " from %s"), fn)
 
-        if self.cfgfile:
+        if self.datasource:
             try:
-                mcfg = util.read_conf(cfgfile)
+                d_cfg = self.datasource.get_config_obj()
+                if d_cfg:
+                    t_cfgs.append(d_cfg)
             except:
-                util.logexc(LOG, ("Failed loading of cloud config '%s'. "
-                                  "Continuing with an empty config."), cfgfile)
-        if not mcfg:
-            mcfg = {}
+                util.logexc(LOG, ("Failed loading of datasource"
+                                  " config object from %s"), self.datasource)
+        
+        if self.base_cfg:
+            t_cfgs.append(self.base_cfg)
 
-        ds_cfg = None
-        try:
-            ds_cfg = self.datasource.get_config_obj()
-        except:
-            util.logexc(LOG, "Failed loading of datasource config object.")
-        if not ds_cfg:
-            ds_cfg = {}
-
-        mcfg = util.mergedict(mcfg, ds_cfg)
-        if self.basecfg:
-            return util.mergedict(mcfg, self.basecfg)
-        else:
-            return mcfg
+        return util.mergemanydict(t_cfgs)
 
 
     def _read_transforms(self, name):
diff --git a/cloudinit/util.py b/cloudinit/util.py
index 164bcea8..91d20a76 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -360,6 +360,7 @@ def get_cfg_by_path(yobj, keyp, default=None):
 def fixup_output(cfg, mode):
     (outfmt, errfmt) = get_output_cfg(cfg, mode)
     redirect_output(outfmt, errfmt)
+    return (outfmt, errfmt)
 
 
 # redirect_output(outfmt, errfmt, orig_out, orig_err)
@@ -448,6 +449,16 @@ def obj_name(obj):
     return obj_name(obj.__class__)
 
 
+def mergemanydict(srcs, reverse=False):
+    if reverse:
+        srcs = reversed(srcs)
+    m_cfg = {}
+    for a_cfg in srcs:
+        if a_cfg:
+            m_cfg = mergedict(m_cfg, a_cfg)
+    return m_cfg
+
+
 def mergedict(src, cand):
     """
     Merge values from C{cand} into C{src}.

From 8f93dbabbfb6cf6174c0039b8db24b970a29c8e0 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 15:59:46 -0700
Subject: [PATCH 221/434] Add a return statement that will collect the failures
 and the number of transforms run.

---
 cloudinit/stages.py | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 558de035..d3e61ddc 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -156,7 +156,7 @@ class Init(object):
         # None check so that we don't keep on re-loading if empty
         if self._cfg is None:
             self._cfg = self._read_cfg(extra_fns)
-            LOG.debug("Loaded %s config %s", util.obj_name(self), self._cfg)
+            LOG.debug("Loaded 'init' config %s", self._cfg)
 
     def _read_cfg(self, extra_fns):
         # Read extra files provided (if any)
@@ -391,8 +391,7 @@ class Transforms(object):
         # None check to avoid empty case
         if self._cached_cfg is None:
             self._cached_cfg = self._get_config()
-            LOG.debug("Loading %s config %s",
-                      util.obj_name(self), self._cached_cfg)
+            LOG.debug("Loading 'transform' config %s", self._cached_cfg)
         return self._cached_cfg
 
     def _get_config(self):
@@ -487,6 +486,7 @@ class Transforms(object):
         failures = []
         d_name = self.init.distro.name
         c_cloud = self.init.cloudify()
+        am_ran = 0
         for (mod, name, freq, args) in mostly_mods:
             try:
                 # Try the modules frequency, otherwise fallback to a known one
@@ -503,13 +503,15 @@ class Transforms(object):
                 # Use the transforms logger and not our own
                 func_args = [name, copy.deepcopy(self.cfg),
                              c_cloud, transforms.LOG, args]
+                # Mark it as having started running
+                am_ran += 1
                 # This name will affect the semaphore name created
                 run_name = "config-%s" % (name)
                 c_cloud.run(run_name, mod.handle, func_args, freq=freq)
             except Exception as e:
                 util.logexc(LOG, "Running %s (%s) failed", name, mod)
                 failures.append((name, e))
-        return failures
+        return (am_ran, failures)
 
     def run(self, name):
         raw_mods = self._read_transforms(name)

From cf424230cea52cf83cd35d5ed5e5b0adb5255ccf Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 16:00:17 -0700
Subject: [PATCH 222/434] Get the 'init' stage working.

---
 bin/cloud-init2.py | 74 +++++++++++++++++++++++++++++++++++-----------
 1 file changed, 56 insertions(+), 18 deletions(-)

diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
index d80ee1ec..1f938f01 100755
--- a/bin/cloud-init2.py
+++ b/bin/cloud-init2.py
@@ -42,6 +42,9 @@ from cloudinit import util
 from cloudinit import version
 
 
+# Transform section template
+TR_TPL = "cloud_%s_modules"
+
 # Things u can query on
 QUERY_DATA_TYPES = [
     'data',
@@ -98,26 +101,31 @@ def main_init(name, args):
     # 5. Fetch the datasource
     # 6. Connect to the current instance location + update the cache
     # 7. Consume the userdata (handlers get activated here)
-    # 8. Adjust any subsequent logging/output redirections
-    # 9. Run the transforms for the 'init' stage
-    # 10. Done!
+    # 8. Construct the transform object
+    # 9. Adjust any subsequent logging/output redirections using
+    #    the transform objects configuration
+    # 10. Run the transforms for the 'init' stage
+    # 11. Done!
     init = stages.Init(deps)
     # Stage 1
     init.read_cfg(cfg_extra_paths)
     # Stage 2
+    outfmt = None
+    errfmt = None
     try:
-        util.fixup_output(init.cfg, name)
+        (outfmt, errfmt) = util.fixup_output(init.cfg, name)
     except:
         util.logexc(LOG, "Failed to setup output redirection!")
     if args.debug:
         # Reset so that all the debug handlers are closed out
-        LOG.debug("Logging being reset, this logger may no longer be active shortly")
+        LOG.debug(("Logging being reset, this logger may no"
+                    " longer be active shortly"))
         logging.resetLogging()
     logging.setupLogging(init.cfg)
     # Stage 3
     try:
         init.initialize()
-    except Exception as e:
+    except Exception:
         util.logexc(LOG, "Failed to initialize, likely bad things to come!")
     # Stage 4
     path_helper = init.paths
@@ -136,10 +144,11 @@ def main_init(name, args):
                 c = util.load_file(fn)
                 if len(c):
                     existing_files.append((fn, len(c)))
-            except Exception as e:
+            except Exception:
                 pass
         if existing_files:
-            LOG.debug("Exiting early due to the existence of %s", existing_files)
+            LOG.debug("Exiting early due to the existence of %s files",
+                      existing_files)
             return 0
     else:
         # The cache is not instance specific, so it has to be purged
@@ -153,7 +162,7 @@ def main_init(name, args):
         else:
             init.purge_cache()
         # Delete the non-net file as well
-        util.del_fie(os.path.join(path_helper.get_cpath("data"), "no-net"))
+        util.del_file(os.path.join(path_helper.get_cpath("data"), "no-net"))
     # Stage 5
     welcome(name)
     try:
@@ -173,18 +182,38 @@ def main_init(name, args):
                                              args=[settings.PER_INSTANCE],
                                              freq=settings.PER_INSTANCE)
         if not ran:
-            init.consume(settings.ALWAYS)
+            init.consume(settings.PER_ALWAYS)
     except Exception as e:
         util.logexc(LOG, "Consuming user data failed!")
         return 1
     # Stage 8
-    
+    tr = stages.Transforms(init, cfg_extra_paths)
+    # Stage 9 - TODO is this really needed??
+    try:
+        outfmt_orig = outfmt
+        errfmt_orig = errfmt
+        (outfmt, errfmt) = util.get_output_cfg(tr.cfg, name)
+        if outfmt_orig != outfmt or errfmt_orig != errfmt:
+            LOG.warn("Stdout, stderr changing to (%s, %s)", outfmt, errfmt)
+            (outfmt, errfmt) = util.fixup_output(tr.cfg, name)
+    except:
+        util.logexc(LOG, "Failed to adjust output redirection!")
+    # Stage 10
+    section_name = TR_TPL % (name)
+    (ran_am, failures) = tr.run(section_name)
+    if not ran_am:
+        msg = "No %s transforms to run under section %s" % (name, section_name)
+        sys.stderr.write("%s\n" % (msg))
+        LOG.debug(msg)
+        return 0
+    return len(failures)
 
-def main_config(name, args):
+
+def main_config(_name, _args):
     pass
 
 
-def main_final(name, args):
+def main_final(_name, _args):
     pass
 
 
@@ -202,18 +231,27 @@ def main():
     subparsers = parser.add_subparsers()
 
     # Each action and its suboptions (if any)
-    parser_init = subparsers.add_parser('init', help='initializes cloud-init and performs \'init\' transforms')
+    parser_init = subparsers.add_parser('init', 
+                                        help=('initializes cloud-init and'
+                                              ' performs \'init\' transforms'))
     parser_init.add_argument("--local", '-l', action='store_true',
                              help="start in local mode", default=False)
-    parser_init.set_defaults(action='init')  # This is used so that we can know which action is selected
+    # This is used so that we can know which action is selected
+    parser_init.set_defaults(action='init')
 
-    parser_config = subparsers.add_parser('config', help='performs cloud-init \'config\' transforms')
+    parser_config = subparsers.add_parser('config', 
+                                          help=('performs cloud-init '
+                                                '\'config\' transforms'))
     parser_config.set_defaults(action='config')
 
-    parser_final = subparsers.add_parser('final', help='performs cloud-init \'final\' transforms')
+    parser_final = subparsers.add_parser('final', 
+                                         help=('performs cloud-init '
+                                               '\'final\' transforms'))
     parser_final.set_defaults(action='final')
 
-    parser_query = subparsers.add_parser('query', help='query information stored in cloud-init')
+    parser_query = subparsers.add_parser('query', 
+                                         help=('query information stored '
+                                               'in cloud-init'))
     parser_query.add_argument("--name", action="store",
                               help="item name to query on",
                               required=True,

From 1714be4b27e7f37baf6e98289b4b543d16180992 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 16:13:29 -0700
Subject: [PATCH 223/434] Initial add of read and write roots, this should
 cover a large set of cases that use the path object.

1. This allows configuration to specify a 'read_root', which will be used for read operations (right now just templates),
   and a 'write_root', which will be used for non-read operations (i.e. 'var/lib/cloud' operations, where most of the writing now happens).
---
 cloudinit/helpers.py | 24 ++++++++++++++++++++++--
 1 file changed, 22 insertions(+), 2 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 3fd819b3..3938e7ee 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -206,11 +206,17 @@ class ContentHandlers(object):
 
 class Paths(object):
     def __init__(self, path_cfgs, ds=None):
-        self.cloud_dir = path_cfgs.get('cloud_dir', '/var/lib/cloud')
+        self.cfgs = path_cfgs
+        # Populate all the initial paths
+        self.cloud_dir = self.join_paths(False,
+                                         path_cfgs.get('cloud_dir',
+                                                       '/var/lib/cloud'))
         self.instance_link = os.path.join(self.cloud_dir, 'instance')
         self.boot_finished = os.path.join(self.instance_link, "boot-finished")
         self.upstart_conf_d = path_cfgs.get('upstart_dir')
-        template_dir = path_cfgs.get('templates_dir', '/etc/cloud/templates/')
+        template_dir = self.join_paths(True,
+                                       path_cfgs.get('templates_dir',
+                                                     '/etc/cloud/templates/'))
         self.template_tpl = os.path.join(template_dir, '%s.tmpl')
         self.seed_dir = os.path.join(self.cloud_dir, 'seed')
         self.lookups = {
@@ -227,6 +233,20 @@ class Paths(object):
         # Set when a datasource becomes active
         self.datasource = ds
 
+    # joins the paths but also appends a read 
+    # or write root if available
+    def join_paths(self, read_only, *paths):
+        if read_only:
+            root = self.cfgs.get('read_root', '/')
+        else:
+            root = self.cfgs.get('write_root', '/')
+        if not paths:
+            return root
+        joined = os.path.join(*paths)
+        if root:
+            joined = os.path.join(root, joined.lstrip("/"))
+        return joined
+
     # get_ipath_cur: get the current instance path for an item
     def get_ipath_cur(self, name=None):
         ipath = self.instance_link

From 0431b7e4571714e9ec21f12455818ce4b22d7bc1 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 16:35:49 -0700
Subject: [PATCH 224/434] Use the given module as the root module from which
 the given mod is used.

---
 cloudinit/transforms/__init__.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/transforms/__init__.py b/cloudinit/transforms/__init__.py
index 925cf569..5cd08575 100644
--- a/cloudinit/transforms/__init__.py
+++ b/cloudinit/transforms/__init__.py
@@ -29,7 +29,7 @@ LOG = logging.getLogger(__name__)
 TRANSFORM_PREFIX = ''  # "cc_"
 
 
-def form_transform_name(name):
+def form_transform_name(name, mod=__name__):
     canon_name = name.replace("-", "_")
     if canon_name.lower().endswith(".py"):
         canon_name = canon_name[0:(len(canon_name) - 3)]
@@ -38,7 +38,7 @@ def form_transform_name(name):
         return None
     if not canon_name.startswith(TRANSFORM_PREFIX):
         canon_name = '%s%s' % (TRANSFORM_PREFIX, canon_name)
-    return canon_name
+    return ".".join([str(mod), str(canon_name)])
 
 
 def fixup_transform(mod, def_freq=PER_INSTANCE):

From 05b522b0e1046da3ca1acf60fe741d9ac2e5a136 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 17:58:41 -0700
Subject: [PATCH 225/434] Make most places use the paths join() function so
 that testing with non-real read/write paths is easier.

---
 cloudinit/distros/rhel.py                   |  6 +++-
 cloudinit/distros/ubuntu.py                 |  7 +++--
 cloudinit/helpers.py                        | 34 +++++++++++++--------
 cloudinit/ssh_util.py                       | 10 ++++--
 cloudinit/transforms/apt_pipelining.py      | 15 ++++-----
 cloudinit/transforms/apt_update_upgrade.py  | 21 ++++++++-----
 cloudinit/transforms/ca_certs.py            | 23 ++++++++------
 cloudinit/transforms/chef.py                | 31 +++++++++++++------
 cloudinit/transforms/keys_to_console.py     |  9 +++---
 cloudinit/transforms/landscape.py           | 20 +++++++-----
 cloudinit/transforms/mcollective.py         | 25 ++++++++-------
 cloudinit/transforms/mounts.py              |  6 ++--
 cloudinit/transforms/phone_home.py          |  2 +-
 cloudinit/transforms/puppet.py              | 34 ++++++++++++---------
 cloudinit/transforms/resizefs.py            |  8 ++---
 cloudinit/transforms/rightscale_userdata.py |  1 +
 cloudinit/transforms/rsyslog.py             |  3 +-
 cloudinit/transforms/runcmd.py              |  2 +-
 cloudinit/transforms/salt_minion.py         |  2 ++
 cloudinit/transforms/set_passwords.py       |  4 +--
 cloudinit/transforms/ssh.py                 | 13 +++++---
 21 files changed, 167 insertions(+), 109 deletions(-)

diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index e0ca5909..aef7f6f3 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -73,6 +73,7 @@ class Distro(distros.Distro):
             lines.insert(0, '# Created by cloud-init')
             contents = "\n".join(lines)
             net_fn = NETWORK_FN_TPL % (dev)
+            net_fn = self._paths.join(False, net_fn)
             util.write_file(net_fn, contents, 0644)
 
     def set_hostname(self, hostname):
@@ -104,6 +105,7 @@ class Distro(distros.Distro):
             new_contents.append("# Added by cloud-init")
             new_contents.append("HOSTNAME=%s" % (hostname))
         contents = "\n".join(new_contents)
+        out_fn = self._paths.join(False, out_fn)
         util.write_file(out_fn, contents, 0644)
 
     def update_hostname(self, hostname, prev_file):
@@ -143,6 +145,7 @@ class Distro(distros.Distro):
         return default
 
     def _read_conf(self, filename):
+        filename = self._paths.join(True, filename)
         contents = util.load_file(filename, quiet=True)
         conf_lines = []
         for line in contents.splitlines():
@@ -194,7 +197,8 @@ class Distro(distros.Distro):
             new_contents.append("# Added by cloud-init")
             new_contents.append('ZONE="%s"' % (tz))
         tz_contents = "\n".join(new_contents)
-        util.write_file("/etc/sysconfig/clock", tz_contents)
+        tz_fn = self._paths.join(False, "/etc/sysconfig/clock")
+        util.write_file(tz_fn, tz_contents)
         # This ensures that the correct tz will be used for the system
         util.copy(tz_file, "/etc/localtime")
 
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index 24724d83..94565b14 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -46,7 +46,8 @@ class Distro(distros.Distro):
         self.package_command('install', pkglist)
 
     def _write_network(self, settings):
-        util.write_file("/etc/network/interfaces", settings)
+        n_fn = self._paths.join(False, "/etc/network/interfaces")
+        util.write_file(n_fn, settings)
 
     def set_hostname(self, hostname):
         self._write_hostname(hostname, "/etc/hostname")
@@ -84,6 +85,7 @@ class Distro(distros.Distro):
             util.subp(['hostname', hostname])
 
     def _read_hostname(self, filename, default=None):
+        filename = self._paths.join(True, filename)
         contents = util.load_file(filename, quiet=True)
         for line in contents.splitlines():
             c_pos = line.find("#")
@@ -105,7 +107,8 @@ class Distro(distros.Distro):
             raise Exception(("Invalid timezone %s,"
                              " no file found at %s") % (tz, tz_file))
         tz_contents = "%s\n" % tz
-        util.write_file("/etc/timezone", tz_contents)
+        tz_fn = self._paths.join(False, "/etc/timezone")
+        util.write_file(tz_fn, tz_contents)
         util.copy(tz_file, "/etc/localtime")
 
     def package_command(self, command, args=None):
diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 3938e7ee..9f55a984 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -208,17 +208,18 @@ class Paths(object):
     def __init__(self, path_cfgs, ds=None):
         self.cfgs = path_cfgs
         # Populate all the initial paths
-        self.cloud_dir = self.join_paths(False,
-                                         path_cfgs.get('cloud_dir',
-                                                       '/var/lib/cloud'))
+        self.cloud_dir = self.join(False,
+                                   path_cfgs.get('cloud_dir', 
+                                                 '/var/lib/cloud'))
         self.instance_link = os.path.join(self.cloud_dir, 'instance')
         self.boot_finished = os.path.join(self.instance_link, "boot-finished")
         self.upstart_conf_d = path_cfgs.get('upstart_dir')
-        template_dir = self.join_paths(True,
-                                       path_cfgs.get('templates_dir',
-                                                     '/etc/cloud/templates/'))
-        self.template_tpl = os.path.join(template_dir, '%s.tmpl')
+        if self.upstart_conf_d:
+            self.upstart_conf_d = self.join(False, self.upstart_conf_d)
         self.seed_dir = os.path.join(self.cloud_dir, 'seed')
+        # This one isn't joined, since it should just be read-only
+        template_dir = path_cfgs.get('templates_dir', '/etc/cloud/templates/')
+        self.template_tpl = os.path.join(template_dir, '%s.tmpl')
         self.lookups = {
            "handlers": "handlers",
            "scripts": "scripts",
@@ -235,16 +236,25 @@ class Paths(object):
 
     # joins the paths but also appends a read 
     # or write root if available
-    def join_paths(self, read_only, *paths):
+    def join(self, read_only, *paths):
         if read_only:
-            root = self.cfgs.get('read_root', '/')
+            root = self.cfgs.get('read_root')
         else:
-            root = self.cfgs.get('write_root', '/')
+            root = self.cfgs.get('write_root')
         if not paths:
             return root
-        joined = os.path.join(*paths)
+        if len(paths) > 1:
+            joined = os.path.join(*paths)
+        else:
+            joined = paths[0]
         if root:
-            joined = os.path.join(root, joined.lstrip("/"))
+            pre_joined = joined
+            # Need to remove any starting '/' since this
+            # will confuse os.path.join
+            joined = joined.lstrip("/")
+            joined = os.path.join(root, joined)
+            LOG.debug("Translated %s to adjusted path %s (%s)",
+                      pre_joined, joined, read_only)
         return joined
 
     # get_ipath_cur: get the current instance path for an item
diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index 13adbb09..96143d32 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -210,9 +210,12 @@ def update_authorized_keys(fname, keys):
     return '\n'.join(lines)
 
 
-def setup_user_keys(keys, user, key_prefix, sshd_config_fn=DEF_SSHD_CFG):
+def setup_user_keys(keys, user, key_prefix, paths):
+    
+    # Make sure the users .ssh dir is setup accordingly
     pwent = pwd.getpwnam(user)
     ssh_dir = os.path.join(pwent.pw_dir, '.ssh')
+    ssh_dir = paths.join(False, ssh_dir)
     if not os.path.exists(ssh_dir):
         util.ensure_dir(ssh_dir, mode=0700)
         util.chownbyid(ssh_dir, pwent.pw_uid, pwent.pw_gid)
@@ -223,6 +226,7 @@ def setup_user_keys(keys, user, key_prefix, sshd_config_fn=DEF_SSHD_CFG):
     for k in keys:
         key_entries.append(parser.parse(str(k), def_opt=key_prefix))
 
+    sshd_conf_fn = paths.join(True, DEF_SSHD_CFG)
     with util.SeLinuxGuard(ssh_dir, recursive=True):
         try:
             # AuthorizedKeysFile may contain tokens
@@ -230,7 +234,7 @@ def setup_user_keys(keys, user, key_prefix, sshd_config_fn=DEF_SSHD_CFG):
             # The following tokens are defined: %% is replaced by a literal
             # '%', %h is replaced by the home directory of the user being
             # authenticated and %u is replaced by the username of that user.
-            ssh_cfg = parse_ssh_config(sshd_config_fn)
+            ssh_cfg = parse_ssh_config(sshd_conf_fn)
             akeys = ssh_cfg.get("authorizedkeysfile", '')
             akeys = akeys.strip()
             if not akeys:
@@ -247,7 +251,7 @@ def setup_user_keys(keys, user, key_prefix, sshd_config_fn=DEF_SSHD_CFG):
                               " in ssh config"
                               " from %s, using 'AuthorizedKeysFile' file"
                               " %s instead"),
-                        sshd_config_fn, authorized_keys)
+                        sshd_conf_fn, authorized_keys)
 
         content = update_authorized_keys(authorized_keys, key_entries)
         util.ensure_dir(os.path.dirname(authorized_keys), mode=0700)
diff --git a/cloudinit/transforms/apt_pipelining.py b/cloudinit/transforms/apt_pipelining.py
index d8e574b9..f460becb 100644
--- a/cloudinit/transforms/apt_pipelining.py
+++ b/cloudinit/transforms/apt_pipelining.py
@@ -23,7 +23,7 @@ frequency = PER_INSTANCE
 
 distros = ['ubuntu', 'debian']
 
-default_file = "/etc/apt/apt.conf.d/90cloud-init-pipelining"
+DEFAULT_FILE = "/etc/apt/apt.conf.d/90cloud-init-pipelining"
 
 # Acquire::http::Pipeline-Depth can be a value
 # from 0 to 5 indicating how many outstanding requests APT should send.
@@ -31,30 +31,27 @@ default_file = "/etc/apt/apt.conf.d/90cloud-init-pipelining"
 # on TCP connections - otherwise data corruption will occur.
 
 
-def handle(_name, cfg, _cloud, log, _args):
+def handle(_name, cfg, cloud, log, _args):
 
     apt_pipe_value = util.get_cfg_option_str(cfg, "apt_pipelining", False)
     apt_pipe_value_s = str(apt_pipe_value).lower().strip()
 
     if apt_pipe_value_s == "false":
-        write_apt_snippet("0", log)
-
+        write_apt_snippet(cloud, "0", log, DEFAULT_FILE)
     elif apt_pipe_value_s in ("none", "unchanged", "os"):
         return
-
     elif apt_pipe_value_s in [str(b) for b in xrange(0, 6)]:
-        write_apt_snippet(apt_pipe_value_s, log)
-
+        write_apt_snippet(cloud, apt_pipe_value_s, log, DEFAULT_FILE)
     else:
         log.warn("Invalid option for apt_pipeling: %s", apt_pipe_value)
 
 
-def write_apt_snippet(setting, log, f_name=default_file):
+def write_apt_snippet(cloud, setting, log, f_name):
     """ Writes f_name with apt pipeline depth 'setting' """
 
     file_contents = ("//Written by cloud-init per 'apt_pipelining'\n"
                      'Acquire::http::Pipeline-Depth "%s";\n') % (setting)
 
-    util.write_file(f_name, file_contents)
+    util.write_file(cloud.paths.join(False, f_name), file_contents)
 
     log.debug("Wrote %s with apt pipeline depth setting %s", f_name, setting)
diff --git a/cloudinit/transforms/apt_update_upgrade.py b/cloudinit/transforms/apt_update_upgrade.py
index d49d8bd2..29bbc1ae 100644
--- a/cloudinit/transforms/apt_update_upgrade.py
+++ b/cloudinit/transforms/apt_update_upgrade.py
@@ -26,6 +26,8 @@ from cloudinit import util
 
 distros = ['ubuntu', 'debian']
 
+PROXY_TPL = "Acquire::HTTP::Proxy \"%s\";\n"
+
 
 def handle(_name, cfg, cloud, log, _args):
     update = util.get_cfg_option_bool(cfg, 'apt_update', False)
@@ -44,22 +46,23 @@ def handle(_name, cfg, cloud, log, _args):
                                           "archive.ubuntu.com/ubuntu")
         rename_apt_lists(old_mir, mirror)
 
-    # set up proxy
+    # Set up any apt proxy
     proxy = cfg.get("apt_proxy", None)
     proxy_filename = "/etc/apt/apt.conf.d/95cloud-init-proxy"
     if proxy:
         try:
-            # See http://linux.die.net/man/5/apt.conf
-            contents = "Acquire::HTTP::Proxy \"%s\";\n"
-            util.write_file(proxy_filename, contents % (proxy))
+            # See man 'apt.conf'
+            contents = PROXY_TPL % (proxy)
+            util.write_file(cloud.paths.join(False, proxy_filename),
+                            contents)
         except Exception as e:
             util.logexc(log, "Failed to write proxy to %s", proxy_filename)
     elif os.path.isfile(proxy_filename):
         util.del_file(proxy_filename)
 
-    # process 'apt_sources'
+    # Process 'apt_sources'
     if 'apt_sources' in cfg:
-        errors = add_sources(cfg['apt_sources'],
+        errors = add_sources(cloud, cfg['apt_sources'],
                              {'MIRROR': mirror, 'RELEASE': release})
         for e in errors:
             log.warn("Source Error: %s", ':'.join(e))
@@ -138,7 +141,7 @@ def generate_sources_list(codename, mirror, cloud, log):
         log.warn("No template found, not rendering /etc/apt/sources.list")
 
 
-def add_sources(srclist, template_params=None):
+def add_sources(cloud, srclist, template_params=None):
     """
     add entries in /etc/apt/sources.list.d for each abbreviated
     sources.list entry in 'srclist'.  When rendering template, also
@@ -187,7 +190,9 @@ def add_sources(srclist, template_params=None):
                 errorlist.append([source, "failed add key"])
 
         try:
-            util.write_file(ent['filename'], "%s\n" % (source), omode="ab")
+            contents = "%s\n" % (source)
+            util.write_file(cloud.paths.join(False, ent['filename']),
+                            contents, omode="ab")
         except:
             errorlist.append([source,
                              "failed write to file %s" % ent['filename']])
diff --git a/cloudinit/transforms/ca_certs.py b/cloudinit/transforms/ca_certs.py
index e0802bfe..56c41561 100644
--- a/cloudinit/transforms/ca_certs.py
+++ b/cloudinit/transforms/ca_certs.py
@@ -33,7 +33,7 @@ def update_ca_certs():
     util.subp(["update-ca-certificates"])
 
 
-def add_ca_certs(certs):
+def add_ca_certs(cloud, certs):
     """
     Adds certificates to the system. To actually apply the new certificates
     you must also call L{update_ca_certs}.
@@ -41,26 +41,29 @@ def add_ca_certs(certs):
     @param certs: A list of certificate strings.
     """
     if certs:
-        cert_file_contents = "\n".join(certs)
+        # First ensure they are strings...
+        cert_file_contents = "\n".join([str(c) for c in certs])
         cert_file_fullpath = os.path.join(CA_CERT_PATH, CA_CERT_FILENAME)
+        cert_file_fullpath = cloud.paths.join(False, cert_file_fullpath)
         util.write_file(cert_file_fullpath, cert_file_contents, mode=0644)
         # Append cert filename to CA_CERT_CONFIG file.
-        util.write_file(CA_CERT_CONFIG, "\n%s" % CA_CERT_FILENAME, omode="ab")
+        util.write_file(cloud.paths.join(False, CA_CERT_CONFIG),
+                        "\n%s" % CA_CERT_FILENAME, omode="ab")
 
 
-def remove_default_ca_certs():
+def remove_default_ca_certs(cloud):
     """
     Removes all default trusted CA certificates from the system. To actually
     apply the change you must also call L{update_ca_certs}.
     """
-    util.delete_dir_contents(CA_CERT_PATH)
-    util.delete_dir_contents(CA_CERT_SYSTEM_PATH)
-    util.write_file(CA_CERT_CONFIG, "", mode=0644)
+    util.delete_dir_contents(cloud.paths.join(False, CA_CERT_PATH))
+    util.delete_dir_contents(cloud.paths.join(False, CA_CERT_SYSTEM_PATH))
+    util.write_file(cloud.paths.join(False, CA_CERT_CONFIG), "", mode=0644)
     debconf_sel = "ca-certificates ca-certificates/trust_new_crts select no"
     util.subp(('debconf-set-selections', '-'), debconf_sel)
 
 
-def handle(name, cfg, _cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
     """
     Call to handle ca-cert sections in cloud-config file.
 
@@ -82,14 +85,14 @@ def handle(name, cfg, _cloud, log, _args):
     # default trusted CA certs first.
     if ca_cert_cfg.get("remove-defaults", False):
         log.debug("Removing default certificates")
-        remove_default_ca_certs()
+        remove_default_ca_certs(cloud)
 
     # If we are given any new trusted CA certs to add, add them.
     if "trusted" in ca_cert_cfg:
         trusted_certs = util.get_cfg_option_list(ca_cert_cfg, "trusted")
         if trusted_certs:
             log.debug("Adding %d certificates" % len(trusted_certs))
-            add_ca_certs(trusted_certs)
+            add_ca_certs(cloud, trusted_certs)
 
     # Update the system with the new cert configuration.
     log.debug("Updating certificates")
diff --git a/cloudinit/transforms/chef.py b/cloudinit/transforms/chef.py
index 31bfb85f..4e8ef346 100644
--- a/cloudinit/transforms/chef.py
+++ b/cloudinit/transforms/chef.py
@@ -36,30 +36,40 @@ def handle(name, cfg, cloud, log, _args):
         return
     chef_cfg = cfg['chef']
 
-    # ensure the chef directories we use exist
-    util.ensure_dirs(['/etc/chef', '/var/log/chef', '/var/lib/chef',
-                     '/var/cache/chef', '/var/backups/chef', '/var/run/chef'])
+    # Ensure the chef directories we use exist
+    c_dirs = [
+        '/etc/chef', 
+        '/var/log/chef', 
+        '/var/lib/chef', 
+        '/var/cache/chef', 
+        '/var/backups/chef', 
+        '/var/run/chef',
+    ]
+    for d in c_dirs:
+        util.ensure_dir(cloud.paths.join(False, d))
 
-    # set the validation key based on the presence of either 'validation_key'
+    # Set the validation key based on the presence of either 'validation_key'
     # or 'validation_cert'. In the case where both exist, 'validation_key'
     # takes precedence
     for key in ('validation_key', 'validation_cert'):
         if key in chef_cfg and chef_cfg[key]:
-            util.write_file('/etc/chef/validation.pem', chef_cfg[key])
+            v_fn = cloud.paths.join(False, '/etc/chef/validation.pem')
+            util.write_file(v_fn, chef_cfg[key])
             break
 
-    # create the chef config from template
+    # Create the chef config from template
     template_fn = cloud.get_template_filename('chef_client.rb')
     if template_fn:
+        iid = str(cloud.datasource.get_instance_id())
         params = {
             'server_url': chef_cfg['server_url'],
-            'node_name': util.get_cfg_option_str(chef_cfg, 'node_name',
-                                    cloud.datasource.get_instance_id()),
+            'node_name': util.get_cfg_option_str(chef_cfg, 'node_name', iid),
             'environment': util.get_cfg_option_str(chef_cfg, 'environment',
                                                    '_default'),
             'validation_name': chef_cfg['validation_name']
         }
-        templater.render_to_file(template_fn, '/etc/chef/client.rb', params)
+        out_fn = cloud.paths.join(False, '/etc/chef/client.rb')
+        templater.render_to_file(template_fn, out_fn, params)
     else:
         log.warn("No template found, not rendering to /etc/chef/client.rb")
 
@@ -71,7 +81,8 @@ def handle(name, cfg, cloud, log, _args):
         initial_attributes = chef_cfg['initial_attributes']
         for k in list(initial_attributes.keys()):
             initial_json[k] = initial_attributes[k]
-    util.write_file('/etc/chef/firstboot.json', json.dumps(initial_json))
+    firstboot_fn = cloud.paths.join(False, '/etc/chef/firstboot.json')
+    util.write_file(firstboot_fn, json.dumps(initial_json))
 
     # If chef is not installed, we install chef based on 'install_type'
     if not os.path.isfile('/usr/bin/chef-client'):
diff --git a/cloudinit/transforms/keys_to_console.py b/cloudinit/transforms/keys_to_console.py
index e974375f..40758198 100644
--- a/cloudinit/transforms/keys_to_console.py
+++ b/cloudinit/transforms/keys_to_console.py
@@ -29,23 +29,24 @@ frequency = PER_INSTANCE
 helper_tool = '/usr/lib/cloud-init/write-ssh-key-fingerprints'
 
 
-def handle(name, cfg, _cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
     if not os.path.exists(helper_tool):
         log.warn(("Unable to activate transform %s,"
                   " helper tool not found at %s"), name, helper_tool)
         return
 
     fp_blacklist = util.get_cfg_option_list(cfg,
-        "ssh_fp_console_blacklist", [])
+                                            "ssh_fp_console_blacklist", [])
     key_blacklist = util.get_cfg_option_list(cfg,
-        "ssh_key_console_blacklist", ["ssh-dss"])
+                                             "ssh_key_console_blacklist",
+                                              ["ssh-dss"])
 
     try:
         cmd = [helper_tool]
         cmd.append(','.join(fp_blacklist))
         cmd.append(','.join(key_blacklist))
         (stdout, _stderr) = util.subp(cmd)
-        util.write_file('/dev/console', stdout)
+        util.write_file(cloud.paths.join(False, '/dev/console'), stdout)
     except:
         log.warn("Writing keys to /dev/console failed!")
         raise
diff --git a/cloudinit/transforms/landscape.py b/cloudinit/transforms/landscape.py
index 19948d0e..29ce41b9 100644
--- a/cloudinit/transforms/landscape.py
+++ b/cloudinit/transforms/landscape.py
@@ -33,12 +33,12 @@ from cloudinit.settings import PER_INSTANCE
 
 frequency = PER_INSTANCE
 
-lsc_client_cfg_file = "/etc/landscape/client.conf"
+LSC_CLIENT_CFG_FILE = "/etc/landscape/client.conf"
 
 distros = ['ubuntu']
 
 # defaults taken from stock client.conf in landscape-client 11.07.1.1-0ubuntu2
-lsc_builtincfg = {
+LSC_BUILTIN_CFG = {
   'client': {
     'log_level': "info",
     'url': "https://landscape.canonical.com/message-system",
@@ -48,7 +48,7 @@ lsc_builtincfg = {
 }
 
 
-def handle(name, cfg, _cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
     """
     Basically turn a top level 'landscape' entry with a 'client' dict
     and render it to ConfigObj format under '[client]' section in
@@ -66,15 +66,19 @@ def handle(name, cfg, _cloud, log, _args):
                          " but not a dictionary type,"
                          " is a %s instead"), util.obj_name(ls_cloudcfg))
 
-    merged = merge_together([lsc_builtincfg, lsc_client_cfg_file, ls_cloudcfg])
+    lsc_client_fn = cloud.paths.join(True, LSC_CLIENT_CFG_FILE)
+    merged = merge_together([LSC_BUILTIN_CFG, lsc_client_fn, ls_cloudcfg])
 
-    if not os.path.isdir(os.path.dirname(lsc_client_cfg_file)):
-        util.ensure_dir(os.path.dirname(lsc_client_cfg_file))
+    lsc_dir = cloud.paths.join(False, os.path.dirname(lsc_client_fn))
+    if not os.path.isdir(lsc_dir):
+        util.ensure_dir(lsc_dir)
 
     contents = StringIO()
     merged.write(contents)
-    util.write_file(lsc_client_cfg_file, contents.getvalue())
-    log.debug("Wrote landscape config file to %s", lsc_client_cfg_file)
+    contents.flush()
+
+    util.write_file(lsc_client_fn, contents.getvalue())
+    log.debug("Wrote landscape config file to %s", lsc_client_fn)
 
 
 def merge_together(objs):
diff --git a/cloudinit/transforms/mcollective.py b/cloudinit/transforms/mcollective.py
index 5464fe8c..9754d6b8 100644
--- a/cloudinit/transforms/mcollective.py
+++ b/cloudinit/transforms/mcollective.py
@@ -24,8 +24,8 @@ from StringIO import StringIO
 from cloudinit import cfg as config
 from cloudinit import util
 
-pubcert_file = "/etc/mcollective/ssl/server-public.pem"
-pricert_file = "/etc/mcollective/ssl/server-private.pem"
+PUBCERT_FILE = "/etc/mcollective/ssl/server-public.pem"
+PRICERT_FILE = "/etc/mcollective/ssl/server-private.pem"
 
 
 def handle(name, cfg, cloud, log, _args):
@@ -47,7 +47,8 @@ def handle(name, cfg, cloud, log, _args):
         mcollective_config = config.DefaultingConfigParser()
         # Read server.cfg values from original file in order to be able to mix
         # the rest up
-        old_contents = util.load_file('/etc/mcollective/server.cfg')
+        server_cfg_fn = cloud.paths.join(True, '/etc/mcollective/server.cfg')
+        old_contents = util.load_file(server_cfg_fn)
         # It doesn't contain any sections so just add one temporarily
         # Use a hash id based off the contents,
         # just incase of conflicts... (try to not have any...)
@@ -61,17 +62,19 @@ def handle(name, cfg, cloud, log, _args):
             section_head = section_tpl % (attempts)
         sectioned_contents = "%s\n%s" % (section_head, old_contents)
         mcollective_config.readfp(StringIO(sectioned_contents),
-                                  filename='/etc/mcollective/server.cfg')
+                                  filename=server_cfg_fn)
         for (cfg_name, cfg) in mcollective_cfg['conf'].iteritems():
             if cfg_name == 'public-cert':
-                util.write_file(pubcert_file, cfg, mode=0644)
+                pubcert_fn = cloud.paths.join(True, PUBCERT_FILE)
+                util.write_file(pubcert_fn, cfg, mode=0644)
                 mcollective_config.set(cfg_name,
-                    'plugin.ssl_server_public', pubcert_file)
+                    'plugin.ssl_server_public', pubcert_fn)
                 mcollective_config.set(cfg_name, 'securityprovider', 'ssl')
             elif cfg_name == 'private-cert':
-                util.write_file(pricert_file, cfg, mode=0600)
+                pricert_fn = cloud.paths.join(True, PRICERT_FILE)
+                util.write_file(pricert_fn, cfg, mode=0600)
                 mcollective_config.set(cfg_name,
-                    'plugin.ssl_server_private', pricert_file)
+                    'plugin.ssl_server_private', pricert_fn)
                 mcollective_config.set(cfg_name, 'securityprovider', 'ssl')
             else:
                 # Iterate throug the config items, we'll use ConfigParser.set
@@ -80,15 +83,15 @@ def handle(name, cfg, cloud, log, _args):
                     mcollective_config.set(cfg_name, o, v)
         # We got all our config as wanted we'll rename
         # the previous server.cfg and create our new one
-        util.rename('/etc/mcollective/server.cfg',
-                    '/etc/mcollective/server.cfg.old')
+        old_fn = "%s.old" % (server_cfg_fn)
+        util.rename(server_cfg_fn, old_fn)
         # Now we got the whole file, write to disk except the section 
         # we added so that config parser won't error out when trying to read.
         # Note below, that we've just used ConfigParser because it generally
         # works.  Below, we remove the initial 'nullsection' header.
         contents = mcollective_config.stringify()
         contents = contents.replace("%s\n" % (section_head), "")
-        util.write_file('/etc/mcollective/server.cfg', contents, mode=0644)
+        util.write_file(server_cfg_fn, contents, mode=0644)
 
     # Start mcollective
     util.subp(['service', 'mcollective', 'start'], capture=False)
diff --git a/cloudinit/transforms/mounts.py b/cloudinit/transforms/mounts.py
index 44182b87..700fbc44 100644
--- a/cloudinit/transforms/mounts.py
+++ b/cloudinit/transforms/mounts.py
@@ -168,7 +168,7 @@ def handle(_name, cfg, cloud, log, _args):
         cc_lines.append('\t'.join(line))
 
     fstab_lines = []
-    fstab = util.load_file("/etc/fstab")
+    fstab = util.load_file(cloud.paths.join(True, "/etc/fstab"))
     for line in fstab.splitlines():
         try:
             toks = ws.split(line)
@@ -180,7 +180,7 @@ def handle(_name, cfg, cloud, log, _args):
 
     fstab_lines.extend(cc_lines)
     contents = "%s\n" % ('\n'.join(fstab_lines))
-    util.write_file("/etc/fstab", contents)
+    util.write_file(cloud.paths.join(False, "/etc/fstab"), contents)
 
     if needswap:
         try:
@@ -190,7 +190,7 @@ def handle(_name, cfg, cloud, log, _args):
 
     for d in dirs:
         try:
-            util.ensure_dir(d)
+            util.ensure_dir(cloud.paths.join(False, d))
         except:
             util.logexc(log, "Failed to make '%s' config-mount", d)
 
diff --git a/cloudinit/transforms/phone_home.py b/cloudinit/transforms/phone_home.py
index 98ff2b85..a8752527 100644
--- a/cloudinit/transforms/phone_home.py
+++ b/cloudinit/transforms/phone_home.py
@@ -77,7 +77,7 @@ def handle(name, cfg, cloud, log, args):
 
     for (n, path) in pubkeys.iteritems():
         try:
-            all_keys[n] = util.load_file(path)
+            all_keys[n] = util.load_file(cloud.paths.join(True, path))
         except:
             util.logexc(log, ("%s: failed to open, can not"
                               " phone home that data"), path)
diff --git a/cloudinit/transforms/puppet.py b/cloudinit/transforms/puppet.py
index 76cc9732..d55118ea 100644
--- a/cloudinit/transforms/puppet.py
+++ b/cloudinit/transforms/puppet.py
@@ -43,7 +43,8 @@ def handle(name, cfg, cloud, log, _args):
     # ... and then update the puppet configuration
     if 'conf' in puppet_cfg:
         # Add all sections from the conf object to puppet.conf
-        contents = util.load_file('/etc/puppet/puppet.conf')
+        puppet_conf_fn = cloud.paths.join(False, '/etc/puppet/puppet.conf')
+        contents = util.load_file(puppet_conf_fn)
         # Create object for reading puppet.conf values
         puppet_config = config.DefaultingConfigParser()
         # Read puppet.conf values from original file in order to be able to
@@ -51,21 +52,27 @@ def handle(name, cfg, cloud, log, _args):
         cleaned_lines = [i.lstrip() for i in contents.splitlines()]
         cleaned_contents = '\n'.join(cleaned_lines)
         puppet_config.readfp(StringIO(cleaned_contents),
-                             filename='/etc/puppet/puppet.conf')
+                             filename=puppet_conf_fn)
         for (cfg_name, cfg) in puppet_cfg['conf'].iteritems():
-            # ca_cert configuration is a special case
-            # Dump the puppetmaster ca certificate in the correct place
+            # Cert configuration is a special case
+            # Dump the puppet master ca certificate in the correct place
             if cfg_name == 'ca_cert':
                 # Puppet ssl sub-directory isn't created yet
                 # Create it with the proper permissions and ownership
-                util.ensure_dir('/var/lib/puppet/ssl', 0771)
-                util.chownbyid('/var/lib/puppet/ssl',
+                pp_ssl_dir = cloud.paths.join(False, '/var/lib/puppet/ssl')
+                util.ensure_dir(pp_ssl_dir, 0771)
+                util.chownbyid(pp_ssl_dir,
                                pwd.getpwnam('puppet').pw_uid, 0)
-                util.ensure_dir('/var/lib/puppet/ssl/certs/')
-                util.chownbyid('/var/lib/puppet/ssl/certs/',
+                pp_ssl_certs = cloud.paths.join(False, 
+                                                '/var/lib/puppet/ssl/certs/')
+                util.ensure_dir(pp_ssl_certs)
+                util.chownbyid(pp_ssl_certs,
                                pwd.getpwnam('puppet').pw_uid, 0)
-                util.write_file('/var/lib/puppet/ssl/certs/ca.pem', cfg)
-                util.chownbyid('/var/lib/puppet/ssl/certs/ca.pem',
+                pp_ssl_ca_certs = cloud.paths.join(False,
+                                                   ('/var/lib/puppet/'
+                                                    'ssl/certs/ca.pem'))
+                util.write_file(pp_ssl_ca_certs, cfg)
+                util.chownbyid(pp_ssl_ca_certs,
                                pwd.getpwnam('puppet').pw_uid, 0)
             else:
                 # Iterate throug the config items, we'll use ConfigParser.set
@@ -82,10 +89,9 @@ def handle(name, cfg, cloud, log, _args):
                     puppet_config.set(cfg_name, o, v)
             # We got all our config as wanted we'll rename
             # the previous puppet.conf and create our new one
-            util.rename('/etc/puppet/puppet.conf',
-                        '/etc/puppet/puppet.conf.old')
-            contents = puppet_config.stringify()
-            util.write_file('/etc/puppet/puppet.conf', contents)
+            puppet_conf_old_fn = "%s.old" % (puppet_conf_fn)
+            util.rename(puppet_conf_fn, puppet_conf_old_fn)
+            util.write_file(puppet_conf_fn, puppet_config.stringify())
 
     # Set puppet to automatically start
     if os.path.exists('/etc/default/puppet'):
diff --git a/cloudinit/transforms/resizefs.py b/cloudinit/transforms/resizefs.py
index fe012417..fd2bb9e1 100644
--- a/cloudinit/transforms/resizefs.py
+++ b/cloudinit/transforms/resizefs.py
@@ -62,7 +62,7 @@ def get_fs_type(st_dev, path, log):
         raise
 
 
-def handle(name, cfg, _cloud, log, args):
+def handle(name, cfg, cloud, log, args):
     if len(args) != 0:
         resize_root = args[0]
     else:
@@ -74,11 +74,11 @@ def handle(name, cfg, _cloud, log, args):
 
     # TODO is the directory ok to be used??
     resize_root_d = util.get_cfg_option_str(cfg, "resize_rootfs_tmp", "/run")
+    resize_root_d = cloud.paths.join(False, resize_root_d)
     util.ensure_dir(resize_root_d)
 
-    # TODO: allow what is to be resized to
-    # be configurable??
-    resize_what = "/"
+    # TODO: allow what is to be resized to be configurable??
+    resize_what = cloud.paths.join(False)
     with util.SilentTemporaryFile(prefix="cloudinit.resizefs.",
                                   dir=resize_root_d, delete=True) as tfh:
         devpth = tfh.name
diff --git a/cloudinit/transforms/rightscale_userdata.py b/cloudinit/transforms/rightscale_userdata.py
index 8dfd845f..dc06f9ec 100644
--- a/cloudinit/transforms/rightscale_userdata.py
+++ b/cloudinit/transforms/rightscale_userdata.py
@@ -78,6 +78,7 @@ def handle(name, _cfg, cloud, log, _args):
     urls = mdict[my_hookname]
     for (i, url) in enumerate(urls):
         fname = os.path.join(scripts_d, "rightscale-%02i" % (i))
+        fname = cloud.paths.join(False, fname)
         try:
             resp = uhelp.readurl(url)
             # Ensure its a valid http response (and something gotten)
diff --git a/cloudinit/transforms/rsyslog.py b/cloudinit/transforms/rsyslog.py
index 71b74711..f2c1de1e 100644
--- a/cloudinit/transforms/rsyslog.py
+++ b/cloudinit/transforms/rsyslog.py
@@ -71,7 +71,8 @@ def handle(name, cfg, cloud, log, _args):
 
         try:
             contents = "%s\n" % (content)
-            util.write_file(filename, contents, omode=omode)
+            util.write_file(cloud.paths.join(False, filename),
+                            contents, omode=omode)
         except Exception:
             util.logexc(log, "Failed to write to %s", filename)
 
diff --git a/cloudinit/transforms/runcmd.py b/cloudinit/transforms/runcmd.py
index 31a254a5..f121484b 100644
--- a/cloudinit/transforms/runcmd.py
+++ b/cloudinit/transforms/runcmd.py
@@ -33,6 +33,6 @@ def handle(name, cfg, cloud, log, _args):
     cmd = cfg["runcmd"]
     try:
         content = util.shellify(cmd)
-        util.write_file(out_fn, content, 0700)
+        util.write_file(cloud.paths.join(False, out_fn), content, 0700)
     except:
         util.logexc(log, "Failed to shellify %s into file %s", cmd, out_fn)
diff --git a/cloudinit/transforms/salt_minion.py b/cloudinit/transforms/salt_minion.py
index d05d2a1e..16f5286d 100644
--- a/cloudinit/transforms/salt_minion.py
+++ b/cloudinit/transforms/salt_minion.py
@@ -35,6 +35,7 @@ def handle(name, cfg, cloud, log, _args):
     
     # Ensure we can configure files at the right dir
     config_dir = salt_cfg.get("config_dir", '/etc/salt')
+    config_dir = cloud.paths.join(False, config_dir)
     util.ensure_dir(config_dir)
 
     # ... and then update the salt configuration
@@ -47,6 +48,7 @@ def handle(name, cfg, cloud, log, _args):
     # ... copy the key pair if specified
     if 'public_key' in salt_cfg and 'private_key' in salt_cfg:
         pki_dir = salt_cfg.get('pki_dir', '/etc/salt/pki')
+        pki_dir = cloud.paths.join(pki_dir)
         with util.umask(077):
             util.ensure_dir(pki_dir)
             pub_name = os.path.join(pki_dir, 'minion.pub')
diff --git a/cloudinit/transforms/set_passwords.py b/cloudinit/transforms/set_passwords.py
index c0cc4e84..e7049f22 100644
--- a/cloudinit/transforms/set_passwords.py
+++ b/cloudinit/transforms/set_passwords.py
@@ -130,8 +130,8 @@ def handle(_name, cfg, cloud, log, args):
             replaced_auth = True
             new_lines.append(replacement)
 
-        new_contents = "\n".join(new_lines)
-        util.write_file('/etc/ssh/sshd_config', new_contents)
+        util.write_file(cloud.paths.join(False, '/etc/ssh/sshd_config'),
+                        "\n".join(new_lines))
 
         try:
             cmd = ['service']
diff --git a/cloudinit/transforms/ssh.py b/cloudinit/transforms/ssh.py
index b1f2ce89..33d4bb54 100644
--- a/cloudinit/transforms/ssh.py
+++ b/cloudinit/transforms/ssh.py
@@ -64,7 +64,8 @@ def handle(_name, cfg, cloud, log, _args):
             if key in key2file:
                 tgt_fn = key2file[key][0]
                 tgt_perms = key2file[key][1]
-                util.write_file(tgt_fn, val, tgt_perms)
+                util.write_file(cloud.paths.join(False, tgt_fn),
+                                val, tgt_perms)
 
         for (priv, pub) in priv2pub.iteritems():
             if pub in cfg['ssh_keys'] or not priv in cfg['ssh_keys']:
@@ -86,6 +87,7 @@ def handle(_name, cfg, cloud, log, _args):
                                             generate_keys)
         for keytype in genkeys:
             keyfile = '/etc/ssh/ssh_host_%s_key' % (keytype)
+            keyfile = cloud.paths.join(False, keyfile)
             if not os.path.exists(keyfile):
                 cmd = ['ssh-keygen', '-t', keytype, '-N', '', '-f', keyfile]
                 try:
@@ -107,20 +109,21 @@ def handle(_name, cfg, cloud, log, _args):
             cfgkeys = cfg["ssh_authorized_keys"]
             keys.extend(cfgkeys)
 
-        apply_credentials(keys, user, disable_root, disable_root_opts)
+        apply_credentials(keys, user, cloud.paths,
+                          disable_root, disable_root_opts)
     except:
         util.logexc(log, "Applying ssh credentials failed!")
 
 
-def apply_credentials(keys, user, disable_root, disable_root_opts):
+def apply_credentials(keys, user, paths, disable_root, disable_root_opts):
 
     keys = set(keys)
     if user:
-        ssh_util.setup_user_keys(keys, user, '')
+        ssh_util.setup_user_keys(keys, user, '', paths)
 
     if disable_root and user:
         key_prefix = disable_root_opts.replace('$USER', user)
     else:
         key_prefix = ''
 
-    ssh_util.setup_user_keys(keys, 'root', key_prefix)
+    ssh_util.setup_user_keys(keys, 'root', key_prefix, paths)

From d53e557306e5119e9a5ea246b565b14b0f86f23c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 18:07:47 -0700
Subject: [PATCH 226/434] More paths missed (durn), but now fixed.

---
 cloudinit/distros/ubuntu.py              | 2 +-
 cloudinit/transforms/ssh.py              | 4 +++-
 cloudinit/transforms/update_etc_hosts.py | 3 ++-
 3 files changed, 6 insertions(+), 3 deletions(-)

diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index 94565b14..eeda2921 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -59,7 +59,7 @@ class Distro(distros.Distro):
         lines.append("# Created by cloud-init")
         lines.append(str(hostname))
         contents = "\n".join(lines)
-        util.write_file(out_fn, contents, 0644)
+        util.write_file(self._paths.join(False, out_fn), contents, 0644)
 
     def update_hostname(self, hostname, prev_file):
         hostname_prev = self._read_hostname(prev_file)
diff --git a/cloudinit/transforms/ssh.py b/cloudinit/transforms/ssh.py
index 33d4bb54..e5e99560 100644
--- a/cloudinit/transforms/ssh.py
+++ b/cloudinit/transforms/ssh.py
@@ -52,7 +52,8 @@ def handle(_name, cfg, cloud, log, _args):
 
     # remove the static keys from the pristine image
     if cfg.get("ssh_deletekeys", True):
-        for f in glob.glob("/etc/ssh/ssh_host_*key*"):
+        key_pth = cloud.paths.join(False, "/etc/ssh/", "ssh_host_*key*")
+        for f in glob.glob(key_pth):
             try:
                 util.del_file(f)
             except:
@@ -88,6 +89,7 @@ def handle(_name, cfg, cloud, log, _args):
         for keytype in genkeys:
             keyfile = '/etc/ssh/ssh_host_%s_key' % (keytype)
             keyfile = cloud.paths.join(False, keyfile)
+            util.ensure_dir(os.path.dirname(keyfile)) 
             if not os.path.exists(keyfile):
                 cmd = ['ssh-keygen', '-t', keytype, '-N', '', '-f', keyfile]
                 try:
diff --git a/cloudinit/transforms/update_etc_hosts.py b/cloudinit/transforms/update_etc_hosts.py
index d0e56183..75615db1 100644
--- a/cloudinit/transforms/update_etc_hosts.py
+++ b/cloudinit/transforms/update_etc_hosts.py
@@ -42,7 +42,8 @@ def handle(name, cfg, cloud, log, _args):
             raise Exception(("No hosts template could be"
                              " found for distro %s") % (distro_n))
 
-        templater.render_to_file(tpl_fn_name, '/etc/hosts',
+        out_fn = cloud.paths.join(False, '/etc/hosts')
+        templater.render_to_file(tpl_fn_name, out_fn,
                                 {'hostname': hostname, 'fqdn': fqdn})
 
     elif manage_hosts == "localhost":

From 0074372a5f16ed4ed17e940bf1fb29869cdc1f3d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 18:30:28 -0700
Subject: [PATCH 227/434] More cleanups around read/write roots

---
 cloudinit/distros/__init__.py |  6 ++++--
 cloudinit/distros/rhel.py     | 32 ++++++++++++++++++--------------
 cloudinit/distros/ubuntu.py   | 35 ++++++++++++++++++++---------------
 3 files changed, 42 insertions(+), 31 deletions(-)

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index 483642f3..6a98fdb1 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -100,7 +100,8 @@ class Distro(object):
         new_etchosts = StringIO()
         need_write = False
         need_change = True
-        for line in util.load_file("/etc/hosts").splitlines():
+        hosts_ro_fn = self._paths.join(True, "/etc/hosts")
+        for line in util.load_file(hosts_ro_fn).splitlines():
             if line.strip().startswith(header):
                 continue
             if not line.strip() or line.strip().startswith("#"):
@@ -124,7 +125,8 @@ class Distro(object):
             need_write = True
         if need_write:
             contents = new_etchosts.getvalue()
-            util.write_file("/etc/hosts", contents, mode=0644)
+            util.write_file(self._paths.join(False, "/etc/hosts"),
+                            contents, mode=0644)
 
     def _interface_action(self, action):
         if action not in IFACE_ACTIONS:
diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index aef7f6f3..e9f3f5d9 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -73,13 +73,15 @@ class Distro(distros.Distro):
             lines.insert(0, '# Created by cloud-init')
             contents = "\n".join(lines)
             net_fn = NETWORK_FN_TPL % (dev)
-            net_fn = self._paths.join(False, net_fn)
-            util.write_file(net_fn, contents, 0644)
+            util.write_file(self._paths.join(False, net_fn), contents, 0644)
 
     def set_hostname(self, hostname):
-        self._write_hostname(hostname, "/etc/sysconfig/network")
-        LOG.debug("Setting hostname to %s", hostname)
-        util.subp(['hostname', hostname])
+        out_fn = self._paths.join(False, '/etc/sysconfig/network')
+        self._write_hostname(hostname, out_fn)
+        if out_fn == '/etc/sysconfig/network':
+            # Only do this if we are running in non-adjusted root mode
+            LOG.debug("Setting hostname to %s", hostname)
+            util.subp(['hostname', hostname])
 
     def _write_hostname(self, hostname, out_fn):
         old_contents = []
@@ -105,18 +107,19 @@ class Distro(distros.Distro):
             new_contents.append("# Added by cloud-init")
             new_contents.append("HOSTNAME=%s" % (hostname))
         contents = "\n".join(new_contents)
-        out_fn = self._paths.join(False, out_fn)
         util.write_file(out_fn, contents, 0644)
 
     def update_hostname(self, hostname, prev_file):
         hostname_prev = self._read_hostname(prev_file)
-        hostname_in_sys = self._read_hostname("/etc/sysconfig/network")
+        read_fn = self._paths.join(True, "/etc/sysconfig/network")
+        hostname_in_sys = self._read_hostname(read_fn)
         update_files = []
         if not hostname_prev or hostname_prev != hostname:
             update_files.append(prev_file)
         if (not hostname_in_sys or
-           (hostname_in_sys == hostname_prev and hostname_in_sys != hostname)):
-            update_files.append("/etc/sysconfig/network")
+            (hostname_in_sys == hostname_prev and hostname_in_sys != hostname)):
+            write_fn = self._paths.join(False, "/etc/sysconfig/network")
+            update_files.append(write_fn)
         for fn in update_files:
             try:
                 self._write_hostname(hostname, fn)
@@ -128,6 +131,7 @@ class Distro(distros.Distro):
             LOG.debug(("%s differs from /etc/sysconfig/network."
                         " Assuming user maintained hostname."), prev_file)
         if "/etc/sysconfig/network" in update_files:
+            # Only do this if we are running in non-adjusted root mode
             LOG.debug("Setting hostname to %s", hostname)
             util.subp(['hostname', hostname])
 
@@ -145,7 +149,6 @@ class Distro(distros.Distro):
         return default
 
     def _read_conf(self, filename):
-        filename = self._paths.join(True, filename)
         contents = util.load_file(filename, quiet=True)
         conf_lines = []
         for line in contents.splitlines():
@@ -176,7 +179,8 @@ class Distro(distros.Distro):
             raise Exception(("Invalid timezone %s,"
                              " no file found at %s") % (tz, tz_file))
         # Adjust the sysconfig clock zone setting
-        old_contents = self._read_conf("/etc/sysconfig/clock")
+        read_fn = self._paths.join(True, "/etc/sysconfig/clock")
+        old_contents = self._read_conf(read_fn)
         new_contents = []
         zone_added = False
         # Update the 'ZONE' if it exists instead of appending
@@ -197,10 +201,10 @@ class Distro(distros.Distro):
             new_contents.append("# Added by cloud-init")
             new_contents.append('ZONE="%s"' % (tz))
         tz_contents = "\n".join(new_contents)
-        tz_fn = self._paths.join(False, "/etc/sysconfig/clock")
-        util.write_file(tz_fn, tz_contents)
+        write_fn = self._paths.join(False, "/etc/sysconfig/clock")
+        util.write_file(write_fn, tz_contents)
         # This ensures that the correct tz will be used for the system
-        util.copy(tz_file, "/etc/localtime")
+        util.copy(tz_file, self._paths.join(False, "/etc/localtime"))
 
     def package_command(self, command, args=None):
         cmd = ['yum']
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index eeda2921..515b59c8 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -46,30 +46,35 @@ class Distro(distros.Distro):
         self.package_command('install', pkglist)
 
     def _write_network(self, settings):
-        n_fn = self._paths.join(False, "/etc/network/interfaces")
-        util.write_file(n_fn, settings)
+        net_fn = self._paths.join(False, "/etc/network/interfaces")
+        util.write_file(net_fn, settings)
 
     def set_hostname(self, hostname):
-        self._write_hostname(hostname, "/etc/hostname")
-        LOG.debug("Setting hostname to %s", hostname)
-        util.subp(['hostname', hostname])
+        out_fn = self._paths.join(False, "/etc/hostname")
+        self._write_hostname(hostname, out_fn)
+        if out_fn == '/etc/hostname':
+            # Only do this if we are running in non-adjusted root mode
+            LOG.debug("Setting hostname to %s", hostname)
+            util.subp(['hostname', hostname])
 
     def _write_hostname(self, hostname, out_fn):
         lines = []
         lines.append("# Created by cloud-init")
         lines.append(str(hostname))
         contents = "\n".join(lines)
-        util.write_file(self._paths.join(False, out_fn), contents, 0644)
+        util.write_file(out_fn, contents, 0644)
 
-    def update_hostname(self, hostname, prev_file):
-        hostname_prev = self._read_hostname(prev_file)
-        hostname_in_etc = self._read_hostname("/etc/hostname")
+    def update_hostname(self, hostname, prev_fn):
+        hostname_prev = self._read_hostname(prev_fn)
+        read_fn = self._paths.join(True, "/etc/hostname")
+        hostname_in_etc = self._read_hostname(read_fn)
         update_files = []
         if not hostname_prev or hostname_prev != hostname:
-            update_files.append(prev_file)
+            update_files.append(prev_fn)
         if (not hostname_in_etc or
-           (hostname_in_etc == hostname_prev and hostname_in_etc != hostname)):
-            update_files.append("/etc/hostname")
+            (hostname_in_etc == hostname_prev and hostname_in_etc != hostname)):
+            write_fn = self._paths.join(False, "/etc/hostname")
+            update_files.append(write_fn)
         for fn in update_files:
             try:
                 self._write_hostname(hostname, fn)
@@ -79,13 +84,13 @@ class Distro(distros.Distro):
         if (hostname_in_etc and hostname_prev and
             hostname_in_etc != hostname_prev):
             LOG.debug(("%s differs from /etc/hostname."
-                        " Assuming user maintained hostname."), prev_file)
+                        " Assuming user maintained hostname."), prev_fn)
         if "/etc/hostname" in update_files:
+            # Only do this if we are running in non-adjusted root mode
             LOG.debug("Setting hostname to %s", hostname)
             util.subp(['hostname', hostname])
 
     def _read_hostname(self, filename, default=None):
-        filename = self._paths.join(True, filename)
         contents = util.load_file(filename, quiet=True)
         for line in contents.splitlines():
             c_pos = line.find("#")
@@ -109,7 +114,7 @@ class Distro(distros.Distro):
         tz_contents = "%s\n" % tz
         tz_fn = self._paths.join(False, "/etc/timezone")
         util.write_file(tz_fn, tz_contents)
-        util.copy(tz_file, "/etc/localtime")
+        util.copy(tz_file, self._paths.join(False, "/etc/localtime"))
 
     def package_command(self, command, args=None):
         e = os.environ.copy()

From e80aa985c5abc06e359b3a2f198902172f11ca7c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 18:34:09 -0700
Subject: [PATCH 228/434] Fix logging message spelling

---
 cloudinit/transforms/bootcmd.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/transforms/bootcmd.py b/cloudinit/transforms/bootcmd.py
index 0c45a307..635e3a1f 100644
--- a/cloudinit/transforms/bootcmd.py
+++ b/cloudinit/transforms/bootcmd.py
@@ -31,7 +31,7 @@ def handle(name, cfg, cloud, log, _args):
 
     if "bootcmd" not in cfg:
         log.debug(("Skipping transform named %s,"
-                   " no 'bootcomd' key in configuration"), name)
+                   " no 'bootcmd' key in configuration"), name)
         return
 
     with tempfile.NamedTemporaryFile(suffix=".sh") as tmpf:

From 2d2febd49ea21e2843175eccfc8d454d33c11b4d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 18:43:18 -0700
Subject: [PATCH 229/434] More path joinings found + update in logging of when
 we translate a path

---
 cloudinit/helpers.py                       | 2 +-
 cloudinit/transforms/apt_update_upgrade.py | 4 +++-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 9f55a984..09686340 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -253,7 +253,7 @@ class Paths(object):
             # will confuse os.path.join
             joined = joined.lstrip("/")
             joined = os.path.join(root, joined)
-            LOG.debug("Translated %s to adjusted path %s (%s)",
+            LOG.debug("Translated %s to adjusted path %s (read-only=%s)",
                       pre_joined, joined, read_only)
         return joined
 
diff --git a/cloudinit/transforms/apt_update_upgrade.py b/cloudinit/transforms/apt_update_upgrade.py
index 29bbc1ae..f5b4b58f 100644
--- a/cloudinit/transforms/apt_update_upgrade.py
+++ b/cloudinit/transforms/apt_update_upgrade.py
@@ -124,6 +124,7 @@ def rename_apt_lists(omirror, new_mirror, lists_d="/var/lib/apt/lists"):
         return
     olen = len(oprefix)
     for filename in glob.glob("%s_*" % oprefix):
+        # TODO use the cloud.paths.join...
         util.rename(filename, "%s%s" % (nprefix, filename[olen:]))
 
 
@@ -136,7 +137,8 @@ def generate_sources_list(codename, mirror, cloud, log):
     template_fn = cloud.get_template_filename('sources.list')
     if template_fn:
         params = {'mirror': mirror, 'codename': codename}
-        templater.render_to_file(template_fn, '/etc/apt/sources.list', params)
+        out_fn = cloud.paths.join(False, '/etc/apt/sources.list')
+        templater.render_to_file(template_fn, out_fn, params)
     else:
         log.warn("No template found, not rendering /etc/apt/sources.list")
 

From 3984a9004fc185ae3ee4d610f5581dfb5b3e0001 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 19:07:07 -0700
Subject: [PATCH 230/434] 1. Use the help message to show the default 2. Add a
 mode option into the 'config' subparser that allows the user to affect the
 transform selection phase 3. Some tiny pylint warnings.

---
 bin/cloud-init2.py | 21 ++++++++++++++++-----
 1 file changed, 16 insertions(+), 5 deletions(-)

diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
index 1f938f01..10cf4614 100755
--- a/bin/cloud-init2.py
+++ b/bin/cloud-init2.py
@@ -167,7 +167,7 @@ def main_init(name, args):
     welcome(name)
     try:
         init.fetch()
-    except sources.DataSourceNotFoundException as e:
+    except sources.DataSourceNotFoundException:
         util.logexc(LOG, "No instance datasource found!")
         # TODO: Return 0 or 1??
         return 1
@@ -223,25 +223,36 @@ def main():
                         version='%(prog)s ' + (version.version_string()))
     parser.add_argument('--file', '-f', action='append', 
                         dest='files',
-                        help='additional configuration file to include',
+                        help=('additional yaml configuration'
+                              ' files to use'),
                         type=argparse.FileType('rb'))
-    parser.add_argument('--debug', '-d', action='store_true', 
-                        help='show additional pre-action logging',
+    parser.add_argument('--debug', '-d', action='store_true',
+                        help=('show additional pre-action'
+                              ' logging (default: %(default)s)'),
                         default=False)
     subparsers = parser.add_subparsers()
 
+    # Possible mode names
+    mode_names = ('init', 'config', 'final')
+
     # Each action and its suboptions (if any)
     parser_init = subparsers.add_parser('init', 
                                         help=('initializes cloud-init and'
                                               ' performs \'init\' transforms'))
     parser_init.add_argument("--local", '-l', action='store_true',
-                             help="start in local mode", default=False)
+                             help="start in local mode (default: %(default)s)",
+                             default=False)
     # This is used so that we can know which action is selected
     parser_init.set_defaults(action='init')
 
     parser_config = subparsers.add_parser('config', 
                                           help=('performs cloud-init '
                                                 '\'config\' transforms'))
+    parser_config.add_argument("--mode", '-m', action='store',
+                             help=("transform configuration name "
+                                    "to use (default: %(default)s)"),
+                             default='config',
+                             choices=mode_names)
     parser_config.set_defaults(action='config')
 
     parser_final = subparsers.add_parser('final', 

From b0f0a89360d1b9b27b6cece6c5475ec30d4f4b04 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 20:57:12 -0700
Subject: [PATCH 231/434] Fix comparison to none, instead of empty in ds_deps
 assignment check.

---
 cloudinit/stages.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index d3e61ddc..95ac5313 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -54,7 +54,7 @@ LOG = logging.getLogger(__name__)
 
 class Init(object):
     def __init__(self, ds_deps=None):
-        if ds_deps:
+        if ds_deps is not None:
             self.ds_deps = ds_deps
         else:
             self.ds_deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]

From 49bfca3b192dac7edc5761c4edf22655c1a32bd6 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 20:57:43 -0700
Subject: [PATCH 232/434] 1. Move the running of transforms to a common
 function that returns a useful exit code 2. Add in the single transform
 running stub, which seems to be a feature of the previous cloud-init-cfg,
 making it its own action now 3. Adding in the 'config' and 'final' actions,
 which now both go through the same entrypoint function to setup the initial
 object    and then fire off the needed transforms. 4. Cleanup of the
 argparsing code to handle the above cases.

---
 bin/cloud-init2.py | 150 +++++++++++++++++++++++++++++++++------------
 1 file changed, 110 insertions(+), 40 deletions(-)

diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
index 10cf4614..010a1011 100755
--- a/bin/cloud-init2.py
+++ b/bin/cloud-init2.py
@@ -74,6 +74,20 @@ def welcome(action):
     LOG.info(welcome_msg)
 
 
+def run_transforms(tr, action_name, section):
+    full_section_name = TR_TPL % (section)
+    (ran_am, failures) = tr.run(full_section_name)
+    if not ran_am:
+        msg = ("No '%s' transforms to run"
+               " under section '%s'") % (action_name, full_section_name)
+        sys.stderr.write("%s\n" % (msg))
+        LOG.debug(msg)
+        return 0
+    else:
+        LOG.debug("Ran %s transforms with %s failures", ran_am, len(failures))
+        return len(failures)
+
+
 def main_init(name, args):
     deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
     if args.local:
@@ -106,6 +120,7 @@ def main_init(name, args):
     #    the transform objects configuration
     # 10. Run the transforms for the 'init' stage
     # 11. Done!
+    welcome(name)
     init = stages.Init(deps)
     # Stage 1
     init.read_cfg(cfg_extra_paths)
@@ -113,6 +128,8 @@ def main_init(name, args):
     outfmt = None
     errfmt = None
     try:
+        LOG.debug("Closing stdin")
+        util.close_stdin()
         (outfmt, errfmt) = util.fixup_output(init.cfg, name)
     except:
         util.logexc(LOG, "Failed to setup output redirection!")
@@ -164,7 +181,6 @@ def main_init(name, args):
         # Delete the non-net file as well
         util.del_file(os.path.join(path_helper.get_cpath("data"), "no-net"))
     # Stage 5
-    welcome(name)
     try:
         init.fetch()
     except sources.DataSourceNotFoundException:
@@ -199,26 +215,73 @@ def main_init(name, args):
     except:
         util.logexc(LOG, "Failed to adjust output redirection!")
     # Stage 10
-    section_name = TR_TPL % (name)
-    (ran_am, failures) = tr.run(section_name)
-    if not ran_am:
-        msg = "No %s transforms to run under section %s" % (name, section_name)
-        sys.stderr.write("%s\n" % (msg))
-        LOG.debug(msg)
-        return 0
-    return len(failures)
+    return run_transforms(tr, name, name)
 
 
-def main_config(_name, _args):
+def main_transform(_action_name, args):
+    name = args.mode
+    i_cfgs = []
+    if args.files:
+        for fh in args.files:
+            i_cfgs.append(fh.name)
+    # Cloud-init transform stages are broken up into the following sub-stages
+    # 1. Ensure that the init object fetches its config without errors
+    # 2. Get the datasource from the init object, if it does
+    #    not exist then that means the main_init stage never
+    #    worked, and thus this stage can not run.
+    # 3. Construct the transform object
+    # 4. Adjust any subsequent logging/output redirections using
+    #    the transform objects configuration
+    # 5. Run the transforms for the given stage name
+    # 6. Done!
+    welcome(name)
+    init = stages.Init(ds_deps=[])
+    # Stage 1
+    init.read_cfg(i_cfgs)
+    # Stage 2
+    try:
+        ds = init.fetch()
+    except sources.DataSourceNotFoundException:
+        # There was no datasource found, theres nothing to do
+        util.logexc(LOG, 'Can not apply stage %s, no datasource found', name)
+        return 1
+    # Stage 3
+    tr_cfgs = list(i_cfgs)
+    cc_cfg = init.paths.get_ipath_cur('cloud_config')
+    if settings.CFG_ENV_NAME in os.environ:
+        cc_cfg = os.environ[settings.CFG_ENV_NAME]
+    if cc_cfg and os.path.exists(cc_cfg):
+        tr_cfgs.append(cc_cfg)
+    tr = stages.Transforms(init, tr_cfgs)
+    # Stage 4
+    try:
+        LOG.debug("Closing stdin")
+        util.close_stdin()
+        (outfmt, errfmt) = util.fixup_output(tr.cfg, name)
+    except:
+        util.logexc(LOG, "Failed to setup output redirection!")
+    if args.debug:
+        # Reset so that all the debug handlers are closed out
+        LOG.debug(("Logging being reset, this logger may no"
+                    " longer be active shortly"))
+        logging.resetLogging()
+    logging.setupLogging(cc.cfg)
+    # Stage 5
+    return run_transforms(tr, name, name)
+
+
+def main_query(_name, _args):
     pass
 
 
-def main_final(_name, _args):
+def main_single(_name, _args):
     pass
 
 
 def main():
     parser = argparse.ArgumentParser()
+    
+    # Top level args
     parser.add_argument('--version', '-v', action='version', 
                         version='%(prog)s ' + (version.version_string()))
     parser.add_argument('--file', '-f', action='append', 
@@ -232,56 +295,63 @@ def main():
                         default=False)
     subparsers = parser.add_subparsers()
 
-    # Possible mode names
-    mode_names = ('init', 'config', 'final')
-
-    # Each action and its suboptions (if any)
+    # Each action and its sub-options (if any)
     parser_init = subparsers.add_parser('init', 
                                         help=('initializes cloud-init and'
-                                              ' performs \'init\' transforms'))
+                                              ' performs initial transforms'))
     parser_init.add_argument("--local", '-l', action='store_true',
                              help="start in local mode (default: %(default)s)",
                              default=False)
-    # This is used so that we can know which action is selected
-    parser_init.set_defaults(action='init')
+    # This is used so that we can know which action is selected + 
+    # the functor to use to run this subcommand
+    parser_init.set_defaults(action=('init', main_init))
 
-    parser_config = subparsers.add_parser('config', 
-                                          help=('performs cloud-init '
-                                                '\'config\' transforms'))
-    parser_config.add_argument("--mode", '-m', action='store',
+    # These settings are used for the 'config' and 'final' stages
+    parser_tr = subparsers.add_parser('transform', 
+                                      help=('performs transforms '
+                                            'using a given configuration key'))
+    parser_tr.add_argument("--mode", '-m', action='store',
                              help=("transform configuration name "
                                     "to use (default: %(default)s)"),
                              default='config',
-                             choices=mode_names)
-    parser_config.set_defaults(action='config')
-
-    parser_final = subparsers.add_parser('final', 
-                                         help=('performs cloud-init '
-                                               '\'final\' transforms'))
-    parser_final.set_defaults(action='final')
+                             choices=('config', 'final'))
+    parser_tr.set_defaults(action=('transform', main_transform))
 
+    # These settings are used when you want to query information
+    # stored in the cloud-init data objects/directories/files
     parser_query = subparsers.add_parser('query', 
                                          help=('query information stored '
                                                'in cloud-init'))
-    parser_query.add_argument("--name", action="store",
+    parser_query.add_argument("--name", '-n', action="store",
                               help="item name to query on",
                               required=True,
                               choices=QUERY_DATA_TYPES)
-    parser_query.set_defaults(action='query')
+    parser_query.set_defaults(action=('query', main_query))
+
+    # This subcommand allows you to run a single transform
+    parser_single = subparsers.add_parser('single', 
+                                         help=('run a single transform '))
+    parser_single.set_defaults(action=('single', main_single))
+    parser_single.add_argument("--name", '-n', action="store",
+                              help="transform name to run",
+                              required=True)
+    parser_single.add_argument("--frequency", action="store",
+                              help=("frequency of "
+                                    " the transform (default: %(default)s)"),
+                              required=False,
+                              default=settings.PER_ALWAYS,
+                              choices=settings.FREQUENCIES)
+    parser_single.set_defaults(action=('single', main_single))
+
+
     args = parser.parse_args()
-    
+
     # Setup basic logging to start (until reinitialized)
     if args.debug:
         logging.setupBasicLogging()
 
-    stage_name = args.action
-    stage_mp = {
-        'init': main_init,
-        'config': main_config,
-        'final': main_final,
-    }
-    func = stage_mp.get(stage_name)
-    return func(stage_name, args)
+    (name, functor) = args.action
+    return functor(name, args)
 
 
 if __name__ == '__main__':

From 4c9eba665e8141c6ae5a6a575e05e530da01a74f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 21:01:34 -0700
Subject: [PATCH 233/434] Pylint cleanups.

---
 bin/cloud-init2.py | 9 ++++-----
 1 file changed, 4 insertions(+), 5 deletions(-)

diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
index 010a1011..bb32da45 100755
--- a/bin/cloud-init2.py
+++ b/bin/cloud-init2.py
@@ -23,7 +23,6 @@
 
 import argparse
 import os
-import traceback
 import sys
 
 # This is more just for running from the bin folder
@@ -199,7 +198,7 @@ def main_init(name, args):
                                              freq=settings.PER_INSTANCE)
         if not ran:
             init.consume(settings.PER_ALWAYS)
-    except Exception as e:
+    except Exception:
         util.logexc(LOG, "Consuming user data failed!")
         return 1
     # Stage 8
@@ -240,7 +239,7 @@ def main_transform(_action_name, args):
     init.read_cfg(i_cfgs)
     # Stage 2
     try:
-        ds = init.fetch()
+        init.fetch()
     except sources.DataSourceNotFoundException:
         # There was no datasource found, theres nothing to do
         util.logexc(LOG, 'Can not apply stage %s, no datasource found', name)
@@ -257,7 +256,7 @@ def main_transform(_action_name, args):
     try:
         LOG.debug("Closing stdin")
         util.close_stdin()
-        (outfmt, errfmt) = util.fixup_output(tr.cfg, name)
+        util.fixup_output(tr.cfg, name)
     except:
         util.logexc(LOG, "Failed to setup output redirection!")
     if args.debug:
@@ -265,7 +264,7 @@ def main_transform(_action_name, args):
         LOG.debug(("Logging being reset, this logger may no"
                     " longer be active shortly"))
         logging.resetLogging()
-    logging.setupLogging(cc.cfg)
+    logging.setupLogging(tr.cfg)
     # Stage 5
     return run_transforms(tr, name, name)
 

From 02a44e7af6409179494fcf5905e5bf3efc11cd19 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 21:38:43 -0700
Subject: [PATCH 234/434] 1. Don't force the datasource to always fetch in
 construction (sometimes not wanted) 2. Add a run single transform function
 that can be used by the run single main entrypoint action 3. Add a find
 transform function to be used by the run single action to determine if a
 transform name is valid

---
 cloudinit/stages.py | 31 +++++++++++++++++++++++++++----
 1 file changed, 27 insertions(+), 4 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 95ac5313..7e64d3cd 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -379,7 +379,7 @@ class Init(object):
 
 class Transforms(object):
     def __init__(self, init, cfg_files=None):
-        self.datasource = init.fetch()
+        self.datasource = init.datasource
         self.cfg_files = cfg_files
         self.base_cfg = copy.deepcopy(init.cfg)
         self.init = init
@@ -418,7 +418,6 @@ class Transforms(object):
 
         return util.mergemanydict(t_cfgs)
 
-
     def _read_transforms(self, name):
         module_list = []
         if name not in self.cfg:
@@ -513,7 +512,31 @@ class Transforms(object):
                 failures.append((name, e))
         return (am_ran, failures)
 
-    def run(self, name):
-        raw_mods = self._read_transforms(name)
+    def find_transform(self, tr_name, sections):
+        found_where = []
+        for n in sections:
+            mods = self._read_transforms(n)
+            for mod_info in mods:
+                if mod_info.get('mod') == tr_name:
+                    found_where.append(n)
+        return found_where
+
+    def run_single(self, tr_name, section):
+        mods = self._read_transforms(section)
+        mod_tr = None
+        for mod_info in mods:
+            if mod_info.get('mod') == tr_name:
+                mod_tr = mod_info
+                break
+        if not mod_tr:
+            # Nothing to run, does that transform exist there??
+            return (0, 0)
+        else:
+            raw_mods = [mod_tr]
+            mostly_mods = self._fixup_transforms(raw_mods)
+            return self._run_transforms(mostly_mods)
+
+    def run_section(self, section_name):
+        raw_mods = self.read_transforms(section_name)
         mostly_mods = self._fixup_transforms(raw_mods)
         return self._run_transforms(mostly_mods)

From 0e584f2edd1b7d8e269e27a9a476d08e2fe89253 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 21:44:51 -0700
Subject: [PATCH 235/434] Allow the run single to pass in a set of args and a
 frequency that will replace the initial section's args and frequency if
 provided.  If not provided then no replacement occurs.

---
 cloudinit/stages.py | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 7e64d3cd..0c3d5915 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -521,7 +521,7 @@ class Transforms(object):
                     found_where.append(n)
         return found_where
 
-    def run_single(self, tr_name, section):
+    def run_single(self, tr_name, section, args=None, freq=None):
         mods = self._read_transforms(section)
         mod_tr = None
         for mod_info in mods:
@@ -532,6 +532,12 @@ class Transforms(object):
             # Nothing to run, does that transform exist there??
             return (0, 0)
         else:
+            # Adjust the module
+            if args:
+                mod_tr['args'] = args
+            if freq:
+                mod_tr['freq'] = freq
+            # Now resume doing the normal fixups and running
             raw_mods = [mod_tr]
             mostly_mods = self._fixup_transforms(raw_mods)
             return self._run_transforms(mostly_mods)

From 169eb13dfb60d3e8e4a06845f61a2d990d111288 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 21:46:01 -0700
Subject: [PATCH 236/434] Get single module running mode mostly working (still
 needs a little work).

---
 bin/cloud-init2.py | 93 ++++++++++++++++++++++++++++++++++------------
 1 file changed, 70 insertions(+), 23 deletions(-)

diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
index bb32da45..1f8d45bd 100755
--- a/bin/cloud-init2.py
+++ b/bin/cloud-init2.py
@@ -73,9 +73,22 @@ def welcome(action):
     LOG.info(welcome_msg)
 
 
-def run_transforms(tr, action_name, section):
+def extract_fns(args):
+    # Files are already opened so lets just pass that along
+    # since it would of broke if it couldn't have
+    # read that file already...
+    fn_cfgs = []
+    if args.files:
+        for fh in args.files:
+            # The realpath is more useful in logging
+            # so lets resolve to that...
+            fn_cfgs.append(os.path.realpath(fh.name))
+    return fn_cfgs
+
+
+def run_transform_section(tr, action_name, section):
     full_section_name = TR_TPL % (section)
-    (ran_am, failures) = tr.run(full_section_name)
+    (ran_am, failures) = tr.run_section(full_section_name)
     if not ran_am:
         msg = ("No '%s' transforms to run"
                " under section '%s'") % (action_name, full_section_name)
@@ -92,14 +105,6 @@ def main_init(name, args):
     if args.local:
         deps = [sources.DEP_FILESYSTEM]
 
-    cfg_extra_paths = []
-    if args.files:
-        # Already opened so lets just pass that along
-        # since it would of broke if it couldn't have
-        # read that file
-        for f in args.files:
-            cfg_extra_paths.append(f.name)
-
     if not args.local:
         # TODO: What is this for??
         root_name = "%s.d" % (settings.CLOUD_CONFIG)
@@ -122,7 +127,7 @@ def main_init(name, args):
     welcome(name)
     init = stages.Init(deps)
     # Stage 1
-    init.read_cfg(cfg_extra_paths)
+    init.read_cfg(extract_fns(args))
     # Stage 2
     outfmt = None
     errfmt = None
@@ -201,8 +206,8 @@ def main_init(name, args):
     except Exception:
         util.logexc(LOG, "Consuming user data failed!")
         return 1
-    # Stage 8
-    tr = stages.Transforms(init, cfg_extra_paths)
+    # Stage 8 - TODO - do we really need to re-extract our configs?
+    tr = stages.Transforms(init, extract_fns(args))
     # Stage 9 - TODO is this really needed??
     try:
         outfmt_orig = outfmt
@@ -214,15 +219,11 @@ def main_init(name, args):
     except:
         util.logexc(LOG, "Failed to adjust output redirection!")
     # Stage 10
-    return run_transforms(tr, name, name)
+    return run_transform_section(tr, name, name)
 
 
 def main_transform(_action_name, args):
     name = args.mode
-    i_cfgs = []
-    if args.files:
-        for fh in args.files:
-            i_cfgs.append(fh.name)
     # Cloud-init transform stages are broken up into the following sub-stages
     # 1. Ensure that the init object fetches its config without errors
     # 2. Get the datasource from the init object, if it does
@@ -236,7 +237,7 @@ def main_transform(_action_name, args):
     welcome(name)
     init = stages.Init(ds_deps=[])
     # Stage 1
-    init.read_cfg(i_cfgs)
+    init.read_cfg(extract_fns(args))
     # Stage 2
     try:
         init.fetch()
@@ -245,7 +246,7 @@ def main_transform(_action_name, args):
         util.logexc(LOG, 'Can not apply stage %s, no datasource found', name)
         return 1
     # Stage 3
-    tr_cfgs = list(i_cfgs)
+    tr_cfgs = extract_fns(args)
     cc_cfg = init.paths.get_ipath_cur('cloud_config')
     if settings.CFG_ENV_NAME in os.environ:
         cc_cfg = os.environ[settings.CFG_ENV_NAME]
@@ -266,15 +267,57 @@ def main_transform(_action_name, args):
         logging.resetLogging()
     logging.setupLogging(tr.cfg)
     # Stage 5
-    return run_transforms(tr, name, name)
+    return run_transform_section(tr, name, name)
 
 
 def main_query(_name, _args):
     pass
 
 
-def main_single(_name, _args):
-    pass
+def main_single(name, args):
+    # Cloud-init single stage is broken up into the following sub-stages
+    # 1. Ensure that the init object fetches its config without errors
+    # 2. Check to see if we can find the transform name
+    #    in the 'init', 'final', 'config' stages, if not bail
+    # 3. Get the datasource from the init object, if it does
+    #    not exist then that means the main_init stage never
+    #    worked, and thus this stage can not run.
+    # 4. Construct the transform object
+    # 5. Adjust any subsequent logging/output redirections using
+    #    the transform objects configuration
+    # 6. Run the single transform
+    # 7. Done!
+    transform_name = args.name
+    st_name = "%s:%s" % (name, transform_name)
+    welcome(st_name)
+    init = stages.Init(ds_deps=[])
+    # Stage 1
+    init.read_cfg(extract_fns(args))
+    tr = stages.Transforms(init, extract_fns(args))
+    where_look = [
+        TR_TPL % ('init'),
+        TR_TPL % ('config'),
+        TR_TPL % ('final'),
+    ]
+    found_at = tr.find_transform(transform_name, where_look)
+    if not found_at:
+        msg = ("No known transform named %s "
+              "in sections %s") % (transform_name, where_look)
+        sys.stderr.write("%s\n" % (msg))
+        LOG.warn(msg)
+        return 1
+    else:
+        LOG.debug("Found transform %s in section/s: %s",
+                  transform_name, found_at)
+        LOG.debug("Selecting section %s as its run section.", found_at[0])
+        (_run_am, failures) = tr.run_single(transform_name, found_at[0],
+                                            args.transform_args,
+                                            args.frequency)
+        if failures:
+            LOG.debug("Ran %s but it failed", transform_name)
+            return 1
+        else:
+            return 0
 
 
 def main():
@@ -340,6 +383,10 @@ def main():
                               required=False,
                               default=settings.PER_ALWAYS,
                               choices=settings.FREQUENCIES)
+    parser_single.add_argument("transform_args", nargs="*",
+                              metavar='argument',
+                              help=('any additional arguments to'
+                                    ' pass to this transform'))
     parser_single.set_defaults(action=('single', main_single))
 
 

From da2e42042ccb555694ea0347eead29d457bd8d86 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 21:49:58 -0700
Subject: [PATCH 237/434] Pylint line length fixups.

---
 cloudinit/distros/rhel.py   | 3 ++-
 cloudinit/distros/ubuntu.py | 3 ++-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index e9f3f5d9..b67ae5b8 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -117,7 +117,8 @@ class Distro(distros.Distro):
         if not hostname_prev or hostname_prev != hostname:
             update_files.append(prev_file)
         if (not hostname_in_sys or
-            (hostname_in_sys == hostname_prev and hostname_in_sys != hostname)):
+            (hostname_in_sys == hostname_prev
+             and hostname_in_sys != hostname)):
             write_fn = self._paths.join(False, "/etc/sysconfig/network")
             update_files.append(write_fn)
         for fn in update_files:
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index 515b59c8..5a1b572e 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -72,7 +72,8 @@ class Distro(distros.Distro):
         if not hostname_prev or hostname_prev != hostname:
             update_files.append(prev_fn)
         if (not hostname_in_etc or
-            (hostname_in_etc == hostname_prev and hostname_in_etc != hostname)):
+            (hostname_in_etc == hostname_prev and
+             hostname_in_etc != hostname)):
             write_fn = self._paths.join(False, "/etc/hostname")
             update_files.append(write_fn)
         for fn in update_files:

From 0e6f240430a07264341a9edc3a7b9f8a4c8dc851 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 19 Jun 2012 21:50:10 -0700
Subject: [PATCH 238/434] Add dependency on argparse.

---
 Requires | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/Requires b/Requires
index e2ec8ff7..5a350900 100644
--- a/Requires
+++ b/Requires
@@ -23,3 +23,5 @@ configobj>=4.6
 # All new style configurations are in the yaml format
 pyyaml>=3.0
 
+# The new main entrypoint uses argparse instead of optparse
+argparse>=1.1

From 84a1432b47e192d0a3a2ab3a494aba3cee808c9a Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Wed, 20 Jun 2012 00:21:56 -0700
Subject: [PATCH 239/434] Uppercase constants, remove need to use
 cloud.paths.join since scripts_d should already be modified

---
 cloudinit/transforms/rightscale_userdata.py | 13 ++++++-------
 1 file changed, 6 insertions(+), 7 deletions(-)

diff --git a/cloudinit/transforms/rightscale_userdata.py b/cloudinit/transforms/rightscale_userdata.py
index dc06f9ec..8385e281 100644
--- a/cloudinit/transforms/rightscale_userdata.py
+++ b/cloudinit/transforms/rightscale_userdata.py
@@ -45,8 +45,8 @@ from urlparse import parse_qs
 
 frequency = PER_INSTANCE
 
-my_name = "cc_rightscale_userdata"
-my_hookname = 'CLOUD_INIT_REMOTE_HOOK'
+MY_NAME = "cc_rightscale_userdata"
+MY_HOOKNAME = 'CLOUD_INIT_REMOTE_HOOK'
 
 
 def handle(name, _cfg, cloud, log, _args):
@@ -58,10 +58,10 @@ def handle(name, _cfg, cloud, log, _args):
 
     try:
         mdict = parse_qs(ud)
-        if not mdict or not my_hookname in mdict:
+        if not mdict or not MY_HOOKNAME in mdict:
             log.debug(("Skipping transform %s, "
                        "did not find %s in parsed"
-                       " raw userdata"), name, my_hookname)
+                       " raw userdata"), name, MY_HOOKNAME)
             return
     except:
         util.logexc(log, ("Failed to parse query string %s"
@@ -75,10 +75,9 @@ def handle(name, _cfg, cloud, log, _args):
     # TODO: maybe this should just be a new user data handler??
     # Instead of a late transform that acts like a user data handler?
     scripts_d = cloud.get_ipath_cur('scripts')
-    urls = mdict[my_hookname]
+    urls = mdict[MY_HOOKNAME]
     for (i, url) in enumerate(urls):
         fname = os.path.join(scripts_d, "rightscale-%02i" % (i))
-        fname = cloud.paths.join(False, fname)
         try:
             resp = uhelp.readurl(url)
             # Ensure its a valid http response (and something gotten)
@@ -88,7 +87,7 @@ def handle(name, _cfg, cloud, log, _args):
         except Exception as e:
             captured_excps.append(e)
             util.logexc(log, "%s failed to read %s and write %s",
-                        my_name, url, fname)
+                        MY_NAME, url, fname)
 
     if wrote_fns:
         log.debug("Wrote out rightscale userdata to %s files", len(wrote_fns))

From fc20df93a648dcbf0f4cc52346ef95d7938349a9 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Wed, 20 Jun 2012 00:26:45 -0700
Subject: [PATCH 240/434] Always provide a path here, in this case the root
 path

---
 cloudinit/transforms/resizefs.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/transforms/resizefs.py b/cloudinit/transforms/resizefs.py
index fd2bb9e1..1690094a 100644
--- a/cloudinit/transforms/resizefs.py
+++ b/cloudinit/transforms/resizefs.py
@@ -78,7 +78,7 @@ def handle(name, cfg, cloud, log, args):
     util.ensure_dir(resize_root_d)
 
     # TODO: allow what is to be resized to be configurable??
-    resize_what = cloud.paths.join(False)
+    resize_what = cloud.paths.join(False, "/")
     with util.SilentTemporaryFile(prefix="cloudinit.resizefs.",
                                   dir=resize_root_d, delete=True) as tfh:
         devpth = tfh.name

From d1d46275b293d5714729053786098778de2ed6e4 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Wed, 20 Jun 2012 00:29:51 -0700
Subject: [PATCH 241/434] Ensure any authorized key file found in authorized
 keys is path adjusted as well

---
 cloudinit/ssh_util.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index 96143d32..fef3d40f 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -244,7 +244,7 @@ def setup_user_keys(keys, user, key_prefix, paths):
             akeys = akeys.replace("%%", '%')
             if not akeys.startswith('/'):
                 akeys = os.path.join(pwent.pw_dir, akeys)
-            authorized_keys = akeys
+            authorized_keys = paths.join(False, akeys)
         except (IOError, OSError):
             authorized_keys = os.path.join(ssh_dir, 'authorized_keys')
             util.logexc(LOG, ("Failed extracting 'AuthorizedKeysFile'"

From ed59370877c470abcbb7b0e135fb4d11f1ddac89 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Wed, 20 Jun 2012 00:31:45 -0700
Subject: [PATCH 242/434] Show the lock object name and the lock value - useful
 for debugging

---
 cloudinit/helpers.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 09686340..21d203db 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -155,8 +155,8 @@ class Runners(object):
             if not lk:
                 raise LockFailure("Failed to acquire lock for %s" % name)
             else:
-                LOG.debug("Running %s with args %s using lock %s",
-                          functor, args, lk)
+                LOG.debug("Running %s with args %s using lock %s (%s)",
+                          functor, args, util.obj_name(lk), lk)
                 if isinstance(args, (dict)):
                     results = functor(**args)
                 else:

From 9f373034e42b148f5a833000fb136e1a565841b2 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Wed, 20 Jun 2012 00:36:43 -0700
Subject: [PATCH 243/434] Change this call back to the protected function name
 after making the run single transform mode work

---
 cloudinit/stages.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 0c3d5915..f39b6532 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -543,6 +543,6 @@ class Transforms(object):
             return self._run_transforms(mostly_mods)
 
     def run_section(self, section_name):
-        raw_mods = self.read_transforms(section_name)
+        raw_mods = self._read_transforms(section_name)
         mostly_mods = self._fixup_transforms(raw_mods)
         return self._run_transforms(mostly_mods)

From 0bb5df891257f3722234e89dfc2c4faa5f05cfc1 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Wed, 20 Jun 2012 00:41:39 -0700
Subject: [PATCH 244/434] Use comparisons instead of xrange, until python 3
 when it should be more efficient

---
 cloudinit/url_helper.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index c69da1bb..1c583eba 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -59,11 +59,14 @@ class UrlResponse(object):
             return str(self.contents)
 
     def ok(self, redirects_ok=False):
+        upper = 300
         if redirects_ok:
-            return self.code in xrange(200, 400)
+            upper = 400
+        if self.code >= 200 and self.code < upper:
+            return True
         else:
-            return self.code in xrange(200, 300)
-
+            return False
+    
 
 def readurl(url, data=None, timeout=None,
             retries=0, sec_between=1, headers=None):

From d9981c5f019edec352eaa979f65a39c4be76499d Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Wed, 20 Jun 2012 00:43:46 -0700
Subject: [PATCH 245/434] Show log message that says ec2 route disabling is not
 enabled

---
 cloudinit/transforms/disable_ec2_metadata.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/cloudinit/transforms/disable_ec2_metadata.py b/cloudinit/transforms/disable_ec2_metadata.py
index 3c0dd57b..c7d26029 100644
--- a/cloudinit/transforms/disable_ec2_metadata.py
+++ b/cloudinit/transforms/disable_ec2_metadata.py
@@ -27,7 +27,10 @@ frequency = PER_ALWAYS
 reject_cmd = ['route', 'add', '-host', '169.254.169.254', 'reject']
 
 
-def handle(_name, cfg, _cloud, _log, _args):
+def handle(name, cfg, _cloud, log, _args):
     disabled = util.get_cfg_option_bool(cfg, "disable_ec2_metadata", False)
     if disabled:
         util.subp(reject_cmd)
+    else:
+        log.debug(("Skipping transform named %s,"
+                   " disabling the ec2 route not enabled"), name)

From 00e1cd2e4f99c1eeccdec9e62ac3dd09bfdac688 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 12:02:17 -0700
Subject: [PATCH 246/434] Make the single run mode setup the output redirection
 and logging accordingly

---
 bin/cloud-init2.py | 68 ++++++++++++++++++++++++++++------------------
 1 file changed, 42 insertions(+), 26 deletions(-)

diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
index 1f8d45bd..135e4114 100755
--- a/bin/cloud-init2.py
+++ b/bin/cloud-init2.py
@@ -54,10 +54,6 @@ QUERY_DATA_TYPES = [
 LOG = logging.getLogger()
 
 
-def warn(wstr):
-    sys.stderr.write("WARN: %s\n" % (wstr))
-
-
 def welcome(action):
     msg = ("Cloud-init v. {{version}} running '{{action}}' at "
            "{{timestamp}}. Up {{uptime}} seconds.")
@@ -202,6 +198,8 @@ def main_init(name, args):
                                              args=[settings.PER_INSTANCE],
                                              freq=settings.PER_INSTANCE)
         if not ran:
+            # Just consume anything that is set to run per
+            # always if nothing ran in the per instance section
             init.consume(settings.PER_ALWAYS)
     except Exception:
         util.logexc(LOG, "Consuming user data failed!")
@@ -217,12 +215,12 @@ def main_init(name, args):
             LOG.warn("Stdout, stderr changing to (%s, %s)", outfmt, errfmt)
             (outfmt, errfmt) = util.fixup_output(tr.cfg, name)
     except:
-        util.logexc(LOG, "Failed to adjust output redirection!")
+        util.logexc(LOG, "Failed to re-adjust output redirection!")
     # Stage 10
     return run_transform_section(tr, name, name)
 
 
-def main_transform(_action_name, args):
+def main_transform(action_name, args):
     name = args.mode
     # Cloud-init transform stages are broken up into the following sub-stages
     # 1. Ensure that the init object fetches its config without errors
@@ -234,7 +232,7 @@ def main_transform(_action_name, args):
     #    the transform objects configuration
     # 5. Run the transforms for the given stage name
     # 6. Done!
-    welcome(name)
+    welcome("%s:%s" % (action_name, name))
     init = stages.Init(ds_deps=[])
     # Stage 1
     init.read_cfg(extract_fns(args))
@@ -243,7 +241,7 @@ def main_transform(_action_name, args):
         init.fetch()
     except sources.DataSourceNotFoundException:
         # There was no datasource found, theres nothing to do
-        util.logexc(LOG, 'Can not apply stage %s, no datasource found', name)
+        util.logexc(LOG, 'Can not apply stage %s, no datasource found!', name)
         return 1
     # Stage 3
     tr_cfgs = extract_fns(args)
@@ -287,34 +285,52 @@ def main_single(name, args):
     #    the transform objects configuration
     # 6. Run the single transform
     # 7. Done!
-    transform_name = args.name
-    st_name = "%s:%s" % (name, transform_name)
-    welcome(st_name)
+    tr_name = args.name
+    welcome("%s:%s" % (name, tr_name))
     init = stages.Init(ds_deps=[])
     # Stage 1
     init.read_cfg(extract_fns(args))
     tr = stages.Transforms(init, extract_fns(args))
-    where_look = [
-        TR_TPL % ('init'),
-        TR_TPL % ('config'),
-        TR_TPL % ('final'),
-    ]
-    found_at = tr.find_transform(transform_name, where_look)
+    where_look_mp = {
+        TR_TPL % ('init'): 'init',
+        TR_TPL % ('config'): 'config',
+        TR_TPL % ('final'): 'final',
+    }
+    where_look = list(where_look_mp.keys())
+    found_at = tr.find_transform(tr_name, where_look)
     if not found_at:
         msg = ("No known transform named %s "
-              "in sections %s") % (transform_name, where_look)
-        sys.stderr.write("%s\n" % (msg))
+              "in sections (%s)") % (tr_name, ", ".join(where_look))
         LOG.warn(msg)
         return 1
     else:
-        LOG.debug("Found transform %s in section/s: %s",
-                  transform_name, found_at)
-        LOG.debug("Selecting section %s as its run section.", found_at[0])
-        (_run_am, failures) = tr.run_single(transform_name, found_at[0],
-                                            args.transform_args,
-                                            args.frequency)
+        LOG.debug("Found transform %s in sections: %s",
+                  tr_name, found_at)
+        sect_name = found_at[0]
+        LOG.debug("Selecting section %s as its 'source' section.", sect_name)
+        tr_args = args.transform_args
+        if tr_args:
+            LOG.debug("Using passed in arguments %s", tr_args)
+        tr_freq = args.frequency
+        if tr_freq:
+            LOG.debug("Using passed in frequency %s", tr_freq)
+        try:
+            LOG.debug("Closing stdin")
+            util.close_stdin()
+            # This seems to use the short name, instead of the long name
+            util.fixup_output(tr.cfg, where_look_mp.get(sect_name))
+        except:
+            util.logexc(LOG, "Failed to setup output redirection!")
+        if args.debug:
+            # Reset so that all the debug handlers are closed out
+            LOG.debug(("Logging being reset, this logger may no"
+                       " longer be active shortly"))
+            logging.resetLogging()
+        logging.setupLogging(tr.cfg)
+        (_run_am, failures) = tr.run_single(tr_name, sect_name,
+                                            tr_args, tr_freq)
         if failures:
-            LOG.debug("Ran %s but it failed", transform_name)
+            LOG.debug("Ran %s but it failed", tr_name)
             return 1
         else:
             return 0

From d2892598762c03883dd6b25da1a16487ff77d57c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 12:10:20 -0700
Subject: [PATCH 247/434] Removed the older binaries, now superseded by a
 unified binary.

---
 bin/cloud-init-cfg.py   | 115 --------
 bin/cloud-init-query.py |  56 ----
 bin/cloud-init.py       | 564 +++++++++++++++++++++++++++-------------
 bin/cloud-init2.py      | 421 ------------------------------
 4 files changed, 378 insertions(+), 778 deletions(-)
 delete mode 100755 bin/cloud-init-cfg.py
 delete mode 100755 bin/cloud-init-query.py
 delete mode 100755 bin/cloud-init2.py

diff --git a/bin/cloud-init-cfg.py b/bin/cloud-init-cfg.py
deleted file mode 100755
index 3a475c1c..00000000
--- a/bin/cloud-init-cfg.py
+++ /dev/null
@@ -1,115 +0,0 @@
-#!/usr/bin/python
-# vi: ts=4 expandtab
-#
-#    Copyright (C) 2009-2010 Canonical Ltd.
-#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
-#
-#    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
-#
-#    This program is free software: you can redistribute it and/or modify
-#    it under the terms of the GNU General Public License version 3, as
-#    published by the Free Software Foundation.
-#
-#    This program is distributed in the hope that it will be useful,
-#    but WITHOUT ANY WARRANTY; without even the implied warranty of
-#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-#    GNU General Public License for more details.
-#
-#    You should have received a copy of the GNU General Public License
-#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-import sys
-import cloudinit
-import cloudinit.util as util
-import cloudinit.CloudConfig as CC
-import logging
-import os
-
-
-def Usage(out=sys.stdout):
-    out.write("Usage: %s name\n" % sys.argv[0])
-
-
-def main():
-    # expect to be called with
-    #   name [ freq [ args ]
-    #   run the cloud-config job 'name' at with given args
-    # or
-    #   read cloud config jobs from config (builtin -> system)
-    #   and run all in order
-
-    util.close_stdin()
-
-    modename = "config"
-
-    if len(sys.argv) < 2:
-        Usage(sys.stderr)
-        sys.exit(1)
-    if sys.argv[1] == "all":
-        name = "all"
-        if len(sys.argv) > 2:
-            modename = sys.argv[2]
-    else:
-        freq = None
-        run_args = []
-        name = sys.argv[1]
-        if len(sys.argv) > 2:
-            freq = sys.argv[2]
-            if freq == "None":
-                freq = None
-        if len(sys.argv) > 3:
-            run_args = sys.argv[3:]
-
-    cfg_path = cloudinit.get_ipath_cur("cloud_config")
-    cfg_env_name = cloudinit.cfg_env_name
-    if cfg_env_name in os.environ:
-        cfg_path = os.environ[cfg_env_name]
-
-    cloud = cloudinit.CloudInit(ds_deps=[])  # ds_deps=[], get only cached
-    try:
-        cloud.get_data_source()
-    except cloudinit.DataSourceNotFoundException as e:
-        # there was no datasource found, theres nothing to do
-        sys.exit(0)
-
-    cc = CC.CloudConfig(cfg_path, cloud)
-
-    try:
-        (outfmt, errfmt) = CC.get_output_cfg(cc.cfg, modename)
-        CC.redirect_output(outfmt, errfmt)
-    except Exception as e:
-        err("Failed to get and set output config: %s\n" % e)
-
-    cloudinit.logging_set_from_cfg(cc.cfg)
-    log = logging.getLogger()
-    log.info("cloud-init-cfg %s" % sys.argv[1:])
-
-    module_list = []
-    if name == "all":
-        modlist_cfg_name = "cloud_%s_modules" % modename
-        module_list = CC.read_cc_modules(cc.cfg, modlist_cfg_name)
-        if not len(module_list):
-            err("no modules to run in cloud_config [%s]" % modename, log)
-            sys.exit(0)
-    else:
-        module_list.append([name, freq] + run_args)
-
-    failures = CC.run_cc_modules(cc, module_list, log)
-    if len(failures):
-        err("errors running cloud_config [%s]: %s" % (modename, failures), log)
-    sys.exit(len(failures))
-
-
-def err(msg, log=None):
-    if log:
-        log.error(msg)
-    sys.stderr.write(msg + "\n")
-
-
-def fail(msg, log=None):
-    err(msg, log)
-    sys.exit(1)
-
-if __name__ == '__main__':
-    main()
diff --git a/bin/cloud-init-query.py b/bin/cloud-init-query.py
deleted file mode 100755
index 856cf462..00000000
--- a/bin/cloud-init-query.py
+++ /dev/null
@@ -1,56 +0,0 @@
-#!/usr/bin/python
-# vi: ts=4 expandtab
-#
-#    Copyright (C) 2009-2010 Canonical Ltd.
-#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
-#
-#    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
-#
-#    This program is free software: you can redistribute it and/or modify
-#    it under the terms of the GNU General Public License version 3, as
-#    published by the Free Software Foundation.
-#
-#    This program is distributed in the hope that it will be useful,
-#    but WITHOUT ANY WARRANTY; without even the implied warranty of
-#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-#    GNU General Public License for more details.
-#
-#    You should have received a copy of the GNU General Public License
-#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-import sys
-import cloudinit
-import cloudinit.CloudConfig
-
-
-def Usage(out=sys.stdout):
-    out.write("Usage: %s name\n" % sys.argv[0])
-
-
-def main():
-    # expect to be called with name of item to fetch
-    if len(sys.argv) != 2:
-        Usage(sys.stderr)
-        sys.exit(1)
-
-    cfg_path = cloudinit.get_ipath_cur("cloud_config")
-    cc = cloudinit.CloudConfig.CloudConfig(cfg_path)
-    data = {
-        'user_data': cc.cloud.get_userdata(),
-        'user_data_raw': cc.cloud.get_userdata_raw(),
-        'instance_id': cc.cloud.get_instance_id(),
-    }
-
-    name = sys.argv[1].replace('-', '_')
-
-    if name not in data:
-        sys.stderr.write("unknown name '%s'.  Known values are:\n  %s\n" %
-            (sys.argv[1], ' '.join(data.keys())))
-        sys.exit(1)
-
-    print data[name]
-    sys.exit(0)
-
-if __name__ == '__main__':
-    main()
diff --git a/bin/cloud-init.py b/bin/cloud-init.py
index 2acea3f8..99ecdaf9 100755
--- a/bin/cloud-init.py
+++ b/bin/cloud-init.py
@@ -1,11 +1,13 @@
 #!/usr/bin/python
 # vi: ts=4 expandtab
 #
-#    Copyright (C) 2009-2010 Canonical Ltd.
+#    Copyright (C) 2012 Canonical Ltd.
 #    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
 #
 #    Author: Scott Moser <scott.moser@canonical.com>
 #    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
 #
 #    This program is free software: you can redistribute it and/or modify
 #    it under the terms of the GNU General Public License version 3, as
@@ -19,211 +21,401 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import subprocess
+import argparse
+import os
 import sys
 
-import cloudinit
-import cloudinit.util as util
-import cloudinit.CloudConfig as CC
-import cloudinit.DataSource as ds
-import cloudinit.netinfo as netinfo
-import time
-import traceback
-import logging
-import errno
-import os
+# This is more just for running from the bin folder
+possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
+        sys.argv[0]), os.pardir, os.pardir))
+if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
+    sys.path.insert(0, possible_topdir)
+
+from cloudinit import log as logging
+from cloudinit import netinfo
+from cloudinit import settings
+from cloudinit import sources
+from cloudinit import stages
+from cloudinit import templater
+from cloudinit import util
+from cloudinit import version
 
 
-def warn(wstr):
-    sys.stderr.write("WARN:%s" % wstr)
+# Transform section template
+TR_TPL = "cloud_%s_modules"
+
+# Things u can query on
+QUERY_DATA_TYPES = [
+    'data',
+    'data_raw',
+    'instance_id',
+]
+
+LOG = logging.getLogger()
 
 
-def main():
-    util.close_stdin()
-
-    cmds = ("start", "start-local")
-    deps = {"start": (ds.DEP_FILESYSTEM, ds.DEP_NETWORK),
-            "start-local": (ds.DEP_FILESYSTEM, )}
-
-    cmd = ""
-    if len(sys.argv) > 1:
-        cmd = sys.argv[1]
-
-    cfg_path = None
-    if len(sys.argv) > 2:
-        # this is really for debugging only
-        # but you can invoke on development system with ./config/cloud.cfg
-        cfg_path = sys.argv[2]
-
-    if not cmd in cmds:
-        sys.stderr.write("bad command %s. use one of %s\n" % (cmd, cmds))
-        sys.exit(1)
-
-    now = time.strftime("%a, %d %b %Y %H:%M:%S %z", time.gmtime())
-    try:
-        uptimef = open("/proc/uptime")
-        uptime = uptimef.read().split(" ")[0]
-        uptimef.close()
-    except IOError as e:
-        warn("unable to open /proc/uptime\n")
-        uptime = "na"
-
-    cmdline_msg = None
-    cmdline_exc = None
-    if cmd == "start":
-        target = "%s.d/%s" % (cloudinit.system_config,
-            "91_kernel_cmdline_url.cfg")
-        if os.path.exists(target):
-            cmdline_msg = "cmdline: %s existed" % target
-        else:
-            cmdline = util.get_cmdline()
-            try:
-                (key, url, content) = cloudinit.get_cmdline_url(
-                    cmdline=cmdline)
-                if key and content:
-                    util.write_file(target, content, mode=0600)
-                    cmdline_msg = ("cmdline: wrote %s from %s, %s" %
-                        (target, key, url))
-                elif key:
-                    cmdline_msg = ("cmdline: %s, %s had no cloud-config" %
-                        (key, url))
-            except Exception:
-                cmdline_exc = ("cmdline: '%s' raised exception\n%s" %
-                    (cmdline, traceback.format_exc()))
-                warn(cmdline_exc)
-
-    try:
-        cfg = cloudinit.get_base_cfg(cfg_path)
-    except Exception as e:
-        warn("Failed to get base config. falling back to builtin: %s\n" % e)
-        try:
-            cfg = cloudinit.get_builtin_cfg()
-        except Exception as e:
-            warn("Unable to load builtin config\n")
-            raise
-
-    try:
-        (outfmt, errfmt) = CC.get_output_cfg(cfg, "init")
-        CC.redirect_output(outfmt, errfmt)
-    except Exception as e:
-        warn("Failed to get and set output config: %s\n" % e)
-
-    cloudinit.logging_set_from_cfg(cfg)
-    log = logging.getLogger()
-
-    if cmdline_exc:
-        log.debug(cmdline_exc)
-    elif cmdline_msg:
-        log.debug(cmdline_msg)
-
-    try:
-        cloudinit.initfs()
-    except Exception as e:
-        warn("failed to initfs, likely bad things to come: %s\n" % str(e))
-
-    nonet_path = "%s/%s" % (cloudinit.get_cpath("data"), "no-net")
-
-    if cmd == "start":
-        print netinfo.debug_info()
-
-        stop_files = (cloudinit.get_ipath_cur("obj_pkl"), nonet_path)
-        # if starting as the network start, there are cases
-        # where everything is already done for us, and it makes
-        # most sense to exit early and silently
-        for f in stop_files:
-            try:
-                fp = open(f, "r")
-                fp.close()
-            except:
-                continue
-
-            log.debug("no need for cloud-init start to run (%s)\n", f)
-            sys.exit(0)
-    elif cmd == "start-local":
-        # cache is not instance specific, so it has to be purged
-        # but we want 'start' to benefit from a cache if
-        # a previous start-local populated one
-        manclean = util.get_cfg_option_bool(cfg, 'manual_cache_clean', False)
-        if manclean:
-            log.debug("not purging cache, manual_cache_clean = True")
-        cloudinit.purge_cache(not manclean)
-
-        try:
-            os.unlink(nonet_path)
-        except OSError as e:
-            if e.errno != errno.ENOENT:
-                raise
-
-    msg = "cloud-init %s running: %s. up %s seconds" % (cmd, now, uptime)
-    sys.stderr.write(msg + "\n")
+def welcome(action):
+    msg = ("Cloud-init v. {{version}} running '{{action}}' at "
+           "{{timestamp}}. Up {{uptime}} seconds.")
+    tpl_params = {
+        'version': version.version_string(),
+        'uptime': util.uptime(),
+        'timestamp': util.time_rfc2822(),
+        'action': action,
+    }
+    welcome_msg = "%s" % (templater.render_string(msg, tpl_params))
+    sys.stderr.write("%s\n" % (welcome_msg))
     sys.stderr.flush()
+    LOG.info(welcome_msg)
 
-    log.info(msg)
 
-    cloud = cloudinit.CloudInit(ds_deps=deps[cmd])
+def extract_fns(args):
+    # Files are already opened so lets just pass that along
+    # since it would of broke if it couldn't have
+    # read that file already...
+    fn_cfgs = []
+    if args.files:
+        for fh in args.files:
+            # The realpath is more useful in logging
+            # so lets resolve to that...
+            fn_cfgs.append(os.path.realpath(fh.name))
+    return fn_cfgs
 
+
+def run_transform_section(tr, action_name, section):
+    full_section_name = TR_TPL % (section)
+    (ran_am, failures) = tr.run_section(full_section_name)
+    if not ran_am:
+        msg = ("No '%s' transforms to run"
+               " under section '%s'") % (action_name, full_section_name)
+        sys.stderr.write("%s\n" % (msg))
+        LOG.debug(msg)
+        return 0
+    else:
+        LOG.debug("Ran %s transforms with %s failures", ran_am, len(failures))
+        return len(failures)
+
+
+def main_init(name, args):
+    deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
+    if args.local:
+        deps = [sources.DEP_FILESYSTEM]
+
+    if not args.local:
+        # TODO: What is this for??
+        root_name = "%s.d" % (settings.CLOUD_CONFIG)
+        target_fn = os.path.join(root_name, "91_kernel_cmdline_url.cfg")
+        util.read_write_cmdline_url(target_fn)
+
+    # Cloud-init 'init' stage is broken up into the following sub-stages
+    # 1. Ensure that the init object fetches its config without errors
+    # 2. Setup logging/output redirections with resultant config (if any)
+    # 3. Initialize the cloud-init filesystem
+    # 4. Check if we can stop early by looking for various files
+    # 5. Fetch the datasource
+    # 6. Connect to the current instance location + update the cache
+    # 7. Consume the userdata (handlers get activated here)
+    # 8. Construct the transform object
+    # 9. Adjust any subsequent logging/output redirections using
+    #    the transform objects configuration
+    # 10. Run the transforms for the 'init' stage
+    # 11. Done!
+    welcome(name)
+    init = stages.Init(deps)
+    # Stage 1
+    init.read_cfg(extract_fns(args))
+    # Stage 2
+    outfmt = None
+    errfmt = None
     try:
-        cloud.get_data_source()
-    except cloudinit.DataSourceNotFoundException as e:
-        sys.stderr.write("no instance data found in %s\n" % cmd)
-        sys.exit(0)
-
-    # set this as the current instance
-    cloud.set_cur_instance()
-
-    # store the metadata
-    cloud.update_cache()
-
-    msg = "found data source: %s" % cloud.datasource
-    sys.stderr.write(msg + "\n")
-    log.debug(msg)
-
-    # parse the user data (ec2-run-userdata.py)
-    try:
-        ran = cloud.sem_and_run("consume_userdata", cloudinit.per_instance,
-            cloud.consume_userdata, [cloudinit.per_instance], False)
-        if not ran:
-            cloud.consume_userdata(cloudinit.per_always)
+        LOG.debug("Closing stdin")
+        util.close_stdin()
+        (outfmt, errfmt) = util.fixup_output(init.cfg, name)
     except:
-        warn("consuming user data failed!\n")
-        raise
-
-    cfg_path = cloudinit.get_ipath_cur("cloud_config")
-    cc = CC.CloudConfig(cfg_path, cloud)
-
-    # if the output config changed, update output and err
+        util.logexc(LOG, "Failed to setup output redirection!")
+    if args.debug:
+        # Reset so that all the debug handlers are closed out
+        LOG.debug(("Logging being reset, this logger may no"
+                    " longer be active shortly"))
+        logging.resetLogging()
+    logging.setupLogging(init.cfg)
+    # Stage 3
+    try:
+        init.initialize()
+    except Exception:
+        util.logexc(LOG, "Failed to initialize, likely bad things to come!")
+    # Stage 4
+    path_helper = init.paths
+    if not args.local:
+        sys.stderr.write("%s\n" % (netinfo.debug_info()))
+        LOG.debug(("Checking to see if files that we need already"
+                   " exist from a previous run that would allow us"
+                   " to stop early."))
+        stop_files = [
+            os.path.join(path_helper.get_cpath("data"), "no-net"),
+            path_helper.get_ipath_cur("obj_pkl"),
+        ]
+        existing_files = []
+        for fn in stop_files:
+            try:
+                c = util.load_file(fn)
+                if len(c):
+                    existing_files.append((fn, len(c)))
+            except Exception:
+                pass
+        if existing_files:
+            LOG.debug("Exiting early due to the existence of %s files",
+                      existing_files)
+            return 0
+    else:
+        # The cache is not instance specific, so it has to be purged
+        # but we want 'start' to benefit from a cache if
+        # a previous start-local populated one...
+        manual_clean = util.get_cfg_option_bool(init.cfg,
+                                                'manual_cache_clean', False)
+        if manual_clean:
+            LOG.debug("Not purging instance link, manual cleaning enabled")
+            init.purge_cache(False)
+        else:
+            init.purge_cache()
+        # Delete the non-net file as well
+        util.del_file(os.path.join(path_helper.get_cpath("data"), "no-net"))
+    # Stage 5
+    try:
+        init.fetch()
+    except sources.DataSourceNotFoundException:
+        util.logexc(LOG, "No instance datasource found!")
+        # TODO: Return 0 or 1??
+        return 1
+    # Stage 6
+    iid = init.instancify()
+    LOG.debug("%s will now be targeting instance id: %s", name, iid)
+    init.update()
+    # Stage 7
+    try:
+        (ran, _results) = init.cloudify().run('consume_userdata',
+                                             init.consume,
+                                             args=[settings.PER_INSTANCE],
+                                             freq=settings.PER_INSTANCE)
+        if not ran:
+            # Just consume anything that is set to run per
+            # always if nothing ran in the per instance section
+            init.consume(settings.PER_ALWAYS)
+    except Exception:
+        util.logexc(LOG, "Consuming user data failed!")
+        return 1
+    # Stage 8 - TODO - do we really need to re-extract our configs?
+    tr = stages.Transforms(init, extract_fns(args))
+    # Stage 9 - TODO is this really needed??
     try:
         outfmt_orig = outfmt
         errfmt_orig = errfmt
-        (outfmt, errfmt) = CC.get_output_cfg(cc.cfg, "init")
+        (outfmt, errfmt) = util.get_output_cfg(tr.cfg, name)
         if outfmt_orig != outfmt or errfmt_orig != errfmt:
-            warn("stdout, stderr changing to (%s,%s)" % (outfmt, errfmt))
-            CC.redirect_output(outfmt, errfmt)
-    except Exception as e:
-        warn("Failed to get and set output config: %s\n" % e)
+            LOG.warn("Stdout, stderr changing to (%s, %s)", outfmt, errfmt)
+            (outfmt, errfmt) = util.fixup_output(tr.cfg, name)
+    except:
+        util.logexc(LOG, "Failed to re-adjust output redirection!")
+    # Stage 10
+    return run_transform_section(tr, name, name)
 
-    # send the cloud-config ready event
-    cc_path = cloudinit.get_ipath_cur('cloud_config')
-    cc_ready = cc.cfg.get("cc_ready_cmd",
-        ['initctl', 'emit', 'cloud-config',
-         '%s=%s' % (cloudinit.cfg_env_name, cc_path)])
-    if cc_ready:
-        if isinstance(cc_ready, str):
-            cc_ready = ['sh', '-c', cc_ready]
-        subprocess.Popen(cc_ready).communicate()
 
-    module_list = CC.read_cc_modules(cc.cfg, "cloud_init_modules")
+def main_transform(action_name, args):
+    name = args.mode
+    # Cloud-init transform stages are broken up into the following sub-stages
+    # 1. Ensure that the init object fetches its config without errors
+    # 2. Get the datasource from the init object, if it does
+    #    not exist then that means the main_init stage never
+    #    worked, and thus this stage can not run.
+    # 3. Construct the transform object
+    # 4. Adjust any subsequent logging/output redirections using
+    #    the transform objects configuration
+    # 5. Run the transforms for the given stage name
+    # 6. Done!
+    welcome("%s:%s" % (action_name, name))
+    init = stages.Init(ds_deps=[])
+    # Stage 1
+    init.read_cfg(extract_fns(args))
+    # Stage 2
+    try:
+        init.fetch()
+    except sources.DataSourceNotFoundException:
+        # There was no datasource found, theres nothing to do
+        util.logexc(LOG, 'Can not apply stage %s, no datasource found!', name)
+        return 1
+    # Stage 3
+    tr_cfgs = extract_fns(args)
+    cc_cfg = init.paths.get_ipath_cur('cloud_config')
+    if settings.CFG_ENV_NAME in os.environ:
+        cc_cfg = os.environ[settings.CFG_ENV_NAME]
+    if cc_cfg and os.path.exists(cc_cfg):
+        tr_cfgs.append(cc_cfg)
+    tr = stages.Transforms(init, tr_cfgs)
+    # Stage 4
+    try:
+        LOG.debug("Closing stdin")
+        util.close_stdin()
+        util.fixup_output(tr.cfg, name)
+    except:
+        util.logexc(LOG, "Failed to setup output redirection!")
+    if args.debug:
+        # Reset so that all the debug handlers are closed out
+        LOG.debug(("Logging being reset, this logger may no"
+                    " longer be active shortly"))
+        logging.resetLogging()
+    logging.setupLogging(tr.cfg)
+    # Stage 5
+    return run_transform_section(tr, name, name)
 
-    failures = []
-    if len(module_list):
-        failures = CC.run_cc_modules(cc, module_list, log)
+
+def main_query(name, _args):
+    raise NotImplementedError("Action '%s' is not currently implemented" % (name))
+
+
+def main_single(name, args):
+    # Cloud-init single stage is broken up into the following sub-stages
+    # 1. Ensure that the init object fetches its config without errors
+    # 2. Check to see if we can find the transform name
+    #    in the 'init', 'final', 'config' stages, if not bail
+    # 3. Get the datasource from the init object, if it does
+    #    not exist then that means the main_init stage never
+    #    worked, and thus this stage can not run.
+    # 4. Construct the transform object
+    # 5. Adjust any subsequent logging/output redirections using
+    #    the transform objects configuration
+    # 6. Run the single transform
+    # 7. Done!
+    tr_name = args.name
+    welcome("%s:%s" % (name, tr_name))
+    init = stages.Init(ds_deps=[])
+    # Stage 1
+    init.read_cfg(extract_fns(args))
+    tr = stages.Transforms(init, extract_fns(args))
+    where_look_mp = {
+        TR_TPL % ('init'): 'init',
+        TR_TPL % ('config'): 'config',
+        TR_TPL % ('final'): 'final',
+    }
+    where_look = list(where_look_mp.keys())
+    found_at = tr.find_transform(tr_name, where_look)
+    if not found_at:
+        msg = ("No known transform named %s "
+              "in sections (%s)") % (tr_name, ", ".join(where_look))
+        LOG.warn(msg)
+        return 1
     else:
-        msg = "no cloud_init_modules to run"
-        sys.stderr.write(msg + "\n")
-        log.debug(msg)
-        sys.exit(0)
+        LOG.debug("Found transform %s in sections: %s",
+                  tr_name, found_at)
+        sect_name = found_at[0]
+        LOG.debug("Selecting section %s as its 'source' section.", sect_name)
+        tr_args = args.transform_args
+        if tr_args:
+            LOG.debug("Using passed in arguments %s", tr_args)
+        tr_freq = args.frequency
+        if tr_freq:
+            LOG.debug("Using passed in frequency %s", tr_freq)
+        try:
+            LOG.debug("Closing stdin")
+            util.close_stdin()
+            # This seems to use the short name, instead of the long name
+            util.fixup_output(tr.cfg, where_look_mp.get(sect_name))
+        except:
+            util.logexc(LOG, "Failed to setup output redirection!")
+        if args.debug:
+            # Reset so that all the debug handlers are closed out
+            LOG.debug(("Logging being reset, this logger may no"
+                       " longer be active shortly"))
+            logging.resetLogging()
+        logging.setupLogging(tr.cfg)
+        (_run_am, failures) = tr.run_single(tr_name, sect_name,
+                                            tr_args, tr_freq)
+        if failures:
+            LOG.debug("Ran %s but it failed", tr_name)
+            return 1
+        else:
+            return 0
+
+
+def main():
+    parser = argparse.ArgumentParser()
+    
+    # Top level args
+    parser.add_argument('--version', '-v', action='version', 
+                        version='%(prog)s ' + (version.version_string()))
+    parser.add_argument('--file', '-f', action='append', 
+                        dest='files',
+                        help=('additional yaml configuration'
+                              ' files to use'),
+                        type=argparse.FileType('rb'))
+    parser.add_argument('--debug', '-d', action='store_true',
+                        help=('show additional pre-action'
+                              ' logging (default: %(default)s)'),
+                        default=False)
+    subparsers = parser.add_subparsers()
+
+    # Each action and its sub-options (if any)
+    parser_init = subparsers.add_parser('init', 
+                                        help=('initializes cloud-init and'
+                                              ' performs initial transforms'))
+    parser_init.add_argument("--local", '-l', action='store_true',
+                             help="start in local mode (default: %(default)s)",
+                             default=False)
+    # This is used so that we can know which action is selected + 
+    # the functor to use to run this subcommand
+    parser_init.set_defaults(action=('init', main_init))
+
+    # These settings are used for the 'config' and 'final' stages
+    parser_tr = subparsers.add_parser('transform', 
+                                      help=('performs transforms '
+                                            'using a given configuration key'))
+    parser_tr.add_argument("--mode", '-m', action='store',
+                             help=("transform configuration name "
+                                    "to use (default: %(default)s)"),
+                             default='config',
+                             choices=('config', 'final'))
+    parser_tr.set_defaults(action=('transform', main_transform))
+
+    # These settings are used when you want to query information
+    # stored in the cloud-init data objects/directories/files
+    parser_query = subparsers.add_parser('query', 
+                                         help=('query information stored '
+                                               'in cloud-init'))
+    parser_query.add_argument("--name", '-n', action="store",
+                              help="item name to query on",
+                              required=True,
+                              choices=QUERY_DATA_TYPES)
+    parser_query.set_defaults(action=('query', main_query))
+
+    # This subcommand allows you to run a single transform
+    parser_single = subparsers.add_parser('single', 
+                                         help=('run a single transform '))
+    parser_single.set_defaults(action=('single', main_single))
+    parser_single.add_argument("--name", '-n', action="store",
+                              help="transform name to run",
+                              required=True)
+    parser_single.add_argument("--frequency", action="store",
+                              help=("frequency of "
+                                    " the transform (default: %(default)s)"),
+                              required=False,
+                              default=settings.PER_ALWAYS,
+                              choices=settings.FREQUENCIES)
+    parser_single.add_argument("transform_args", nargs="*",
+                              metavar='argument',
+                              help=('any additional arguments to'
+                                    ' pass to this transform'))
+    parser_single.set_defaults(action=('single', main_single))
+
+
+    args = parser.parse_args()
+
+    # Setup basic logging to start (until reinitialized)
+    if args.debug:
+        logging.setupBasicLogging()
+
+    (name, functor) = args.action
+    return functor(name, args)
 
-    sys.exit(len(failures))
 
 if __name__ == '__main__':
-    main()
+    sys.exit(main())
+
diff --git a/bin/cloud-init2.py b/bin/cloud-init2.py
deleted file mode 100755
index 135e4114..00000000
--- a/bin/cloud-init2.py
+++ /dev/null
@@ -1,421 +0,0 @@
-#!/usr/bin/python
-# vi: ts=4 expandtab
-#
-#    Copyright (C) 2012 Canonical Ltd.
-#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
-#    Copyright (C) 2012 Yahoo! Inc.
-#
-#    Author: Scott Moser <scott.moser@canonical.com>
-#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
-#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
-#
-#    This program is free software: you can redistribute it and/or modify
-#    it under the terms of the GNU General Public License version 3, as
-#    published by the Free Software Foundation.
-#
-#    This program is distributed in the hope that it will be useful,
-#    but WITHOUT ANY WARRANTY; without even the implied warranty of
-#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-#    GNU General Public License for more details.
-#
-#    You should have received a copy of the GNU General Public License
-#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-import argparse
-import os
-import sys
-
-# This is more just for running from the bin folder
-possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
-        sys.argv[0]), os.pardir, os.pardir))
-if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
-    sys.path.insert(0, possible_topdir)
-
-from cloudinit import log as logging
-from cloudinit import netinfo
-from cloudinit import settings
-from cloudinit import sources
-from cloudinit import stages
-from cloudinit import templater
-from cloudinit import util
-from cloudinit import version
-
-
-# Transform section template
-TR_TPL = "cloud_%s_modules"
-
-# Things u can query on
-QUERY_DATA_TYPES = [
-    'data',
-    'data_raw',
-    'instance_id',
-]
-
-LOG = logging.getLogger()
-
-
-def welcome(action):
-    msg = ("Cloud-init v. {{version}} running '{{action}}' at "
-           "{{timestamp}}. Up {{uptime}} seconds.")
-    tpl_params = {
-        'version': version.version_string(),
-        'uptime': util.uptime(),
-        'timestamp': util.time_rfc2822(),
-        'action': action,
-    }
-    welcome_msg = "%s" % (templater.render_string(msg, tpl_params))
-    sys.stderr.write("%s\n" % (welcome_msg))
-    sys.stderr.flush()
-    LOG.info(welcome_msg)
-
-
-def extract_fns(args):
-    # Files are already opened so lets just pass that along
-    # since it would of broke if it couldn't have
-    # read that file already...
-    fn_cfgs = []
-    if args.files:
-        for fh in args.files:
-            # The realpath is more useful in logging
-            # so lets resolve to that...
-            fn_cfgs.append(os.path.realpath(fh.name))
-    return fn_cfgs
-
-
-def run_transform_section(tr, action_name, section):
-    full_section_name = TR_TPL % (section)
-    (ran_am, failures) = tr.run_section(full_section_name)
-    if not ran_am:
-        msg = ("No '%s' transforms to run"
-               " under section '%s'") % (action_name, full_section_name)
-        sys.stderr.write("%s\n" % (msg))
-        LOG.debug(msg)
-        return 0
-    else:
-        LOG.debug("Ran %s transforms with %s failures", ran_am, len(failures))
-        return len(failures)
-
-
-def main_init(name, args):
-    deps = [sources.DEP_FILESYSTEM, sources.DEP_NETWORK]
-    if args.local:
-        deps = [sources.DEP_FILESYSTEM]
-
-    if not args.local:
-        # TODO: What is this for??
-        root_name = "%s.d" % (settings.CLOUD_CONFIG)
-        target_fn = os.path.join(root_name, "91_kernel_cmdline_url.cfg")
-        util.read_write_cmdline_url(target_fn)
-
-    # Cloud-init 'init' stage is broken up into the following sub-stages
-    # 1. Ensure that the init object fetches its config without errors
-    # 2. Setup logging/output redirections with resultant config (if any)
-    # 3. Initialize the cloud-init filesystem
-    # 4. Check if we can stop early by looking for various files
-    # 5. Fetch the datasource
-    # 6. Connect to the current instance location + update the cache
-    # 7. Consume the userdata (handlers get activated here)
-    # 8. Construct the transform object
-    # 9. Adjust any subsequent logging/output redirections using
-    #    the transform objects configuration
-    # 10. Run the transforms for the 'init' stage
-    # 11. Done!
-    welcome(name)
-    init = stages.Init(deps)
-    # Stage 1
-    init.read_cfg(extract_fns(args))
-    # Stage 2
-    outfmt = None
-    errfmt = None
-    try:
-        LOG.debug("Closing stdin")
-        util.close_stdin()
-        (outfmt, errfmt) = util.fixup_output(init.cfg, name)
-    except:
-        util.logexc(LOG, "Failed to setup output redirection!")
-    if args.debug:
-        # Reset so that all the debug handlers are closed out
-        LOG.debug(("Logging being reset, this logger may no"
-                    " longer be active shortly"))
-        logging.resetLogging()
-    logging.setupLogging(init.cfg)
-    # Stage 3
-    try:
-        init.initialize()
-    except Exception:
-        util.logexc(LOG, "Failed to initialize, likely bad things to come!")
-    # Stage 4
-    path_helper = init.paths
-    if not args.local:
-        sys.stderr.write("%s\n" % (netinfo.debug_info()))
-        LOG.debug(("Checking to see if files that we need already"
-                   " exist from a previous run that would allow us"
-                   " to stop early."))
-        stop_files = [
-            os.path.join(path_helper.get_cpath("data"), "no-net"),
-            path_helper.get_ipath_cur("obj_pkl"),
-        ]
-        existing_files = []
-        for fn in stop_files:
-            try:
-                c = util.load_file(fn)
-                if len(c):
-                    existing_files.append((fn, len(c)))
-            except Exception:
-                pass
-        if existing_files:
-            LOG.debug("Exiting early due to the existence of %s files",
-                      existing_files)
-            return 0
-    else:
-        # The cache is not instance specific, so it has to be purged
-        # but we want 'start' to benefit from a cache if
-        # a previous start-local populated one...
-        manual_clean = util.get_cfg_option_bool(init.cfg,
-                                                'manual_cache_clean', False)
-        if manual_clean:
-            LOG.debug("Not purging instance link, manual cleaning enabled")
-            init.purge_cache(False)
-        else:
-            init.purge_cache()
-        # Delete the non-net file as well
-        util.del_file(os.path.join(path_helper.get_cpath("data"), "no-net"))
-    # Stage 5
-    try:
-        init.fetch()
-    except sources.DataSourceNotFoundException:
-        util.logexc(LOG, "No instance datasource found!")
-        # TODO: Return 0 or 1??
-        return 1
-    # Stage 6
-    iid = init.instancify()
-    LOG.debug("%s will now be targeting instance id: %s", name, iid)
-    init.update()
-    # Stage 7
-    try:
-        (ran, _results) = init.cloudify().run('consume_userdata',
-                                             init.consume,
-                                             args=[settings.PER_INSTANCE],
-                                             freq=settings.PER_INSTANCE)
-        if not ran:
-            # Just consume anything that is set to run per
-            # always if nothing ran in the per instance section
-            init.consume(settings.PER_ALWAYS)
-    except Exception:
-        util.logexc(LOG, "Consuming user data failed!")
-        return 1
-    # Stage 8 - TODO - do we really need to re-extract our configs?
-    tr = stages.Transforms(init, extract_fns(args))
-    # Stage 9 - TODO is this really needed??
-    try:
-        outfmt_orig = outfmt
-        errfmt_orig = errfmt
-        (outfmt, errfmt) = util.get_output_cfg(tr.cfg, name)
-        if outfmt_orig != outfmt or errfmt_orig != errfmt:
-            LOG.warn("Stdout, stderr changing to (%s, %s)", outfmt, errfmt)
-            (outfmt, errfmt) = util.fixup_output(tr.cfg, name)
-    except:
-        util.logexc(LOG, "Failed to re-adjust output redirection!")
-    # Stage 10
-    return run_transform_section(tr, name, name)
-
-
-def main_transform(action_name, args):
-    name = args.mode
-    # Cloud-init transform stages are broken up into the following sub-stages
-    # 1. Ensure that the init object fetches its config without errors
-    # 2. Get the datasource from the init object, if it does
-    #    not exist then that means the main_init stage never
-    #    worked, and thus this stage can not run.
-    # 3. Construct the transform object
-    # 4. Adjust any subsequent logging/output redirections using
-    #    the transform objects configuration
-    # 5. Run the transforms for the given stage name
-    # 6. Done!
-    welcome("%s:%s" % (action_name, name))
-    init = stages.Init(ds_deps=[])
-    # Stage 1
-    init.read_cfg(extract_fns(args))
-    # Stage 2
-    try:
-        init.fetch()
-    except sources.DataSourceNotFoundException:
-        # There was no datasource found, theres nothing to do
-        util.logexc(LOG, 'Can not apply stage %s, no datasource found!', name)
-        return 1
-    # Stage 3
-    tr_cfgs = extract_fns(args)
-    cc_cfg = init.paths.get_ipath_cur('cloud_config')
-    if settings.CFG_ENV_NAME in os.environ:
-        cc_cfg = os.environ[settings.CFG_ENV_NAME]
-    if cc_cfg and os.path.exists(cc_cfg):
-        tr_cfgs.append(cc_cfg)
-    tr = stages.Transforms(init, tr_cfgs)
-    # Stage 4
-    try:
-        LOG.debug("Closing stdin")
-        util.close_stdin()
-        util.fixup_output(tr.cfg, name)
-    except:
-        util.logexc(LOG, "Failed to setup output redirection!")
-    if args.debug:
-        # Reset so that all the debug handlers are closed out
-        LOG.debug(("Logging being reset, this logger may no"
-                    " longer be active shortly"))
-        logging.resetLogging()
-    logging.setupLogging(tr.cfg)
-    # Stage 5
-    return run_transform_section(tr, name, name)
-
-
-def main_query(_name, _args):
-    pass
-
-
-def main_single(name, args):
-    # Cloud-init single stage is broken up into the following sub-stages
-    # 1. Ensure that the init object fetches its config without errors
-    # 2. Check to see if we can find the transform name
-    #    in the 'init', 'final', 'config' stages, if not bail
-    # 3. Get the datasource from the init object, if it does
-    #    not exist then that means the main_init stage never
-    #    worked, and thus this stage can not run.
-    # 4. Construct the transform object
-    # 5. Adjust any subsequent logging/output redirections using
-    #    the transform objects configuration
-    # 6. Run the single transform
-    # 7. Done!
-    tr_name = args.name
-    welcome("%s:%s" % (name, tr_name))
-    init = stages.Init(ds_deps=[])
-    # Stage 1
-    init.read_cfg(extract_fns(args))
-    tr = stages.Transforms(init, extract_fns(args))
-    where_look_mp = {
-        TR_TPL % ('init'): 'init',
-        TR_TPL % ('config'): 'config',
-        TR_TPL % ('final'): 'final',
-    }
-    where_look = list(where_look_mp.keys())
-    found_at = tr.find_transform(tr_name, where_look)
-    if not found_at:
-        msg = ("No known transform named %s "
-              "in sections (%s)") % (tr_name, ", ".join(where_look))
-        LOG.warn(msg)
-        return 1
-    else:
-        LOG.debug("Found transform %s in sections: %s",
-                  tr_name, found_at)
-        sect_name = found_at[0]
-        LOG.debug("Selecting section %s as its 'source' section.", sect_name)
-        tr_args = args.transform_args
-        if tr_args:
-            LOG.debug("Using passed in arguments %s", tr_args)
-        tr_freq = args.frequency
-        if tr_freq:
-            LOG.debug("Using passed in frequency %s", tr_freq)
-        try:
-            LOG.debug("Closing stdin")
-            util.close_stdin()
-            # This seems to use the short name, instead of the long name
-            util.fixup_output(tr.cfg, where_look_mp.get(sect_name))
-        except:
-            util.logexc(LOG, "Failed to setup output redirection!")
-        if args.debug:
-            # Reset so that all the debug handlers are closed out
-            LOG.debug(("Logging being reset, this logger may no"
-                       " longer be active shortly"))
-            logging.resetLogging()
-        logging.setupLogging(tr.cfg)
-        (_run_am, failures) = tr.run_single(tr_name, sect_name,
-                                            tr_args, tr_freq)
-        if failures:
-            LOG.debug("Ran %s but it failed", tr_name)
-            return 1
-        else:
-            return 0
-
-
-def main():
-    parser = argparse.ArgumentParser()
-    
-    # Top level args
-    parser.add_argument('--version', '-v', action='version', 
-                        version='%(prog)s ' + (version.version_string()))
-    parser.add_argument('--file', '-f', action='append', 
-                        dest='files',
-                        help=('additional yaml configuration'
-                              ' files to use'),
-                        type=argparse.FileType('rb'))
-    parser.add_argument('--debug', '-d', action='store_true',
-                        help=('show additional pre-action'
-                              ' logging (default: %(default)s)'),
-                        default=False)
-    subparsers = parser.add_subparsers()
-
-    # Each action and its sub-options (if any)
-    parser_init = subparsers.add_parser('init', 
-                                        help=('initializes cloud-init and'
-                                              ' performs initial transforms'))
-    parser_init.add_argument("--local", '-l', action='store_true',
-                             help="start in local mode (default: %(default)s)",
-                             default=False)
-    # This is used so that we can know which action is selected + 
-    # the functor to use to run this subcommand
-    parser_init.set_defaults(action=('init', main_init))
-
-    # These settings are used for the 'config' and 'final' stages
-    parser_tr = subparsers.add_parser('transform', 
-                                      help=('performs transforms '
-                                            'using a given configuration key'))
-    parser_tr.add_argument("--mode", '-m', action='store',
-                             help=("transform configuration name "
-                                    "to use (default: %(default)s)"),
-                             default='config',
-                             choices=('config', 'final'))
-    parser_tr.set_defaults(action=('transform', main_transform))
-
-    # These settings are used when you want to query information
-    # stored in the cloud-init data objects/directories/files
-    parser_query = subparsers.add_parser('query', 
-                                         help=('query information stored '
-                                               'in cloud-init'))
-    parser_query.add_argument("--name", '-n', action="store",
-                              help="item name to query on",
-                              required=True,
-                              choices=QUERY_DATA_TYPES)
-    parser_query.set_defaults(action=('query', main_query))
-
-    # This subcommand allows you to run a single transform
-    parser_single = subparsers.add_parser('single', 
-                                         help=('run a single transform '))
-    parser_single.set_defaults(action=('single', main_single))
-    parser_single.add_argument("--name", '-n', action="store",
-                              help="transform name to run",
-                              required=True)
-    parser_single.add_argument("--frequency", action="store",
-                              help=("frequency of "
-                                    " the transform (default: %(default)s)"),
-                              required=False,
-                              default=settings.PER_ALWAYS,
-                              choices=settings.FREQUENCIES)
-    parser_single.add_argument("transform_args", nargs="*",
-                              metavar='argument',
-                              help=('any additional arguments to'
-                                    ' pass to this transform'))
-    parser_single.set_defaults(action=('single', main_single))
-
-
-    args = parser.parse_args()
-
-    # Setup basic logging to start (until reinitialized)
-    if args.debug:
-        logging.setupBasicLogging()
-
-    (name, functor) = args.action
-    return functor(name, args)
-
-
-if __name__ == '__main__':
-    sys.exit(main())
-

From a21fead263f04957e1c91496531a08f7f737f5de Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 12:12:53 -0700
Subject: [PATCH 248/434] Add message about query not being implemented yet.

---
 bin/cloud-init.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/bin/cloud-init.py b/bin/cloud-init.py
index 99ecdaf9..8fb3a740 100755
--- a/bin/cloud-init.py
+++ b/bin/cloud-init.py
@@ -269,7 +269,8 @@ def main_transform(action_name, args):
 
 
 def main_query(name, _args):
-    raise NotImplementedError("Action '%s' is not currently implemented" % (name))
+    raise NotImplementedError(("Action '%s' is not"
+                               " currently implemented") % (name))
 
 
 def main_single(name, args):

From f4fa291248b842363d6d34e279145bc8f07ac60c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 12:13:14 -0700
Subject: [PATCH 249/434] Add the ability to only fetch a local datasource
 instead of also trying to fetch an official datasource from an external
 source.

---
 cloudinit/stages.py | 19 ++++++++++---------
 1 file changed, 10 insertions(+), 9 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index f39b6532..334d5004 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -209,13 +209,13 @@ class Init(object):
         cfg_list = self.cfg.get('datasource_list') or []
         return (cfg_list, pkg_list)
 
-    def _get_data_source(self):
+    def _get_data_source(self, local_only=False):
         if self.datasource:
             return self.datasource
         ds = self._restore_from_cache()
         if ds:
-            LOG.debug("Restored from cache datasource: %s" % ds)
-        else:
+            LOG.debug("Restored from cache, datasource: %s", ds)
+        if not ds and not local_only:
             (cfg_list, pkg_list) = self._get_datasources()
             # Deep copy so that user-data handlers can not modify
             # (which will affect user-data handlers down the line...)
@@ -225,10 +225,11 @@ class Init(object):
                                                self.paths,
                                                ds_deps, cfg_list, pkg_list)
             LOG.debug("Loaded datasource %s - %s", dsname, ds)
-        self.datasource = ds
-        # Ensure we adjust our path members datasource
-        # now that we have one (thus allowing ipath to be used)
-        self.paths.datasource = ds
+        if ds:
+            self.datasource = ds
+            # Ensure we adjust our path members datasource
+            # now that we have one (thus allowing ipath to be used)
+            self.paths.datasource = ds
         return ds
 
     def _reflect_cur_instance(self):
@@ -276,8 +277,8 @@ class Init(object):
                         "%s\n" % (previous_iid))
         return iid
 
-    def fetch(self):
-        return self._get_data_source()
+    def fetch(self, local_only=False):
+        return self._get_data_source(local_only)
 
     def instancify(self):
         return self._reflect_cur_instance()

From e928d74318671a62de3fb6a513b4a719f44ccf72 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 12:22:43 -0700
Subject: [PATCH 250/434] Remove the .py extension for this new main program
 binary.

---
 bin/{cloud-init.py => cloud-init} | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 rename bin/{cloud-init.py => cloud-init} (100%)

diff --git a/bin/cloud-init.py b/bin/cloud-init
similarity index 100%
rename from bin/cloud-init.py
rename to bin/cloud-init

From d221d29fb214f831536d696231a756d7812432e2 Mon Sep 17 00:00:00 2001
From: Scott Moser <smoser@ubuntu.com>
Date: Wed, 20 Jun 2012 16:24:24 -0400
Subject: [PATCH 251/434] update tools/bddeb and debian.trunk packaging

 * debian.trunk/changelog: increase debian version to '1' to avoid lintian
   error
 * debian.trunk/control: bump standards version
 * debian.trunk/rules: remove cloud-init-run-module symlink (been deprecated
   for some time)
 * tools/bddeb: read version from ChangeLog rather than setup.py
---
 debian.trunk/changelog | 2 +-
 debian.trunk/control   | 2 +-
 debian.trunk/rules     | 1 -
 setup.py               | 3 +--
 tools/bddeb            | 6 +++---
 5 files changed, 6 insertions(+), 8 deletions(-)

diff --git a/debian.trunk/changelog b/debian.trunk/changelog
index 53e3678c..a36d00d6 100644
--- a/debian.trunk/changelog
+++ b/debian.trunk/changelog
@@ -1,4 +1,4 @@
-cloud-init (VERSION~REVNO-0) UNRELEASED; urgency=low
+cloud-init (VERSION~REVNO-1) UNRELEASED; urgency=low
 
   * build
 
diff --git a/debian.trunk/control b/debian.trunk/control
index f2eec1e4..f0dcef6a 100644
--- a/debian.trunk/control
+++ b/debian.trunk/control
@@ -10,7 +10,7 @@ Build-Depends: cdbs,
                pylint,
                python-mocker,
 XS-Python-Version: all
-Standards-Version: 3.9.1
+Standards-Version: 3.9.3
 
 Package: cloud-init
 Architecture: all
diff --git a/debian.trunk/rules b/debian.trunk/rules
index 19384687..0f79136c 100755
--- a/debian.trunk/rules
+++ b/debian.trunk/rules
@@ -13,7 +13,6 @@ cloud-init-fixups:
 	for x in $(DEB_DESTDIR)/usr/bin/*.py; do mv "$$x" "$${x%.py}"; done
 	install -d $(DEB_DESTDIR)/etc/rsyslog.d
 	cp tools/21-cloudinit.conf $(DEB_DESTDIR)/etc/rsyslog.d/21-cloudinit.conf
-	ln -sf cloud-init-per $(DEB_DESTDIR)/usr/bin/cloud-init-run-module
 
 # You only need to run this immediately after checking out the package from
 # revision control.
diff --git a/setup.py b/setup.py
index 96f889d8..9ee58b9a 100755
--- a/setup.py
+++ b/setup.py
@@ -70,8 +70,7 @@ setup(name='cloud-init',
       author_email='scott.moser@canonical.com',
       url='http://launchpad.net/cloud-init/',
       packages=find_packages(),
-      scripts=['bin/cloud-init.py',
-               'bin/cloud-init-cfg.py',
+      scripts=['bin/cloud-init',
                'tools/cloud-init-per',
                ],
       data_files=[('/etc/cloud', glob('config/*.cfg')),
diff --git a/tools/bddeb b/tools/bddeb
index 598f71bb..b162b06f 100755
--- a/tools/bddeb
+++ b/tools/bddeb
@@ -8,8 +8,8 @@ set -e
 trap "rm -Rf '${TEMP_D}'" exit
 files=$(bzr ls --versioned)
 revno=$(bzr revno)
-version=$(awk \
-  -F= '$1 ~ /version$/ { gsub("[^0-9.]","",$2); print $2; }' setup.py)
+version=$(awk -F: \
+   '$1 ~ /[0-9][.][0-9]+[.][0-9]+/ { print $1 ; exit(0); }' ChangeLog )
 mkdir "${TEMP_D}/cloud-init"
 otar="$TEMP_D/cloud-init_$version~bzr${revno}.orig.tar.gz"
 tar -czf - ${files} > "$otar"
@@ -25,7 +25,7 @@ debuild "$@"
 #for x in ../*.deb; do
 #   echo wrote ${x##*/}
 #done
-debname="cloud-init_${version}~bzr${revno}-0_all.deb"
+debname="cloud-init_${version}~bzr${revno}-1_all.deb"
 mv "../$debname" "$start"
 link="$start/cloud-init_all.deb"
 echo "wrote $debname"

From 6a3633b4be07079a9ba9a4bdbe9c69aac755b0a3 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:06:24 -0700
Subject: [PATCH 252/434] Add in the new binary to be used in files found.

---
 Makefile | 1 +
 1 file changed, 1 insertion(+)

diff --git a/Makefile b/Makefile
index 683475fd..82c5dedb 100644
--- a/Makefile
+++ b/Makefile
@@ -1,5 +1,6 @@
 CWD=$(shell pwd)
 PY_FILES=$(shell find cloudinit bin -name "*.py")
+PY_FILES+="bin/cloud-init"
 
 all: test
 

From 844dcdb4c4177962db2827b3fec75cdebfa8ee36 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:30:30 -0700
Subject: [PATCH 253/434] 1. Use the name modules where transforms was used 2.
 Reflect the move back to config 'modules' in the other cli options 3. Have
 the single mode not need to lookup the module but use the general import path

---
 bin/cloud-init | 180 +++++++++++++++++++++++--------------------------
 1 file changed, 84 insertions(+), 96 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index 8fb3a740..032d5f39 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -25,12 +25,19 @@ import argparse
 import os
 import sys
 
-# This is more just for running from the bin folder
+# This is more just for running from the bin folder so that
+# cloud-init binary can find the cloudinit module
 possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
         sys.argv[0]), os.pardir, os.pardir))
 if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
     sys.path.insert(0, possible_topdir)
 
+# This is so config modules can be found
+if os.path.exists(os.path.join(possible_topdir,
+                 "cloudinit", 'config', "__init__.py")):
+    sys.path.insert(0, os.path.join(possible_topdir, 'cloudinit', 'config'))
+
+
 from cloudinit import log as logging
 from cloudinit import netinfo
 from cloudinit import settings
@@ -41,8 +48,8 @@ from cloudinit import util
 from cloudinit import version
 
 
-# Transform section template
-TR_TPL = "cloud_%s_modules"
+# Module section template
+MOD_SECTION_TPL = "cloud_%s_modules"
 
 # Things u can query on
 QUERY_DATA_TYPES = [
@@ -68,7 +75,6 @@ def welcome(action):
     sys.stderr.flush()
     LOG.info(welcome_msg)
 
-
 def extract_fns(args):
     # Files are already opened so lets just pass that along
     # since it would of broke if it couldn't have
@@ -82,17 +88,17 @@ def extract_fns(args):
     return fn_cfgs
 
 
-def run_transform_section(tr, action_name, section):
-    full_section_name = TR_TPL % (section)
-    (ran_am, failures) = tr.run_section(full_section_name)
+def run_module_section(mods, action_name, section):
+    full_section_name = MOD_SECTION_TPL % (section)
+    (ran_am, failures) = mods.run_section(full_section_name)
     if not ran_am:
-        msg = ("No '%s' transforms to run"
+        msg = ("No '%s' modules to run"
                " under section '%s'") % (action_name, full_section_name)
         sys.stderr.write("%s\n" % (msg))
         LOG.debug(msg)
         return 0
     else:
-        LOG.debug("Ran %s transforms with %s failures", ran_am, len(failures))
+        LOG.debug("Ran %s modules with %s failures", ran_am, len(failures))
         return len(failures)
 
 
@@ -115,10 +121,10 @@ def main_init(name, args):
     # 5. Fetch the datasource
     # 6. Connect to the current instance location + update the cache
     # 7. Consume the userdata (handlers get activated here)
-    # 8. Construct the transform object
+    # 8. Construct the modules object
     # 9. Adjust any subsequent logging/output redirections using
-    #    the transform objects configuration
-    # 10. Run the transforms for the 'init' stage
+    #    the modules objects configuration
+    # 10. Run the modules for the 'init' stage
     # 11. Done!
     welcome(name)
     init = stages.Init(deps)
@@ -205,32 +211,32 @@ def main_init(name, args):
         util.logexc(LOG, "Consuming user data failed!")
         return 1
     # Stage 8 - TODO - do we really need to re-extract our configs?
-    tr = stages.Transforms(init, extract_fns(args))
+    mods = stages.Modules(init, extract_fns(args))
     # Stage 9 - TODO is this really needed??
     try:
         outfmt_orig = outfmt
         errfmt_orig = errfmt
-        (outfmt, errfmt) = util.get_output_cfg(tr.cfg, name)
+        (outfmt, errfmt) = util.get_output_cfg(mods.cfg, name)
         if outfmt_orig != outfmt or errfmt_orig != errfmt:
             LOG.warn("Stdout, stderr changing to (%s, %s)", outfmt, errfmt)
-            (outfmt, errfmt) = util.fixup_output(tr.cfg, name)
+            (outfmt, errfmt) = util.fixup_output(mods.cfg, name)
     except:
         util.logexc(LOG, "Failed to re-adjust output redirection!")
     # Stage 10
-    return run_transform_section(tr, name, name)
+    return run_module_section(mods, name, name)
 
 
-def main_transform(action_name, args):
+def main_modules(action_name, args):
     name = args.mode
-    # Cloud-init transform stages are broken up into the following sub-stages
+    # Cloud-init 'modules' stages are broken up into the following sub-stages
     # 1. Ensure that the init object fetches its config without errors
     # 2. Get the datasource from the init object, if it does
     #    not exist then that means the main_init stage never
     #    worked, and thus this stage can not run.
-    # 3. Construct the transform object
+    # 3. Construct the modules object
     # 4. Adjust any subsequent logging/output redirections using
-    #    the transform objects configuration
-    # 5. Run the transforms for the given stage name
+    #    the modules objects configuration
+    # 5. Run the modules for the given stage name
     # 6. Done!
     welcome("%s:%s" % (action_name, name))
     init = stages.Init(ds_deps=[])
@@ -244,18 +250,18 @@ def main_transform(action_name, args):
         util.logexc(LOG, 'Can not apply stage %s, no datasource found!', name)
         return 1
     # Stage 3
-    tr_cfgs = extract_fns(args)
+    mod_cfgs = extract_fns(args)
     cc_cfg = init.paths.get_ipath_cur('cloud_config')
     if settings.CFG_ENV_NAME in os.environ:
         cc_cfg = os.environ[settings.CFG_ENV_NAME]
     if cc_cfg and os.path.exists(cc_cfg):
-        tr_cfgs.append(cc_cfg)
-    tr = stages.Transforms(init, tr_cfgs)
+        mod_cfgs.append(cc_cfg)
+    mods = stages.Modules(init, mod_cfgs)
     # Stage 4
     try:
         LOG.debug("Closing stdin")
         util.close_stdin()
-        util.fixup_output(tr.cfg, name)
+        util.fixup_output(mods.cfg, name)
     except:
         util.logexc(LOG, "Failed to setup output redirection!")
     if args.debug:
@@ -263,9 +269,9 @@ def main_transform(action_name, args):
         LOG.debug(("Logging being reset, this logger may no"
                     " longer be active shortly"))
         logging.resetLogging()
-    logging.setupLogging(tr.cfg)
+    logging.setupLogging(mods.cfg)
     # Stage 5
-    return run_transform_section(tr, name, name)
+    return run_module_section(mods, name, name)
 
 
 def main_query(name, _args):
@@ -276,65 +282,49 @@ def main_query(name, _args):
 def main_single(name, args):
     # Cloud-init single stage is broken up into the following sub-stages
     # 1. Ensure that the init object fetches its config without errors
-    # 2. Check to see if we can find the transform name
-    #    in the 'init', 'final', 'config' stages, if not bail
-    # 3. Get the datasource from the init object, if it does
-    #    not exist then that means the main_init stage never
-    #    worked, and thus this stage can not run.
-    # 4. Construct the transform object
-    # 5. Adjust any subsequent logging/output redirections using
-    #    the transform objects configuration
-    # 6. Run the single transform
-    # 7. Done!
-    tr_name = args.name
-    welcome("%s:%s" % (name, tr_name))
+    # 2. Construct the modules object
+    # 3. Adjust any subsequent logging/output redirections using
+    #    the modules objects configuration
+    # 4. Run the single module
+    # 5. Done!
+    mod_name = args.name
+    welcome("%s:%s" % (name, mod_name))
     init = stages.Init(ds_deps=[])
     # Stage 1
     init.read_cfg(extract_fns(args))
-    tr = stages.Transforms(init, extract_fns(args))
-    where_look_mp = {
-        TR_TPL % ('init'): 'init',
-        TR_TPL % ('config'): 'config',
-        TR_TPL % ('final'): 'final',
-    }
-    where_look = list(where_look_mp.keys())
-    found_at = tr.find_transform(tr_name, where_look)
-    if not found_at:
-        msg = ("No known transform named %s "
-              "in sections (%s)") % (tr_name, ", ".join(where_look))
-        LOG.warn(msg)
+    mods = stages.Modules(init, extract_fns(args))
+    mod_args = args.module_args
+    if mod_args:
+        LOG.debug("Using passed in arguments %s", mod_args)
+    mod_freq = args.frequency
+    if mod_freq:
+        LOG.debug("Using passed in frequency %s", mod_freq)
+    # Stage 3
+    try:
+        LOG.debug("Closing stdin")
+        util.close_stdin()
+        util.fixup_output(mods.cfg, None)
+    except:
+        util.logexc(LOG, "Failed to setup output redirection!")
+    if args.debug:
+        # Reset so that all the debug handlers are closed out
+        LOG.debug(("Logging being reset, this logger may no"
+                   " longer be active shortly"))
+        logging.resetLogging()
+    logging.setupLogging(mods.cfg)
+    # Stage 4
+    try:
+        (_run_am, failures) = mods.run_single(mod_name,
+                                              mod_args,
+                                              mod_freq)
+    except ImportError:
+        util.logexc(LOG, "Failed at importing module %s", mod_name)
+        return 1
+    if failures:
+        LOG.debug("Ran %s but it failed", mod_name)
         return 1
     else:
-        LOG.debug("Found transform %s in sections: %s",
-                  tr_name, found_at)
-        sect_name = found_at[0]
-        LOG.debug("Selecting section %s as its 'source' section.", sect_name)
-        tr_args = args.transform_args
-        if tr_args:
-            LOG.debug("Using passed in arguments %s", tr_args)
-        tr_freq = args.frequency
-        if tr_freq:
-            LOG.debug("Using passed in frequency %s", tr_freq)
-        try:
-            LOG.debug("Closing stdin")
-            util.close_stdin()
-            # This seems to use the short name, instead of the long name
-            util.fixup_output(tr.cfg, where_look_mp.get(sect_name))
-        except:
-            util.logexc(LOG, "Failed to setup output redirection!")
-        if args.debug:
-            # Reset so that all the debug handlers are closed out
-            LOG.debug(("Logging being reset, this logger may no"
-                       " longer be active shortly"))
-            logging.resetLogging()
-        logging.setupLogging(tr.cfg)
-        (_run_am, failures) = tr.run_single(tr_name, sect_name,
-                                            tr_args, tr_freq)
-        if failures:
-            LOG.debug("Ran %s but it failed", tr_name)
-            return 1
-        else:
-            return 0
+        return 0
 
 
 def main():
@@ -357,7 +347,7 @@ def main():
     # Each action and its sub-options (if any)
     parser_init = subparsers.add_parser('init', 
                                         help=('initializes cloud-init and'
-                                              ' performs initial transforms'))
+                                              ' performs initial modules'))
     parser_init.add_argument("--local", '-l', action='store_true',
                              help="start in local mode (default: %(default)s)",
                              default=False)
@@ -366,15 +356,15 @@ def main():
     parser_init.set_defaults(action=('init', main_init))
 
     # These settings are used for the 'config' and 'final' stages
-    parser_tr = subparsers.add_parser('transform', 
-                                      help=('performs transforms '
+    parser_mod = subparsers.add_parser('modules', 
+                                      help=('activates modules '
                                             'using a given configuration key'))
-    parser_tr.add_argument("--mode", '-m', action='store',
-                             help=("transform configuration name "
+    parser_mod.add_argument("--mode", '-m', action='store',
+                             help=("module configuration name "
                                     "to use (default: %(default)s)"),
                              default='config',
-                             choices=('config', 'final'))
-    parser_tr.set_defaults(action=('transform', main_transform))
+                             choices=('init', 'config', 'final'))
+    parser_mod.set_defaults(action=('modules', main_modules))
 
     # These settings are used when you want to query information
     # stored in the cloud-init data objects/directories/files
@@ -387,23 +377,21 @@ def main():
                               choices=QUERY_DATA_TYPES)
     parser_query.set_defaults(action=('query', main_query))
 
-    # This subcommand allows you to run a single transform
+    # This subcommand allows you to run a single module
     parser_single = subparsers.add_parser('single', 
-                                         help=('run a single transform '))
+                                         help=('run a single module '))
     parser_single.set_defaults(action=('single', main_single))
     parser_single.add_argument("--name", '-n', action="store",
-                              help="transform name to run",
+                              help="module name to run",
                               required=True)
     parser_single.add_argument("--frequency", action="store",
-                              help=("frequency of "
-                                    " the transform (default: %(default)s)"),
+                              help=("frequency of the module"),
                               required=False,
-                              default=settings.PER_ALWAYS,
                               choices=settings.FREQUENCIES)
-    parser_single.add_argument("transform_args", nargs="*",
+    parser_single.add_argument("module_args", nargs="*",
                               metavar='argument',
                               help=('any additional arguments to'
-                                    ' pass to this transform'))
+                                    ' pass to this module'))
     parser_single.set_defaults(action=('single', main_single))
 
 

From 8aca7214dc9d21ddb72a9b821eaa4cd0d5fea886 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:32:50 -0700
Subject: [PATCH 254/434] 1. Show what we are importing 2. Don't rethrow as a
 runtime exception, let people using this just catch the real error...

---
 cloudinit/importer.py | 12 ++++++++++--
 1 file changed, 10 insertions(+), 2 deletions(-)

diff --git a/cloudinit/importer.py b/cloudinit/importer.py
index 0344d0de..a36b87bc 100644
--- a/cloudinit/importer.py
+++ b/cloudinit/importer.py
@@ -22,10 +22,18 @@
 
 import sys
 
+from cloudinit import log as logging
+from cloudinit import util
 
+LOG = logging.getLogger(__name__)
+
+
+# Simple wrapper that allows us to add more logging in...
 def import_module(module_name):
     try:
+        LOG.debug("Attempting to import module %s", module_name)
         __import__(module_name)
         return sys.modules[module_name]
-    except ImportError as err:
-        raise RuntimeError('Could not load module %s: %s' % (module_name, err))
+    except:
+        util.logexc(LOG, 'Failed at importing %s', module_name)
+        raise

From e8a1908cdb83e7b0b19694c4767247ad0a50903d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:33:21 -0700
Subject: [PATCH 255/434] Move back to the old dashes mixed with underscores for
 now until checking/migrating and then using canonicalized names is done.

---
 config/cloud.cfg | 21 +++++++++------------
 1 file changed, 9 insertions(+), 12 deletions(-)

diff --git a/config/cloud.cfg b/config/cloud.cfg
index b11b5aa5..a87b613d 100644
--- a/config/cloud.cfg
+++ b/config/cloud.cfg
@@ -1,11 +1,11 @@
 # The top level settings are used as transforms
 # and system configuration.
 
-# This user will have its passwd adjusted
+# This user will have its password adjusted
 user: ubuntu
 
 # If this is set, 'root' will not be able to ssh in and they 
-# will get a message to login instead as the above $user
+# will get a message to login instead as the above $user (ubuntu)
 disable_root: true
 
 # This will cause the set+update hostname module to not operate (if true)
@@ -18,21 +18,18 @@ preserve_hostname: false
 #      timeout: 5 # (defaults to 50 seconds)
 #      max_wait: 10 # (defaults to 120 seconds)
 
-# The transform that run in the 'init' stage
+# The modules that run in the 'init' stage
 cloud_init_modules:
-# This is the hash way of specifying a transform
- - name: bootcmd
-# This is the string way of specifying a transform
  - bootcmd
  - resizefs
- - set-hostname
- - update-hostname
- - update-etc-hosts
+ - set_hostname
+ - update_hostname
+ - update_etc_hosts
  - ca-certs
  - rsyslog
  - ssh
 
- # The transforms that run in the 'config' stage
+# The modules that run in the 'config' stage
 cloud_config_modules:
  - mounts
  - ssh-import-id
@@ -51,9 +48,9 @@ cloud_config_modules:
  - runcmd
  - byobu
 
-# The transforms that run in the 'final' stage
+# The modules that run in the 'final' stage
 cloud_final_modules:
- - rightscale-userdata
+ - rightscale_userdata
  - scripts-per-once
  - scripts-per-boot
  - scripts-per-instance

From 6a1e0d2426f8ce3d19c78b98e297ac18d54120df Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:34:09 -0700
Subject: [PATCH 256/434] 1. Add a comment that the upstart dir should probably
 be put elsewhere sometime (in a distro specific build?)    since not all
 distros fully support upstart that is in config here or even have upstart in
 general at all (for various reasons) 2. Found out that we really do need to
 specify these 2 packages due to the following    a. The cloudinit root needs
 to be a package (pretty obvious)    b. Not so obvious is the cloudinit.conf
 also needs to be a package so that its modules can be directly imported
 without       referring to the module name.

---
 setup.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/setup.py b/setup.py
index 9ee58b9a..d2e022f0 100755
--- a/setup.py
+++ b/setup.py
@@ -26,7 +26,6 @@ import os
 import re
 
 from distutils.core import setup
-from setuptools import find_packages
 
 
 def is_f(p):
@@ -69,13 +68,17 @@ setup(name='cloud-init',
       author='Scott Moser',
       author_email='scott.moser@canonical.com',
       url='http://launchpad.net/cloud-init/',
-      packages=find_packages(),
+      # This second package referencing cloudinit.conf.*
+      # makes the config modules accessible to the whole
+      # import system...
+      packages=['cloudinit', 'cloudinit.conf'],
       scripts=['bin/cloud-init',
                'tools/cloud-init-per',
                ],
       data_files=[('/etc/cloud', glob('config/*.cfg')),
                   ('/etc/cloud/cloud.cfg.d', glob('config/cloud.cfg.d/*')),
                   ('/etc/cloud/templates', glob('templates/*')),
+                  # Only really need for upstart based systems
                   ('/etc/init', glob('upstart/*.conf')),
                   ('/usr/share/cloud-init', []),
                   ('/usr/lib/cloud-init',

From 84e97a885fd407290b28aacff0af1f7afd56540d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:36:02 -0700
Subject: [PATCH 257/434] Move the configparser helper here, since having it
 in a cfg.py is confusing when there is also a directory named 'config'

---
 cloudinit/helpers.py | 63 ++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 63 insertions(+)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 21d203db..45633e0f 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -23,8 +23,11 @@
 from time import time
 
 import contextlib
+import io
 import os
 
+from ConfigParser import (NoSectionError, NoOptionError, RawConfigParser)
+
 from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS, PER_ONCE)
 
 from cloudinit import log as logging
@@ -298,3 +301,63 @@ class Paths(object):
             return None
         else:
             return ipath
+
+
+# This config parser will not throw when sections don't exist
+# and you are setting values on those sections which is useful
+# when writing to new options that may not have corresponding
+# sections. Also it can default other values when doing gets
+# so that if those sections/options do not exist you will
+# get a default instead of an error. Another useful case where
+# you can avoid catching exceptions that you typically don't
+# care about...
+
+class DefaultingConfigParser(RawConfigParser):
+    DEF_INT = 0
+    DEF_FLOAT = 0.0
+    DEF_BOOLEAN = False
+    DEF_BASE = None
+
+    def get(self, section, option):
+        value = self.DEF_BASE
+        try:
+            value = RawConfigParser.get(self, section, option)
+        except NoSectionError:
+            pass
+        except NoOptionError:
+            pass
+        return value
+
+    def set(self, section, option, value):
+        if not self.has_section(section) and section.lower() != 'default':
+            self.add_section(section)
+        RawConfigParser.set(self, section, option, value)
+
+    def remove_option(self, section, option):
+        if self.has_option(section, option):
+            RawConfigParser.remove_option(self, section, option)
+
+    def getboolean(self, section, option):
+        if not self.has_option(section, option):
+            return self.DEF_BOOLEAN
+        return RawConfigParser.getboolean(self, section, option)
+
+    def getfloat(self, section, option):
+        if not self.has_option(section, option):
+            return self.DEF_FLOAT
+        return RawConfigParser.getfloat(self, section, option)
+
+    def getint(self, section, option):
+        if not self.has_option(section, option):
+            return self.DEF_INT
+        return RawConfigParser.getint(self, section, option)
+
+    def stringify(self, header=None):
+        contents = ''
+        with io.BytesIO() as outputstream:
+            self.write(outputstream)
+            outputstream.flush()
+            contents = outputstream.getvalue()
+            if header:
+                contents = "\n".join([header, contents])
+        return contents

From 44886fb12ef798c49a72f5138f5279cdcd133075 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:36:47 -0700
Subject: [PATCH 258/434] Removed this to avoid the confusion of having both
 a cfg module and a config dir.

---
 cloudinit/cfg.py | 80 ------------------------------------------------
 1 file changed, 80 deletions(-)
 delete mode 100644 cloudinit/cfg.py

diff --git a/cloudinit/cfg.py b/cloudinit/cfg.py
deleted file mode 100644
index 215ed855..00000000
--- a/cloudinit/cfg.py
+++ /dev/null
@@ -1,80 +0,0 @@
-# vi: ts=4 expandtab
-#
-#    Copyright (C) 2012 Yahoo! Inc.
-#
-#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
-#
-#    This program is free software: you can redistribute it and/or modify
-#    it under the terms of the GNU General Public License version 3, as
-#    published by the Free Software Foundation.
-#
-#    This program is distributed in the hope that it will be useful,
-#    but WITHOUT ANY WARRANTY; without even the implied warranty of
-#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-#    GNU General Public License for more details.
-#
-#    You should have received a copy of the GNU General Public License
-#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-import io
-
-from ConfigParser import (NoSectionError, NoOptionError, RawConfigParser)
-
-# This config parser will not throw when sections don't exist
-# and you are setting values on those sections which is useful
-# when writing to new options that may not have corresponding
-# sections. Also it can default other values when doing gets
-# so that if those sections/options do not exist you will
-# get a default instead of an error. Another useful case where
-# you can avoid catching exceptions that you typically don't
-# care about...
-
-class DefaultingConfigParser(RawConfigParser):
-    DEF_INT = 0
-    DEF_FLOAT = 0.0
-    DEF_BOOLEAN = False
-    DEF_BASE = None
-
-    def get(self, section, option):
-        value = self.DEF_BASE
-        try:
-            value = RawConfigParser.get(self, section, option)
-        except NoSectionError:
-            pass
-        except NoOptionError:
-            pass
-        return value
-
-    def set(self, section, option, value):
-        if not self.has_section(section) and section.lower() != 'default':
-            self.add_section(section)
-        RawConfigParser.set(self, section, option, value)
-
-    def remove_option(self, section, option):
-        if self.has_option(section, option):
-            RawConfigParser.remove_option(self, section, option)
-
-    def getboolean(self, section, option):
-        if not self.has_option(section, option):
-            return self.DEF_BOOLEAN
-        return RawConfigParser.getboolean(self, section, option)
-
-    def getfloat(self, section, option):
-        if not self.has_option(section, option):
-            return self.DEF_FLOAT
-        return RawConfigParser.getfloat(self, section, option)
-
-    def getint(self, section, option):
-        if not self.has_option(section, option):
-            return self.DEF_INT
-        return RawConfigParser.getint(self, section, option)
-
-    def stringify(self, header=None):
-        contents = ''
-        with io.BytesIO() as outputstream:
-            self.write(outputstream)
-            outputstream.flush()
-            contents = outputstream.getvalue()
-            if header:
-                contents = "\n".join([header, contents])
-        return contents

From a535a200882757f612168a8c28089f89c2f17a40 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:37:10 -0700
Subject: [PATCH 259/434] The 'cfg' module has been removed and moved to
 'helpers' to avoid confusion. These modules used the 'cfg' module, so
 adjust them.

---
 cloudinit/{transforms => config}/__init__.py                  | 0
 cloudinit/{transforms => config}/apt_pipelining.py            | 0
 cloudinit/{transforms => config}/apt_update_upgrade.py        | 0
 cloudinit/{transforms => config}/bootcmd.py                   | 0
 cloudinit/{transforms => config}/byobu.py                     | 0
 cloudinit/{transforms => config}/ca_certs.py                  | 0
 .../{transforms/mcollective.py => config/cc_mcollective.py}   | 4 ++--
 cloudinit/{transforms/puppet.py => config/cc_puppet.py}       | 4 ++--
 cloudinit/{transforms => config}/chef.py                      | 0
 cloudinit/{transforms => config}/disable_ec2_metadata.py      | 0
 cloudinit/{transforms => config}/final_message.py             | 0
 cloudinit/{transforms => config}/foo.py                       | 0
 cloudinit/{transforms => config}/grub_dpkg.py                 | 0
 cloudinit/{transforms => config}/keys_to_console.py           | 0
 cloudinit/{transforms => config}/landscape.py                 | 0
 cloudinit/{transforms => config}/locale.py                    | 0
 cloudinit/{transforms => config}/mounts.py                    | 0
 cloudinit/{transforms => config}/phone_home.py                | 0
 cloudinit/{transforms => config}/resizefs.py                  | 0
 cloudinit/{transforms => config}/rightscale_userdata.py       | 0
 cloudinit/{transforms => config}/rsyslog.py                   | 0
 cloudinit/{transforms => config}/runcmd.py                    | 0
 cloudinit/{transforms => config}/salt_minion.py               | 0
 cloudinit/{transforms => config}/scripts_per_boot.py          | 0
 cloudinit/{transforms => config}/scripts_per_instance.py      | 0
 cloudinit/{transforms => config}/scripts_per_once.py          | 0
 cloudinit/{transforms => config}/scripts_user.py              | 0
 cloudinit/{transforms => config}/set_hostname.py              | 0
 cloudinit/{transforms => config}/set_passwords.py             | 0
 cloudinit/{transforms => config}/ssh.py                       | 0
 cloudinit/{transforms => config}/ssh_import_id.py             | 0
 cloudinit/{transforms => config}/timezone.py                  | 0
 cloudinit/{transforms => config}/update_etc_hosts.py          | 0
 cloudinit/{transforms => config}/update_hostname.py           | 0
 34 files changed, 4 insertions(+), 4 deletions(-)
 rename cloudinit/{transforms => config}/__init__.py (100%)
 rename cloudinit/{transforms => config}/apt_pipelining.py (100%)
 rename cloudinit/{transforms => config}/apt_update_upgrade.py (100%)
 rename cloudinit/{transforms => config}/bootcmd.py (100%)
 rename cloudinit/{transforms => config}/byobu.py (100%)
 rename cloudinit/{transforms => config}/ca_certs.py (100%)
 rename cloudinit/{transforms/mcollective.py => config/cc_mcollective.py} (97%)
 rename cloudinit/{transforms/puppet.py => config/cc_puppet.py} (98%)
 rename cloudinit/{transforms => config}/chef.py (100%)
 rename cloudinit/{transforms => config}/disable_ec2_metadata.py (100%)
 rename cloudinit/{transforms => config}/final_message.py (100%)
 rename cloudinit/{transforms => config}/foo.py (100%)
 rename cloudinit/{transforms => config}/grub_dpkg.py (100%)
 rename cloudinit/{transforms => config}/keys_to_console.py (100%)
 rename cloudinit/{transforms => config}/landscape.py (100%)
 rename cloudinit/{transforms => config}/locale.py (100%)
 rename cloudinit/{transforms => config}/mounts.py (100%)
 rename cloudinit/{transforms => config}/phone_home.py (100%)
 rename cloudinit/{transforms => config}/resizefs.py (100%)
 rename cloudinit/{transforms => config}/rightscale_userdata.py (100%)
 rename cloudinit/{transforms => config}/rsyslog.py (100%)
 rename cloudinit/{transforms => config}/runcmd.py (100%)
 rename cloudinit/{transforms => config}/salt_minion.py (100%)
 rename cloudinit/{transforms => config}/scripts_per_boot.py (100%)
 rename cloudinit/{transforms => config}/scripts_per_instance.py (100%)
 rename cloudinit/{transforms => config}/scripts_per_once.py (100%)
 rename cloudinit/{transforms => config}/scripts_user.py (100%)
 rename cloudinit/{transforms => config}/set_hostname.py (100%)
 rename cloudinit/{transforms => config}/set_passwords.py (100%)
 rename cloudinit/{transforms => config}/ssh.py (100%)
 rename cloudinit/{transforms => config}/ssh_import_id.py (100%)
 rename cloudinit/{transforms => config}/timezone.py (100%)
 rename cloudinit/{transforms => config}/update_etc_hosts.py (100%)
 rename cloudinit/{transforms => config}/update_hostname.py (100%)

diff --git a/cloudinit/transforms/__init__.py b/cloudinit/config/__init__.py
similarity index 100%
rename from cloudinit/transforms/__init__.py
rename to cloudinit/config/__init__.py
diff --git a/cloudinit/transforms/apt_pipelining.py b/cloudinit/config/apt_pipelining.py
similarity index 100%
rename from cloudinit/transforms/apt_pipelining.py
rename to cloudinit/config/apt_pipelining.py
diff --git a/cloudinit/transforms/apt_update_upgrade.py b/cloudinit/config/apt_update_upgrade.py
similarity index 100%
rename from cloudinit/transforms/apt_update_upgrade.py
rename to cloudinit/config/apt_update_upgrade.py
diff --git a/cloudinit/transforms/bootcmd.py b/cloudinit/config/bootcmd.py
similarity index 100%
rename from cloudinit/transforms/bootcmd.py
rename to cloudinit/config/bootcmd.py
diff --git a/cloudinit/transforms/byobu.py b/cloudinit/config/byobu.py
similarity index 100%
rename from cloudinit/transforms/byobu.py
rename to cloudinit/config/byobu.py
diff --git a/cloudinit/transforms/ca_certs.py b/cloudinit/config/ca_certs.py
similarity index 100%
rename from cloudinit/transforms/ca_certs.py
rename to cloudinit/config/ca_certs.py
diff --git a/cloudinit/transforms/mcollective.py b/cloudinit/config/cc_mcollective.py
similarity index 97%
rename from cloudinit/transforms/mcollective.py
rename to cloudinit/config/cc_mcollective.py
index 9754d6b8..4cec6494 100644
--- a/cloudinit/transforms/mcollective.py
+++ b/cloudinit/config/cc_mcollective.py
@@ -21,7 +21,7 @@
 
 from StringIO import StringIO
 
-from cloudinit import cfg as config
+from cloudinit import helpers
 from cloudinit import util
 
 PUBCERT_FILE = "/etc/mcollective/ssl/server-public.pem"
@@ -44,7 +44,7 @@ def handle(name, cfg, cloud, log, _args):
     # ... and then update the mcollective configuration
     if 'conf' in mcollective_cfg:
         # Create object for reading server.cfg values
-        mcollective_config = config.DefaultingConfigParser()
+        mcollective_config = helpers.DefaultingConfigParser()
         # Read server.cfg values from original file in order to be able to mix
         # the rest up
         server_cfg_fn = cloud.paths.join(True, '/etc/mcollective/server.cfg')
diff --git a/cloudinit/transforms/puppet.py b/cloudinit/config/cc_puppet.py
similarity index 98%
rename from cloudinit/transforms/puppet.py
rename to cloudinit/config/cc_puppet.py
index d55118ea..5fb88bf2 100644
--- a/cloudinit/transforms/puppet.py
+++ b/cloudinit/config/cc_puppet.py
@@ -24,7 +24,7 @@ import os
 import pwd
 import socket
 
-from cloudinit import cfg as config
+from cloudinit import helpers
 from cloudinit import util
 
 
@@ -46,7 +46,7 @@ def handle(name, cfg, cloud, log, _args):
         puppet_conf_fn = cloud.paths.join(False, '/etc/puppet/puppet.conf')
         contents = util.load_file(puppet_conf_fn)
         # Create object for reading puppet.conf values
-        puppet_config = config.DefaultingConfigParser()
+        puppet_config = helpers.DefaultingConfigParser()
         # Read puppet.conf values from original file in order to be able to
         # mix the rest up. First clean them up (TODO is this really needed??)
         cleaned_lines = [i.lstrip() for i in contents.splitlines()]
diff --git a/cloudinit/transforms/chef.py b/cloudinit/config/chef.py
similarity index 100%
rename from cloudinit/transforms/chef.py
rename to cloudinit/config/chef.py
diff --git a/cloudinit/transforms/disable_ec2_metadata.py b/cloudinit/config/disable_ec2_metadata.py
similarity index 100%
rename from cloudinit/transforms/disable_ec2_metadata.py
rename to cloudinit/config/disable_ec2_metadata.py
diff --git a/cloudinit/transforms/final_message.py b/cloudinit/config/final_message.py
similarity index 100%
rename from cloudinit/transforms/final_message.py
rename to cloudinit/config/final_message.py
diff --git a/cloudinit/transforms/foo.py b/cloudinit/config/foo.py
similarity index 100%
rename from cloudinit/transforms/foo.py
rename to cloudinit/config/foo.py
diff --git a/cloudinit/transforms/grub_dpkg.py b/cloudinit/config/grub_dpkg.py
similarity index 100%
rename from cloudinit/transforms/grub_dpkg.py
rename to cloudinit/config/grub_dpkg.py
diff --git a/cloudinit/transforms/keys_to_console.py b/cloudinit/config/keys_to_console.py
similarity index 100%
rename from cloudinit/transforms/keys_to_console.py
rename to cloudinit/config/keys_to_console.py
diff --git a/cloudinit/transforms/landscape.py b/cloudinit/config/landscape.py
similarity index 100%
rename from cloudinit/transforms/landscape.py
rename to cloudinit/config/landscape.py
diff --git a/cloudinit/transforms/locale.py b/cloudinit/config/locale.py
similarity index 100%
rename from cloudinit/transforms/locale.py
rename to cloudinit/config/locale.py
diff --git a/cloudinit/transforms/mounts.py b/cloudinit/config/mounts.py
similarity index 100%
rename from cloudinit/transforms/mounts.py
rename to cloudinit/config/mounts.py
diff --git a/cloudinit/transforms/phone_home.py b/cloudinit/config/phone_home.py
similarity index 100%
rename from cloudinit/transforms/phone_home.py
rename to cloudinit/config/phone_home.py
diff --git a/cloudinit/transforms/resizefs.py b/cloudinit/config/resizefs.py
similarity index 100%
rename from cloudinit/transforms/resizefs.py
rename to cloudinit/config/resizefs.py
diff --git a/cloudinit/transforms/rightscale_userdata.py b/cloudinit/config/rightscale_userdata.py
similarity index 100%
rename from cloudinit/transforms/rightscale_userdata.py
rename to cloudinit/config/rightscale_userdata.py
diff --git a/cloudinit/transforms/rsyslog.py b/cloudinit/config/rsyslog.py
similarity index 100%
rename from cloudinit/transforms/rsyslog.py
rename to cloudinit/config/rsyslog.py
diff --git a/cloudinit/transforms/runcmd.py b/cloudinit/config/runcmd.py
similarity index 100%
rename from cloudinit/transforms/runcmd.py
rename to cloudinit/config/runcmd.py
diff --git a/cloudinit/transforms/salt_minion.py b/cloudinit/config/salt_minion.py
similarity index 100%
rename from cloudinit/transforms/salt_minion.py
rename to cloudinit/config/salt_minion.py
diff --git a/cloudinit/transforms/scripts_per_boot.py b/cloudinit/config/scripts_per_boot.py
similarity index 100%
rename from cloudinit/transforms/scripts_per_boot.py
rename to cloudinit/config/scripts_per_boot.py
diff --git a/cloudinit/transforms/scripts_per_instance.py b/cloudinit/config/scripts_per_instance.py
similarity index 100%
rename from cloudinit/transforms/scripts_per_instance.py
rename to cloudinit/config/scripts_per_instance.py
diff --git a/cloudinit/transforms/scripts_per_once.py b/cloudinit/config/scripts_per_once.py
similarity index 100%
rename from cloudinit/transforms/scripts_per_once.py
rename to cloudinit/config/scripts_per_once.py
diff --git a/cloudinit/transforms/scripts_user.py b/cloudinit/config/scripts_user.py
similarity index 100%
rename from cloudinit/transforms/scripts_user.py
rename to cloudinit/config/scripts_user.py
diff --git a/cloudinit/transforms/set_hostname.py b/cloudinit/config/set_hostname.py
similarity index 100%
rename from cloudinit/transforms/set_hostname.py
rename to cloudinit/config/set_hostname.py
diff --git a/cloudinit/transforms/set_passwords.py b/cloudinit/config/set_passwords.py
similarity index 100%
rename from cloudinit/transforms/set_passwords.py
rename to cloudinit/config/set_passwords.py
diff --git a/cloudinit/transforms/ssh.py b/cloudinit/config/ssh.py
similarity index 100%
rename from cloudinit/transforms/ssh.py
rename to cloudinit/config/ssh.py
diff --git a/cloudinit/transforms/ssh_import_id.py b/cloudinit/config/ssh_import_id.py
similarity index 100%
rename from cloudinit/transforms/ssh_import_id.py
rename to cloudinit/config/ssh_import_id.py
diff --git a/cloudinit/transforms/timezone.py b/cloudinit/config/timezone.py
similarity index 100%
rename from cloudinit/transforms/timezone.py
rename to cloudinit/config/timezone.py
diff --git a/cloudinit/transforms/update_etc_hosts.py b/cloudinit/config/update_etc_hosts.py
similarity index 100%
rename from cloudinit/transforms/update_etc_hosts.py
rename to cloudinit/config/update_etc_hosts.py
diff --git a/cloudinit/transforms/update_hostname.py b/cloudinit/config/update_hostname.py
similarity index 100%
rename from cloudinit/transforms/update_hostname.py
rename to cloudinit/config/update_hostname.py

From 214dd527cb17e7340b452a84815ba4808beb283b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:39:09 -0700
Subject: [PATCH 260/434] Renamed back to 'cc_*' with the reasoning being that
 'cc_' provides some protection against module name collisions when importing.

---
 cloudinit/config/__init__.py                  | 19 +++++++++++--------
 ...apt_pipelining.py => cc_apt_pipelining.py} |  0
 ...te_upgrade.py => cc_apt_update_upgrade.py} |  0
 .../config/{bootcmd.py => cc_bootcmd.py}      |  0
 cloudinit/config/{byobu.py => cc_byobu.py}    |  0
 .../config/{ca_certs.py => cc_ca_certs.py}    |  0
 cloudinit/config/{chef.py => cc_chef.py}      |  0
 ...metadata.py => cc_disable_ec2_metadata.py} |  0
 .../{final_message.py => cc_final_message.py} |  0
 cloudinit/config/{foo.py => cc_foo.py}        |  0
 .../config/{grub_dpkg.py => cc_grub_dpkg.py}  |  0
 ...ys_to_console.py => cc_keys_to_console.py} |  0
 .../config/{landscape.py => cc_landscape.py}  |  0
 cloudinit/config/{locale.py => cc_locale.py}  |  0
 cloudinit/config/{mounts.py => cc_mounts.py}  |  0
 .../{phone_home.py => cc_phone_home.py}       |  0
 .../config/{resizefs.py => cc_resizefs.py}    |  0
 ..._userdata.py => cc_rightscale_userdata.py} |  0
 .../config/{rsyslog.py => cc_rsyslog.py}      |  0
 cloudinit/config/{runcmd.py => cc_runcmd.py}  |  0
 .../{salt_minion.py => cc_salt_minion.py}     |  0
 ...pts_per_boot.py => cc_scripts_per_boot.py} |  0
 ...instance.py => cc_scripts_per_instance.py} |  0
 ...pts_per_once.py => cc_scripts_per_once.py} |  0
 .../{scripts_user.py => cc_scripts_user.py}   |  0
 .../{set_hostname.py => cc_set_hostname.py}   |  0
 .../{set_passwords.py => cc_set_passwords.py} |  0
 cloudinit/config/{ssh.py => cc_ssh.py}        |  0
 .../{ssh_import_id.py => cc_ssh_import_id.py} |  0
 .../config/{timezone.py => cc_timezone.py}    |  0
 ...te_etc_hosts.py => cc_update_etc_hosts.py} |  0
 ...date_hostname.py => cc_update_hostname.py} |  0
 32 files changed, 11 insertions(+), 8 deletions(-)
 rename cloudinit/config/{apt_pipelining.py => cc_apt_pipelining.py} (100%)
 rename cloudinit/config/{apt_update_upgrade.py => cc_apt_update_upgrade.py} (100%)
 rename cloudinit/config/{bootcmd.py => cc_bootcmd.py} (100%)
 rename cloudinit/config/{byobu.py => cc_byobu.py} (100%)
 rename cloudinit/config/{ca_certs.py => cc_ca_certs.py} (100%)
 rename cloudinit/config/{chef.py => cc_chef.py} (100%)
 rename cloudinit/config/{disable_ec2_metadata.py => cc_disable_ec2_metadata.py} (100%)
 rename cloudinit/config/{final_message.py => cc_final_message.py} (100%)
 rename cloudinit/config/{foo.py => cc_foo.py} (100%)
 rename cloudinit/config/{grub_dpkg.py => cc_grub_dpkg.py} (100%)
 rename cloudinit/config/{keys_to_console.py => cc_keys_to_console.py} (100%)
 rename cloudinit/config/{landscape.py => cc_landscape.py} (100%)
 rename cloudinit/config/{locale.py => cc_locale.py} (100%)
 rename cloudinit/config/{mounts.py => cc_mounts.py} (100%)
 rename cloudinit/config/{phone_home.py => cc_phone_home.py} (100%)
 rename cloudinit/config/{resizefs.py => cc_resizefs.py} (100%)
 rename cloudinit/config/{rightscale_userdata.py => cc_rightscale_userdata.py} (100%)
 rename cloudinit/config/{rsyslog.py => cc_rsyslog.py} (100%)
 rename cloudinit/config/{runcmd.py => cc_runcmd.py} (100%)
 rename cloudinit/config/{salt_minion.py => cc_salt_minion.py} (100%)
 rename cloudinit/config/{scripts_per_boot.py => cc_scripts_per_boot.py} (100%)
 rename cloudinit/config/{scripts_per_instance.py => cc_scripts_per_instance.py} (100%)
 rename cloudinit/config/{scripts_per_once.py => cc_scripts_per_once.py} (100%)
 rename cloudinit/config/{scripts_user.py => cc_scripts_user.py} (100%)
 rename cloudinit/config/{set_hostname.py => cc_set_hostname.py} (100%)
 rename cloudinit/config/{set_passwords.py => cc_set_passwords.py} (100%)
 rename cloudinit/config/{ssh.py => cc_ssh.py} (100%)
 rename cloudinit/config/{ssh_import_id.py => cc_ssh_import_id.py} (100%)
 rename cloudinit/config/{timezone.py => cc_timezone.py} (100%)
 rename cloudinit/config/{update_etc_hosts.py => cc_update_etc_hosts.py} (100%)
 rename cloudinit/config/{update_hostname.py => cc_update_hostname.py} (100%)

diff --git a/cloudinit/config/__init__.py b/cloudinit/config/__init__.py
index 5cd08575..74e2f275 100644
--- a/cloudinit/config/__init__.py
+++ b/cloudinit/config/__init__.py
@@ -25,29 +25,32 @@ from cloudinit import log as logging
 
 LOG = logging.getLogger(__name__)
 
-# TODO remove this from being a prefix??
-TRANSFORM_PREFIX = ''  # "cc_"
+# This prefix is used to make it less 
+# of a change that when importing
+# we will not find something else with the same
+# name in the lookup path...
+MOD_PREFIX = "cc_"
 
 
-def form_transform_name(name, mod=__name__):
+def form_module_name(name):
     canon_name = name.replace("-", "_")
     if canon_name.lower().endswith(".py"):
         canon_name = canon_name[0:(len(canon_name) - 3)]
     canon_name = canon_name.strip()
     if not canon_name:
         return None
-    if not canon_name.startswith(TRANSFORM_PREFIX):
-        canon_name = '%s%s' % (TRANSFORM_PREFIX, canon_name)
-    return ".".join([str(mod), str(canon_name)])
+    if not canon_name.startswith(MOD_PREFIX):
+        canon_name = '%s%s' % (MOD_PREFIX, canon_name)
+    return canon_name
 
 
-def fixup_transform(mod, def_freq=PER_INSTANCE):
+def fixup_module(mod, def_freq=PER_INSTANCE):
     if not hasattr(mod, 'frequency'):
         setattr(mod, 'frequency', def_freq)
     else:
         freq = mod.frequency
         if freq and freq not in FREQUENCIES:
-            LOG.warn("Transform %s has an unknown frequency %s", mod, freq)
+            LOG.warn("Module %s has an unknown frequency %s", mod, freq)
     if not hasattr(mod, 'handle'):
         def empty_handle(_name, _cfg, _cloud, _log, _args):
             pass
diff --git a/cloudinit/config/apt_pipelining.py b/cloudinit/config/cc_apt_pipelining.py
similarity index 100%
rename from cloudinit/config/apt_pipelining.py
rename to cloudinit/config/cc_apt_pipelining.py
diff --git a/cloudinit/config/apt_update_upgrade.py b/cloudinit/config/cc_apt_update_upgrade.py
similarity index 100%
rename from cloudinit/config/apt_update_upgrade.py
rename to cloudinit/config/cc_apt_update_upgrade.py
diff --git a/cloudinit/config/bootcmd.py b/cloudinit/config/cc_bootcmd.py
similarity index 100%
rename from cloudinit/config/bootcmd.py
rename to cloudinit/config/cc_bootcmd.py
diff --git a/cloudinit/config/byobu.py b/cloudinit/config/cc_byobu.py
similarity index 100%
rename from cloudinit/config/byobu.py
rename to cloudinit/config/cc_byobu.py
diff --git a/cloudinit/config/ca_certs.py b/cloudinit/config/cc_ca_certs.py
similarity index 100%
rename from cloudinit/config/ca_certs.py
rename to cloudinit/config/cc_ca_certs.py
diff --git a/cloudinit/config/chef.py b/cloudinit/config/cc_chef.py
similarity index 100%
rename from cloudinit/config/chef.py
rename to cloudinit/config/cc_chef.py
diff --git a/cloudinit/config/disable_ec2_metadata.py b/cloudinit/config/cc_disable_ec2_metadata.py
similarity index 100%
rename from cloudinit/config/disable_ec2_metadata.py
rename to cloudinit/config/cc_disable_ec2_metadata.py
diff --git a/cloudinit/config/final_message.py b/cloudinit/config/cc_final_message.py
similarity index 100%
rename from cloudinit/config/final_message.py
rename to cloudinit/config/cc_final_message.py
diff --git a/cloudinit/config/foo.py b/cloudinit/config/cc_foo.py
similarity index 100%
rename from cloudinit/config/foo.py
rename to cloudinit/config/cc_foo.py
diff --git a/cloudinit/config/grub_dpkg.py b/cloudinit/config/cc_grub_dpkg.py
similarity index 100%
rename from cloudinit/config/grub_dpkg.py
rename to cloudinit/config/cc_grub_dpkg.py
diff --git a/cloudinit/config/keys_to_console.py b/cloudinit/config/cc_keys_to_console.py
similarity index 100%
rename from cloudinit/config/keys_to_console.py
rename to cloudinit/config/cc_keys_to_console.py
diff --git a/cloudinit/config/landscape.py b/cloudinit/config/cc_landscape.py
similarity index 100%
rename from cloudinit/config/landscape.py
rename to cloudinit/config/cc_landscape.py
diff --git a/cloudinit/config/locale.py b/cloudinit/config/cc_locale.py
similarity index 100%
rename from cloudinit/config/locale.py
rename to cloudinit/config/cc_locale.py
diff --git a/cloudinit/config/mounts.py b/cloudinit/config/cc_mounts.py
similarity index 100%
rename from cloudinit/config/mounts.py
rename to cloudinit/config/cc_mounts.py
diff --git a/cloudinit/config/phone_home.py b/cloudinit/config/cc_phone_home.py
similarity index 100%
rename from cloudinit/config/phone_home.py
rename to cloudinit/config/cc_phone_home.py
diff --git a/cloudinit/config/resizefs.py b/cloudinit/config/cc_resizefs.py
similarity index 100%
rename from cloudinit/config/resizefs.py
rename to cloudinit/config/cc_resizefs.py
diff --git a/cloudinit/config/rightscale_userdata.py b/cloudinit/config/cc_rightscale_userdata.py
similarity index 100%
rename from cloudinit/config/rightscale_userdata.py
rename to cloudinit/config/cc_rightscale_userdata.py
diff --git a/cloudinit/config/rsyslog.py b/cloudinit/config/cc_rsyslog.py
similarity index 100%
rename from cloudinit/config/rsyslog.py
rename to cloudinit/config/cc_rsyslog.py
diff --git a/cloudinit/config/runcmd.py b/cloudinit/config/cc_runcmd.py
similarity index 100%
rename from cloudinit/config/runcmd.py
rename to cloudinit/config/cc_runcmd.py
diff --git a/cloudinit/config/salt_minion.py b/cloudinit/config/cc_salt_minion.py
similarity index 100%
rename from cloudinit/config/salt_minion.py
rename to cloudinit/config/cc_salt_minion.py
diff --git a/cloudinit/config/scripts_per_boot.py b/cloudinit/config/cc_scripts_per_boot.py
similarity index 100%
rename from cloudinit/config/scripts_per_boot.py
rename to cloudinit/config/cc_scripts_per_boot.py
diff --git a/cloudinit/config/scripts_per_instance.py b/cloudinit/config/cc_scripts_per_instance.py
similarity index 100%
rename from cloudinit/config/scripts_per_instance.py
rename to cloudinit/config/cc_scripts_per_instance.py
diff --git a/cloudinit/config/scripts_per_once.py b/cloudinit/config/cc_scripts_per_once.py
similarity index 100%
rename from cloudinit/config/scripts_per_once.py
rename to cloudinit/config/cc_scripts_per_once.py
diff --git a/cloudinit/config/scripts_user.py b/cloudinit/config/cc_scripts_user.py
similarity index 100%
rename from cloudinit/config/scripts_user.py
rename to cloudinit/config/cc_scripts_user.py
diff --git a/cloudinit/config/set_hostname.py b/cloudinit/config/cc_set_hostname.py
similarity index 100%
rename from cloudinit/config/set_hostname.py
rename to cloudinit/config/cc_set_hostname.py
diff --git a/cloudinit/config/set_passwords.py b/cloudinit/config/cc_set_passwords.py
similarity index 100%
rename from cloudinit/config/set_passwords.py
rename to cloudinit/config/cc_set_passwords.py
diff --git a/cloudinit/config/ssh.py b/cloudinit/config/cc_ssh.py
similarity index 100%
rename from cloudinit/config/ssh.py
rename to cloudinit/config/cc_ssh.py
diff --git a/cloudinit/config/ssh_import_id.py b/cloudinit/config/cc_ssh_import_id.py
similarity index 100%
rename from cloudinit/config/ssh_import_id.py
rename to cloudinit/config/cc_ssh_import_id.py
diff --git a/cloudinit/config/timezone.py b/cloudinit/config/cc_timezone.py
similarity index 100%
rename from cloudinit/config/timezone.py
rename to cloudinit/config/cc_timezone.py
diff --git a/cloudinit/config/update_etc_hosts.py b/cloudinit/config/cc_update_etc_hosts.py
similarity index 100%
rename from cloudinit/config/update_etc_hosts.py
rename to cloudinit/config/cc_update_etc_hosts.py
diff --git a/cloudinit/config/update_hostname.py b/cloudinit/config/cc_update_hostname.py
similarity index 100%
rename from cloudinit/config/update_hostname.py
rename to cloudinit/config/cc_update_hostname.py

From 66e91af60ddc202a191371c06fece475ca8427e4 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:39:56 -0700
Subject: [PATCH 261/434] Catch the import error rather than the runtime error.

---
 cloudinit/distros/__init__.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index 6a98fdb1..45dd85ec 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -147,10 +147,10 @@ class Distro(object):
 def fetch(distro_name, mods=(__name__, )):
     mod = None
     for m in mods:
+        mod_name = "%s.%s" % (m, distro_name)
         try:
-            mod_name = "%s.%s" % (m, distro_name)
             mod = importer.import_module(mod_name)
-        except RuntimeError:
+        except ImportError:
             pass
     if not mod:
         raise RuntimeError("No distribution found for distro %s"

From 9f8c697088861f2a0586515c6a62536fb075eca8 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:40:16 -0700
Subject: [PATCH 262/434] Change to import error instead of runtime error.

---
 cloudinit/sources/__init__.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 35fc01df..8ab7cf54 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -198,11 +198,13 @@ def list_sources(cfg_list, depends, pkg_list):
         for pkg in pkg_list:
             pkg_name = []
             if pkg:
+                # Any package name given, this affects
+                # the lookup path
                 pkg_name.append(str(pkg))
             pkg_name.append(ds_name)
             try:
                 mod = importer.import_module(".".join(pkg_name))
-            except RuntimeError:
+            except ImportError:
                 continue
             lister = getattr(mod, "get_datasource_list", None)
             if not lister:

From 8ed740ce0f45dadf2b77dd45e41486e276b67ef0 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 16:40:39 -0700
Subject: [PATCH 263/434] 1. Rename to modules instead of transforms 2. Run
 single will now attempt to run a module of a given name, if it can find it
 (no restrictions on config)

---
 cloudinit/stages.py | 80 +++++++++++++++++++--------------------------
 1 file changed, 33 insertions(+), 47 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 334d5004..ae6e2de5 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -35,18 +35,20 @@ from cloudinit.settings import (OLD_CLOUD_CONFIG)
 from cloudinit.settings import (PER_INSTANCE, FREQUENCIES)
 
 from cloudinit import handlers
+
+# Default handlers (used if not overridden)
 from cloudinit.handlers import boot_hook as bh_part
 from cloudinit.handlers import cloud_config as cc_part
 from cloudinit.handlers import shell_script as ss_part
 from cloudinit.handlers import upstart_job as up_part
 
 from cloudinit import cloud
+from cloudinit import config
 from cloudinit import distros
 from cloudinit import helpers
 from cloudinit import importer
 from cloudinit import log as logging
 from cloudinit import sources
-from cloudinit import transforms
 from cloudinit import util
 
 LOG = logging.getLogger(__name__)
@@ -319,8 +321,10 @@ class Init(object):
     
         # Add the path to the plugins dir to the top of our list for import
         # instance dir should be read before cloud-dir
-        sys.path.insert(0, cdir)
-        sys.path.insert(0, idir)
+        if cdir and cdir not in sys.path:
+            sys.path.insert(0, cdir)
+        if idir and idir not in sys.path:
+            sys.path.insert(0, idir)
 
         # Ensure datasource fetched before activation (just incase)
         user_data_msg = self.datasource.get_userdata()
@@ -378,7 +382,7 @@ class Init(object):
             called.append(mod)
 
 
-class Transforms(object):
+class Modules(object):
     def __init__(self, init, cfg_files=None):
         self.datasource = init.datasource
         self.cfg_files = cfg_files
@@ -392,7 +396,7 @@ class Transforms(object):
         # None check to avoid empty case
         if self._cached_cfg is None:
             self._cached_cfg = self._get_config()
-            LOG.debug("Loading 'transform' config %s", self._cached_cfg)
+            LOG.debug("Loading 'module' config %s", self._cached_cfg)
         return self._cached_cfg
 
     def _get_config(self):
@@ -419,7 +423,7 @@ class Transforms(object):
 
         return util.mergemanydict(t_cfgs)
 
-    def _read_transforms(self, name):
+    def _read_modules(self, name):
         module_list = []
         if name not in self.cfg:
             return module_list
@@ -464,28 +468,28 @@ class Transforms(object):
                                  (item, util.obj_name(item)))
         return module_list
 
-    def _fixup_transforms(self, raw_mods):
+    def _fixup_modules(self, raw_mods):
         mostly_mods = []
         for raw_mod in raw_mods:
             raw_name = raw_mod['mod']
             freq = raw_mod.get('freq')
             run_args = raw_mod.get('args') or []
-            mod_name = transforms.form_transform_name(raw_name)
+            mod_name = config.form_module_name(raw_name)
             if not mod_name:
                 continue
             if freq and freq not in FREQUENCIES:
-                LOG.warn(("Config specified transform %s"
+                LOG.warn(("Config specified module %s"
                           " has an unknown frequency %s"), raw_name, freq)
                 # Reset it so when ran it will get set to a known value
                 freq = None
-            mod = transforms.fixup_transform(importer.import_module(mod_name))
+            mod = config.fixup_module(importer.import_module(mod_name))
             mostly_mods.append([mod, raw_name, freq, run_args])
         return mostly_mods
 
-    def _run_transforms(self, mostly_mods):
+    def _run_modules(self, mostly_mods):
         failures = []
         d_name = self.init.distro.name
-        c_cloud = self.init.cloudify()
+        cc = self.init.cloudify()
         am_ran = 0
         for (mod, name, freq, args) in mostly_mods:
             try:
@@ -496,54 +500,36 @@ class Transforms(object):
                     freq = PER_INSTANCE
                 worked_distros = mod.distros
                 if (worked_distros and d_name not in worked_distros):
-                    LOG.warn(("Transform %s is verified on %s distros"
+                    LOG.warn(("Module %s is verified on %s distros"
                               " but not on %s distro. It may or may not work"
                               " correctly."), name, worked_distros, d_name)
                 # Deep copy the config so that modules can't alter it
                 # Use the transforms logger and not our own
                 func_args = [name, copy.deepcopy(self.cfg),
-                             c_cloud, transforms.LOG, args]
+                             cc, config.LOG, args]
                 # Mark it as having started running
                 am_ran += 1
                 # This name will affect the semaphore name created
                 run_name = "config-%s" % (name)
-                c_cloud.run(run_name, mod.handle, func_args, freq=freq)
+                cc.run(run_name, mod.handle, func_args, freq=freq)
             except Exception as e:
                 util.logexc(LOG, "Running %s (%s) failed", name, mod)
                 failures.append((name, e))
         return (am_ran, failures)
 
-    def find_transform(self, tr_name, sections):
-        found_where = []
-        for n in sections:
-            mods = self._read_transforms(n)
-            for mod_info in mods:
-                if mod_info.get('mod') == tr_name:
-                    found_where.append(n)
-        return found_where
-
-    def run_single(self, tr_name, section, args=None, freq=None):
-        mods = self._read_transforms(section)
-        mod_tr = None
-        for mod_info in mods:
-            if mod_info.get('mod') == tr_name:
-                mod_tr = mod_info
-                break
-        if not mod_tr:
-            # Nothing to run, does that transform exist there??
-            return (0, 0)
-        else:
-            # Adjust the module
-            if args:
-                mod_tr['args'] = args
-            if freq:
-                mod_tr['freq'] = freq
-            # Now resume doing the normal fixups and running
-            raw_mods = [mod_tr]
-            mostly_mods = self._fixup_transforms(raw_mods)
-            return self._run_transforms(mostly_mods)
+    def run_single(self, mod_name, args=None, freq=None):
+        # Form the users module 'specs'
+        mod_to_be = {
+            'mod': mod_name,
+            'args': args,
+            'freq': freq,
+        }
+        # Now resume doing the normal fixups and running
+        raw_mods = [mod_to_be]
+        mostly_mods = self._fixup_modules(raw_mods)
+        return self._run_modules(mostly_mods)
 
     def run_section(self, section_name):
-        raw_mods = self._read_transforms(section_name)
-        mostly_mods = self._fixup_transforms(raw_mods)
-        return self._run_transforms(mostly_mods)
+        raw_mods = self._read_modules(section_name)
+        mostly_mods = self._fixup_modules(raw_mods)
+        return self._run_modules(mostly_mods)

From ea70a98476ffd9b78c2c4250e0b583bc2834b74b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 17:13:55 -0700
Subject: [PATCH 264/434] Massive pylint + pep8 fixups!

---
 bin/cloud-init                              | 20 +++++------
 cloudinit/cloud.py                          |  3 +-
 cloudinit/config/__init__.py                |  2 +-
 cloudinit/config/cc_chef.py                 | 14 ++++----
 cloudinit/config/cc_disable_ec2_metadata.py |  4 +--
 cloudinit/config/cc_final_message.py        |  8 ++---
 cloudinit/config/cc_foo.py                  |  8 ++---
 cloudinit/config/cc_keys_to_console.py      |  8 ++---
 cloudinit/config/cc_landscape.py            |  2 +-
 cloudinit/config/cc_mcollective.py          |  4 +--
 cloudinit/config/cc_mounts.py               | 13 ++++---
 cloudinit/config/cc_phone_home.py           | 11 ++++--
 cloudinit/config/cc_puppet.py               |  2 +-
 cloudinit/config/cc_resizefs.py             | 10 +++---
 cloudinit/config/cc_salt_minion.py          |  2 +-
 cloudinit/config/cc_scripts_per_boot.py     |  6 ++--
 cloudinit/config/cc_scripts_per_instance.py |  6 ++--
 cloudinit/config/cc_scripts_per_once.py     |  6 ++--
 cloudinit/config/cc_scripts_user.py         |  6 ++--
 cloudinit/config/cc_set_passwords.py        |  4 +--
 cloudinit/config/cc_ssh.py                  | 39 +++++++++++----------
 cloudinit/distros/__init__.py               |  1 -
 cloudinit/distros/rhel.py                   | 14 ++++----
 cloudinit/distros/ubuntu.py                 |  6 ++--
 cloudinit/handlers/__init__.py              |  8 ++---
 cloudinit/helpers.py                        |  6 ++--
 cloudinit/log.py                            |  2 --
 cloudinit/settings.py                       |  2 +-
 cloudinit/sources/DataSourceCloudStack.py   |  2 +-
 cloudinit/sources/DataSourceConfigDrive.py  |  2 +-
 cloudinit/sources/DataSourceEc2.py          |  6 ++--
 cloudinit/sources/DataSourceMAAS.py         |  1 +
 cloudinit/sources/DataSourceNoCloud.py      |  2 +-
 cloudinit/ssh_util.py                       |  5 ++-
 cloudinit/stages.py                         |  6 ++--
 cloudinit/url_helper.py                     | 14 ++++----
 cloudinit/user_data.py                      | 28 +++++++--------
 cloudinit/util.py                           | 37 +++++++++----------
 38 files changed, 159 insertions(+), 161 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index 032d5f39..c1788ef4 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -75,6 +75,7 @@ def welcome(action):
     sys.stderr.flush()
     LOG.info(welcome_msg)
 
+
 def extract_fns(args):
     # Files are already opened so lets just pass that along
     # since it would of broke if it couldn't have
@@ -329,11 +330,11 @@ def main_single(name, args):
 
 def main():
     parser = argparse.ArgumentParser()
-    
+
     # Top level args
-    parser.add_argument('--version', '-v', action='version', 
+    parser.add_argument('--version', '-v', action='version',
                         version='%(prog)s ' + (version.version_string()))
-    parser.add_argument('--file', '-f', action='append', 
+    parser.add_argument('--file', '-f', action='append',
                         dest='files',
                         help=('additional yaml configuration'
                               ' files to use'),
@@ -345,18 +346,18 @@ def main():
     subparsers = parser.add_subparsers()
 
     # Each action and its sub-options (if any)
-    parser_init = subparsers.add_parser('init', 
+    parser_init = subparsers.add_parser('init',
                                         help=('initializes cloud-init and'
                                               ' performs initial modules'))
     parser_init.add_argument("--local", '-l', action='store_true',
                              help="start in local mode (default: %(default)s)",
                              default=False)
-    # This is used so that we can know which action is selected + 
+    # This is used so that we can know which action is selected +
     # the functor to use to run this subcommand
     parser_init.set_defaults(action=('init', main_init))
 
     # These settings are used for the 'config' and 'final' stages
-    parser_mod = subparsers.add_parser('modules', 
+    parser_mod = subparsers.add_parser('modules',
                                       help=('activates modules '
                                             'using a given configuration key'))
     parser_mod.add_argument("--mode", '-m', action='store',
@@ -368,7 +369,7 @@ def main():
 
     # These settings are used when you want to query information
     # stored in the cloud-init data objects/directories/files
-    parser_query = subparsers.add_parser('query', 
+    parser_query = subparsers.add_parser('query',
                                          help=('query information stored '
                                                'in cloud-init'))
     parser_query.add_argument("--name", '-n', action="store",
@@ -378,7 +379,7 @@ def main():
     parser_query.set_defaults(action=('query', main_query))
 
     # This subcommand allows you to run a single module
-    parser_single = subparsers.add_parser('single', 
+    parser_single = subparsers.add_parser('single',
                                          help=('run a single module '))
     parser_single.set_defaults(action=('single', main_single))
     parser_single.add_argument("--name", '-n', action="store",
@@ -394,10 +395,10 @@ def main():
                                     ' pass to this module'))
     parser_single.set_defaults(action=('single', main_single))
 
-
     args = parser.parse_args()
 
     # Setup basic logging to start (until reinitialized)
+    # iff in debug mode...
     if args.debug:
         logging.setupBasicLogging()
 
@@ -407,4 +408,3 @@ def main():
 
 if __name__ == '__main__':
     sys.exit(main())
-
diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index 90679202..6cdcb76a 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -38,6 +38,7 @@ LOG = logging.getLogger(__name__)
 # as providing a backwards compatible object that can be maintained
 # while the stages/other objects can be worked on independently...
 
+
 class Cloud(object):
     def __init__(self, datasource, paths, cfg, distro, runners):
         self.datasource = datasource
@@ -71,7 +72,7 @@ class Cloud(object):
     # The rest of thes are just useful proxies
     def get_userdata(self):
         return self.datasource.get_userdata()
-    
+
     def get_instance_id(self):
         return self.datasource.get_instance_id()
 
diff --git a/cloudinit/config/__init__.py b/cloudinit/config/__init__.py
index 74e2f275..02e32462 100644
--- a/cloudinit/config/__init__.py
+++ b/cloudinit/config/__init__.py
@@ -25,7 +25,7 @@ from cloudinit import log as logging
 
 LOG = logging.getLogger(__name__)
 
-# This prefix is used to make it less 
+# This prefix is used to make it less
 # of a change that when importing
 # we will not find something else with the same
 # name in the lookup path...
diff --git a/cloudinit/config/cc_chef.py b/cloudinit/config/cc_chef.py
index 4e8ef346..74af2a7e 100644
--- a/cloudinit/config/cc_chef.py
+++ b/cloudinit/config/cc_chef.py
@@ -24,7 +24,7 @@ import os
 from cloudinit import templater
 from cloudinit import util
 
-ruby_version_default = "1.8"
+RUBY_VERSION_DEFAULT = "1.8"
 
 
 def handle(name, cfg, cloud, log, _args):
@@ -38,11 +38,11 @@ def handle(name, cfg, cloud, log, _args):
 
     # Ensure the chef directories we use exist
     c_dirs = [
-        '/etc/chef', 
-        '/var/log/chef', 
-        '/var/lib/chef', 
-        '/var/cache/chef', 
-        '/var/backups/chef', 
+        '/etc/chef',
+        '/var/log/chef',
+        '/var/lib/chef',
+        '/var/cache/chef',
+        '/var/backups/chef',
         '/var/run/chef',
     ]
     for d in c_dirs:
@@ -92,7 +92,7 @@ def handle(name, cfg, cloud, log, _args):
             # this will install and run the chef-client from gems
             chef_version = util.get_cfg_option_str(chef_cfg, 'version', None)
             ruby_version = util.get_cfg_option_str(chef_cfg, 'ruby_version',
-                                                   ruby_version_default)
+                                                   RUBY_VERSION_DEFAULT)
             install_chef_from_gems(cloud.distro, ruby_version, chef_version)
             # and finally, run chef-client
             log.debug('Running chef-client')
diff --git a/cloudinit/config/cc_disable_ec2_metadata.py b/cloudinit/config/cc_disable_ec2_metadata.py
index c7d26029..62cca7cc 100644
--- a/cloudinit/config/cc_disable_ec2_metadata.py
+++ b/cloudinit/config/cc_disable_ec2_metadata.py
@@ -24,13 +24,13 @@ from cloudinit.settings import PER_ALWAYS
 
 frequency = PER_ALWAYS
 
-reject_cmd = ['route', 'add', '-host', '169.254.169.254', 'reject']
+REJECT_CMD = ['route', 'add', '-host', '169.254.169.254', 'reject']
 
 
 def handle(name, cfg, _cloud, log, _args):
     disabled = util.get_cfg_option_bool(cfg, "disable_ec2_metadata", False)
     if disabled:
-        util.subp(reject_cmd)
+        util.subp(REJECT_CMD)
     else:
         log.debug(("Skipping transform named %s,"
                    " disabling the ec2 route not enabled"), name)
diff --git a/cloudinit/config/cc_final_message.py b/cloudinit/config/cc_final_message.py
index c257b6d0..fd59aa1e 100644
--- a/cloudinit/config/cc_final_message.py
+++ b/cloudinit/config/cc_final_message.py
@@ -28,7 +28,7 @@ from cloudinit.settings import PER_ALWAYS
 
 frequency = PER_ALWAYS
 
-final_message_def = ("Cloud-init v. {{version}} finished at {{timestamp}}."
+FINAL_MESSAGE_DEF = ("Cloud-init v. {{version}} finished at {{timestamp}}."
                      " Up {{uptime}} seconds.")
 
 
@@ -39,21 +39,21 @@ def handle(_name, cfg, cloud, log, args):
         msg_in = args[0]
     else:
         msg_in = util.get_cfg_option_str(cfg, "final_message")
-    
+
     if not msg_in:
         template_fn = cloud.get_template_filename('final_message')
         if template_fn:
             msg_in = util.load_file(template_fn)
 
     if not msg_in:
-        msg_in = final_message_def
+        msg_in = FINAL_MESSAGE_DEF
 
     uptime = util.uptime()
     ts = util.time_rfc2822()
     cver = version.version_string()
     try:
         subs = {
-            'uptime': uptime, 
+            'uptime': uptime,
             'timestamp': ts,
             'version': cver,
         }
diff --git a/cloudinit/config/cc_foo.py b/cloudinit/config/cc_foo.py
index 99135704..e81e7faa 100644
--- a/cloudinit/config/cc_foo.py
+++ b/cloudinit/config/cc_foo.py
@@ -30,19 +30,19 @@ from cloudinit.settings import PER_INSTANCE
 #    as well as any datasource provided configuration
 #    c) A cloud object that can be used to access various
 #    datasource and paths for the given distro and data provided
-#    by the various datasource instance types. 
+#    by the various datasource instance types.
 #    d) A argument list that may or may not be empty to this module.
 #    Typically those are from module configuration where the module
 #    is defined with some extra configuration that will eventually
 #    be translated from yaml into arguments to this module.
 # 2. A optional 'frequency' that defines how often this module should be ran.
-#    Typically one of PER_INSTANCE, PER_ALWAYS, PER_ONCE. If not 
-#    provided PER_INSTANCE will be assumed. 
+#    Typically one of PER_INSTANCE, PER_ALWAYS, PER_ONCE. If not
+#    provided PER_INSTANCE will be assumed.
 #    See settings.py for these constants.
 # 3. A optional 'distros' array/set/tuple that defines the known distros
 #    this module will work with (if not all of them). This is used to write
 #    a warning out if a module is being ran on a untested distribution for
-#    informational purposes. If non existent all distros are assumed and 
+#    informational purposes. If non existent all distros are assumed and
 #    no warning occurs.
 
 frequency = PER_INSTANCE
diff --git a/cloudinit/config/cc_keys_to_console.py b/cloudinit/config/cc_keys_to_console.py
index 40758198..a8fb3ba7 100644
--- a/cloudinit/config/cc_keys_to_console.py
+++ b/cloudinit/config/cc_keys_to_console.py
@@ -26,13 +26,13 @@ from cloudinit import util
 frequency = PER_INSTANCE
 
 # This is a tool that cloud init provides
-helper_tool = '/usr/lib/cloud-init/write-ssh-key-fingerprints'
+HELPER_TOOL = '/usr/lib/cloud-init/write-ssh-key-fingerprints'
 
 
 def handle(name, cfg, cloud, log, _args):
-    if not os.path.exists(helper_tool):
+    if not os.path.exists(HELPER_TOOL):
         log.warn(("Unable to activate transform %s,"
-                  " helper tool not found at %s"), name, helper_tool)
+                  " helper tool not found at %s"), name, HELPER_TOOL)
         return
 
     fp_blacklist = util.get_cfg_option_list(cfg,
@@ -42,7 +42,7 @@ def handle(name, cfg, cloud, log, _args):
                                               ["ssh-dss"])
 
     try:
-        cmd = [helper_tool]
+        cmd = [HELPER_TOOL]
         cmd.append(','.join(fp_blacklist))
         cmd.append(','.join(key_blacklist))
         (stdout, _stderr) = util.subp(cmd)
diff --git a/cloudinit/config/cc_landscape.py b/cloudinit/config/cc_landscape.py
index 29ce41b9..599276a7 100644
--- a/cloudinit/config/cc_landscape.py
+++ b/cloudinit/config/cc_landscape.py
@@ -62,7 +62,7 @@ def handle(name, cfg, cloud, log, _args):
     ls_cloudcfg = cfg.get("landscape", {})
 
     if not isinstance(ls_cloudcfg, dict):
-        raise Exception(("'landscape' key existed in config," 
+        raise Exception(("'landscape' key existed in config,"
                          " but not a dictionary type,"
                          " is a %s instead"), util.obj_name(ls_cloudcfg))
 
diff --git a/cloudinit/config/cc_mcollective.py b/cloudinit/config/cc_mcollective.py
index 4cec6494..ba5e13ca 100644
--- a/cloudinit/config/cc_mcollective.py
+++ b/cloudinit/config/cc_mcollective.py
@@ -52,7 +52,7 @@ def handle(name, cfg, cloud, log, _args):
         # It doesn't contain any sections so just add one temporarily
         # Use a hash id based off the contents,
         # just incase of conflicts... (try to not have any...)
-        # This is so that an error won't occur when reading (and no 
+        # This is so that an error won't occur when reading (and no
         # sections exist in the file)
         section_tpl = "[nullsection_%s]"
         attempts = 0
@@ -85,7 +85,7 @@ def handle(name, cfg, cloud, log, _args):
         # the previous server.cfg and create our new one
         old_fn = "%s.old" % (server_cfg_fn)
         util.rename(server_cfg_fn, old_fn)
-        # Now we got the whole file, write to disk except the section 
+        # Now we got the whole file, write to disk except the section
         # we added so that config parser won't error out when trying to read.
         # Note below, that we've just used ConfigParser because it generally
         # works.  Below, we remove the initial 'nullsection' header.
diff --git a/cloudinit/config/cc_mounts.py b/cloudinit/config/cc_mounts.py
index 700fbc44..ab097c2a 100644
--- a/cloudinit/config/cc_mounts.py
+++ b/cloudinit/config/cc_mounts.py
@@ -24,10 +24,10 @@ import re
 
 from cloudinit import util
 
-# shortname matches 'sda', 'sda1', 'xvda', 'hda', 'sdb', xvdb, vda, vdd1
-shortname_filter = r"^[x]{0,1}[shv]d[a-z][0-9]*$"
-shortname = re.compile(shortname_filter)
-ws = re.compile("[%s]+" % (whitespace))
+# Shortname matches 'sda', 'sda1', 'xvda', 'hda', 'sdb', xvdb, vda, vdd1
+SHORTNAME_FILTER = r"^[x]{0,1}[shv]d[a-z][0-9]*$"
+SHORTNAME = re.compile(SHORTNAME_FILTER)
+WS = re.compile("[%s]+" % (whitespace))
 
 
 def is_mdname(name):
@@ -55,7 +55,6 @@ def handle(_name, cfg, cloud, log, _args):
     if "mounts" in cfg:
         cfgmnt = cfg["mounts"]
 
-    
     for i in range(len(cfgmnt)):
         # skip something that wasn't a list
         if not isinstance(cfgmnt[i], list):
@@ -85,7 +84,7 @@ def handle(_name, cfg, cloud, log, _args):
                 cfgmnt[i][0] = renamed
                 log.debug("Mapped metadata name %s to %s", startname, renamed)
         else:
-            if shortname.match(startname):
+            if SHORTNAME.match(startname):
                 renamed = "/dev/%s" % startname
                 log.debug("Mapped shortname name %s to %s", startname, renamed)
                 cfgmnt[i][0] = renamed
@@ -171,7 +170,7 @@ def handle(_name, cfg, cloud, log, _args):
     fstab = util.load_file(cloud.paths.join(True, "/etc/fstab"))
     for line in fstab.splitlines():
         try:
-            toks = ws.split(line)
+            toks = WS.split(line)
             if toks[3].find(comment) != -1:
                 continue
         except:
diff --git a/cloudinit/config/cc_phone_home.py b/cloudinit/config/cc_phone_home.py
index a8752527..dcb07b66 100644
--- a/cloudinit/config/cc_phone_home.py
+++ b/cloudinit/config/cc_phone_home.py
@@ -26,8 +26,13 @@ from cloudinit.settings import PER_INSTANCE
 
 frequency = PER_INSTANCE
 
-post_list_all = ['pub_key_dsa', 'pub_key_rsa', 'pub_key_ecdsa',
-                 'instance_id', 'hostname']
+POST_LIST_ALL = [
+    'pub_key_dsa',
+    'pub_key_rsa',
+    'pub_key_ecdsa',
+    'instance_id',
+    'hostname'
+]
 
 
 # phone_home:
@@ -63,7 +68,7 @@ def handle(name, cfg, cloud, log, args):
                           " is not an integer, using %s instead"), tries)
 
     if post_list == "all":
-        post_list = post_list_all
+        post_list = POST_LIST_ALL
 
     all_keys = {}
     all_keys['instance_id'] = cloud.get_instance_id()
diff --git a/cloudinit/config/cc_puppet.py b/cloudinit/config/cc_puppet.py
index 5fb88bf2..5154efba 100644
--- a/cloudinit/config/cc_puppet.py
+++ b/cloudinit/config/cc_puppet.py
@@ -63,7 +63,7 @@ def handle(name, cfg, cloud, log, _args):
                 util.ensure_dir(pp_ssl_dir, 0771)
                 util.chownbyid(pp_ssl_dir,
                                pwd.getpwnam('puppet').pw_uid, 0)
-                pp_ssl_certs = cloud.paths.join(False, 
+                pp_ssl_certs = cloud.paths.join(False,
                                                 '/var/lib/puppet/ssl/certs/')
                 util.ensure_dir(pp_ssl_certs)
                 util.chownbyid(pp_ssl_certs,
diff --git a/cloudinit/config/cc_resizefs.py b/cloudinit/config/cc_resizefs.py
index 1690094a..c019989e 100644
--- a/cloudinit/config/cc_resizefs.py
+++ b/cloudinit/config/cc_resizefs.py
@@ -27,7 +27,7 @@ from cloudinit.settings import PER_ALWAYS
 
 frequency = PER_ALWAYS
 
-resize_fs_prefixes_cmds = [
+RESIZE_FS_PREFIXES_CMDS = [
     ('ext', 'resize2fs'),
     ('xfs', 'xfs_growfs'),
 ]
@@ -89,16 +89,16 @@ def handle(name, cfg, cloud, log, args):
         # occurs this temporary file will still benefit from
         # auto deletion
         tfh.unlink_now()
-    
+
         st_dev = nodeify_path(devpth, resize_what, log)
         fs_type = get_fs_type(st_dev, devpth, log)
         if not fs_type:
             log.warn("Could not determine filesystem type of %s", resize_what)
             return
-    
+
         resizer = None
         fstype_lc = fs_type.lower()
-        for (pfix, root_cmd) in resize_fs_prefixes_cmds:
+        for (pfix, root_cmd) in RESIZE_FS_PREFIXES_CMDS:
             if fstype_lc.startswith(pfix):
                 resizer = root_cmd
                 break
@@ -112,7 +112,7 @@ def handle(name, cfg, cloud, log, args):
         resize_cmd = [resizer, devpth]
 
         if resize_root == "noblock":
-            # Fork to a child that will run 
+            # Fork to a child that will run
             # the resize command
             util.fork_cb(do_resize, resize_cmd, log)
             # Don't delete the file now in the parent
diff --git a/cloudinit/config/cc_salt_minion.py b/cloudinit/config/cc_salt_minion.py
index 16f5286d..986e6db6 100644
--- a/cloudinit/config/cc_salt_minion.py
+++ b/cloudinit/config/cc_salt_minion.py
@@ -32,7 +32,7 @@ def handle(name, cfg, cloud, log, _args):
 
     # Start by installing the salt package ...
     cloud.distro.install_packages(["salt"])
-    
+
     # Ensure we can configure files at the right dir
     config_dir = salt_cfg.get("config_dir", '/etc/salt')
     config_dir = cloud.paths.join(False, config_dir)
diff --git a/cloudinit/config/cc_scripts_per_boot.py b/cloudinit/config/cc_scripts_per_boot.py
index 364e1d02..d3c47442 100644
--- a/cloudinit/config/cc_scripts_per_boot.py
+++ b/cloudinit/config/cc_scripts_per_boot.py
@@ -26,16 +26,16 @@ from cloudinit.settings import PER_ALWAYS
 
 frequency = PER_ALWAYS
 
-script_subdir = 'per-boot'
+SCRIPT_SUBDIR = 'per-boot'
 
 
 def handle(name, _cfg, cloud, log, _args):
     # Comes from the following:
     # https://forums.aws.amazon.com/thread.jspa?threadID=96918
-    runparts_path = os.path.join(cloud.get_cpath(), 'scripts', script_subdir)
+    runparts_path = os.path.join(cloud.get_cpath(), 'scripts', SCRIPT_SUBDIR)
     try:
         util.runparts(runparts_path)
     except:
         log.warn("Failed to run transform %s (%s in %s)",
-                 name, script_subdir, runparts_path)
+                 name, SCRIPT_SUBDIR, runparts_path)
         raise
diff --git a/cloudinit/config/cc_scripts_per_instance.py b/cloudinit/config/cc_scripts_per_instance.py
index d75ab47d..8e428ac2 100644
--- a/cloudinit/config/cc_scripts_per_instance.py
+++ b/cloudinit/config/cc_scripts_per_instance.py
@@ -26,16 +26,16 @@ from cloudinit.settings import PER_INSTANCE
 
 frequency = PER_INSTANCE
 
-script_subdir = 'per-instance'
+SCRIPT_SUBDIR = 'per-instance'
 
 
 def handle(name, _cfg, cloud, log, _args):
     # Comes from the following:
     # https://forums.aws.amazon.com/thread.jspa?threadID=96918
-    runparts_path = os.path.join(cloud.get_cpath(), 'scripts', script_subdir)
+    runparts_path = os.path.join(cloud.get_cpath(), 'scripts', SCRIPT_SUBDIR)
     try:
         util.runparts(runparts_path)
     except:
         log.warn("Failed to run transform %s (%s in %s)",
-                 name, script_subdir, runparts_path)
+                 name, SCRIPT_SUBDIR, runparts_path)
         raise
diff --git a/cloudinit/config/cc_scripts_per_once.py b/cloudinit/config/cc_scripts_per_once.py
index 80f8c325..e7a29a44 100644
--- a/cloudinit/config/cc_scripts_per_once.py
+++ b/cloudinit/config/cc_scripts_per_once.py
@@ -26,16 +26,16 @@ from cloudinit.settings import PER_ONCE
 
 frequency = PER_ONCE
 
-script_subdir = 'per-once'
+SCRIPT_SUBDIR = 'per-once'
 
 
 def handle(name, _cfg, cloud, log, _args):
     # Comes from the following:
     # https://forums.aws.amazon.com/thread.jspa?threadID=96918
-    runparts_path = os.path.join(cloud.get_cpath(), 'scripts', script_subdir)
+    runparts_path = os.path.join(cloud.get_cpath(), 'scripts', SCRIPT_SUBDIR)
     try:
         util.runparts(runparts_path)
     except:
         log.warn("Failed to run transform %s (%s in %s)",
-                 name, script_subdir, runparts_path)
+                 name, SCRIPT_SUBDIR, runparts_path)
         raise
diff --git a/cloudinit/config/cc_scripts_user.py b/cloudinit/config/cc_scripts_user.py
index f4fe3a2a..1ff05aae 100644
--- a/cloudinit/config/cc_scripts_user.py
+++ b/cloudinit/config/cc_scripts_user.py
@@ -26,17 +26,17 @@ from cloudinit.settings import PER_INSTANCE
 
 frequency = PER_INSTANCE
 
-script_subdir = 'scripts'
+SCRIPT_SUBDIR = 'scripts'
 
 
 def handle(name, _cfg, cloud, log, _args):
     # This is written to by the user data handlers
     # Ie, any custom shell scripts that come down
     # go here...
-    runparts_path = os.path.join(cloud.get_ipath_cur(), script_subdir)
+    runparts_path = os.path.join(cloud.get_ipath_cur(), SCRIPT_SUBDIR)
     try:
         util.runparts(runparts_path)
     except:
         log.warn("Failed to run transform %s (%s in %s)",
-                 name, script_subdir, runparts_path)
+                 name, SCRIPT_SUBDIR, runparts_path)
         raise
diff --git a/cloudinit/config/cc_set_passwords.py b/cloudinit/config/cc_set_passwords.py
index e7049f22..ce17f357 100644
--- a/cloudinit/config/cc_set_passwords.py
+++ b/cloudinit/config/cc_set_passwords.py
@@ -25,7 +25,7 @@ from cloudinit import util
 from string import letters, digits  # pylint: disable=W0402
 
 # We are removing certain 'painful' letters/numbers
-pw_set = (letters.translate(None, 'loLOI') +
+PW_SET = (letters.translate(None, 'loLOI') +
           digits.translate(None, '01'))
 
 
@@ -148,4 +148,4 @@ def handle(_name, cfg, cloud, log, args):
 
 
 def rand_user_password(pwlen=9):
-    return util.rand_str(pwlen, select_from=pw_set)
+    return util.rand_str(pwlen, select_from=PW_SET)
diff --git a/cloudinit/config/cc_ssh.py b/cloudinit/config/cc_ssh.py
index e5e99560..4019ae90 100644
--- a/cloudinit/config/cc_ssh.py
+++ b/cloudinit/config/cc_ssh.py
@@ -24,11 +24,11 @@ import glob
 from cloudinit import util
 from cloudinit import ssh_util
 
-DISABLE_ROOT_OPTS = ( "no-port-forwarding,no-agent-forwarding," 
-"no-X11-forwarding,command=\"echo \'Please login as the user \\\"$USER\\\" " 
+DISABLE_ROOT_OPTS = ("no-port-forwarding,no-agent-forwarding,"
+"no-X11-forwarding,command=\"echo \'Please login as the user \\\"$USER\\\" "
 "rather than the user \\\"root\\\".\';echo;sleep 10\"")
 
-key2file = {
+KEY_2_FILE = {
     "rsa_private": ("/etc/ssh/ssh_host_rsa_key", 0600),
     "rsa_public": ("/etc/ssh/ssh_host_rsa_key.pub", 0644),
     "dsa_private": ("/etc/ssh/ssh_host_dsa_key", 0600),
@@ -37,15 +37,17 @@ key2file = {
     "ecdsa_public": ("/etc/ssh/ssh_host_ecdsa_key.pub", 0644),
 }
 
-priv2pub = {
-    'rsa_private': 'rsa_public', 
+PRIV_2_PUB = {
+    'rsa_private': 'rsa_public',
     'dsa_private': 'dsa_public',
     'ecdsa_private': 'ecdsa_public',
 }
 
-key_gen_tpl = 'o=$(ssh-keygen -yf "%s") && echo "$o" root@localhost > "%s"'
+KEY_GEN_TPL = 'o=$(ssh-keygen -yf "%s") && echo "$o" root@localhost > "%s"'
 
-generate_keys = ['rsa', 'dsa', 'ecdsa']
+GENERATE_KEY_NAMES = ['rsa', 'dsa', 'ecdsa']
+
+KEY_FILE_TPL = '/etc/ssh/ssh_host_%s_key'
 
 
 def handle(_name, cfg, cloud, log, _args):
@@ -58,21 +60,21 @@ def handle(_name, cfg, cloud, log, _args):
                 util.del_file(f)
             except:
                 util.logexc(log, "Failed deleting key file %s", f)
-    
+
     if "ssh_keys" in cfg:
         # if there are keys in cloud-config, use them
         for (key, val) in cfg["ssh_keys"].iteritems():
-            if key in key2file:
-                tgt_fn = key2file[key][0]
-                tgt_perms = key2file[key][1]
+            if key in KEY_2_FILE:
+                tgt_fn = KEY_2_FILE[key][0]
+                tgt_perms = KEY_2_FILE[key][1]
                 util.write_file(cloud.paths.join(False, tgt_fn),
                                 val, tgt_perms)
 
-        for (priv, pub) in priv2pub.iteritems():
+        for (priv, pub) in PRIV_2_PUB.iteritems():
             if pub in cfg['ssh_keys'] or not priv in cfg['ssh_keys']:
                 continue
-            pair = (key2file[priv][0], key2file[pub][0])
-            cmd = ['sh', '-xc', key_gen_tpl % pair]
+            pair = (KEY_2_FILE[priv][0], KEY_2_FILE[pub][0])
+            cmd = ['sh', '-xc', KEY_GEN_TPL % pair]
             try:
                 # TODO: Is this guard needed?
                 with util.SeLinuxGuard("/etc/ssh", recursive=True):
@@ -84,12 +86,11 @@ def handle(_name, cfg, cloud, log, _args):
     else:
         # if not, generate them
         genkeys = util.get_cfg_option_list(cfg,
-                                            'ssh_genkeytypes', 
-                                            generate_keys)
+                                           'ssh_genkeytypes',
+                                           GENERATE_KEY_NAMES)
         for keytype in genkeys:
-            keyfile = '/etc/ssh/ssh_host_%s_key' % (keytype)
-            keyfile = cloud.paths.join(False, keyfile)
-            util.ensure_dir(os.path.dirname(keyfile)) 
+            keyfile = cloud.paths.join(False, KEY_FILE_TPL % (keytype))
+            util.ensure_dir(os.path.dirname(keyfile))
             if not os.path.exists(keyfile):
                 cmd = ['ssh-keygen', '-t', keytype, '-N', '', '-f', keyfile]
                 try:
diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index 45dd85ec..25a60c52 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -157,4 +157,3 @@ def fetch(distro_name, mods=(__name__, )):
                            % (distro_name))
     distro_cls = getattr(mod, 'Distro')
     return distro_cls
-    
diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index b67ae5b8..5cbefa6e 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -35,7 +35,7 @@ class Distro(distros.Distro):
 
     def __init__(self, name, cfg, paths):
         distros.Distro.__init__(self, name, cfg, paths)
-    
+
     def install_packages(self, pkglist):
         self.package_command('install', pkglist)
 
@@ -210,12 +210,12 @@ class Distro(distros.Distro):
     def package_command(self, command, args=None):
         cmd = ['yum']
         # If enabled, then yum will be tolerant of errors on the command line
-        # with regard to packages. 
-        # For example: if you request to install foo, bar and baz and baz is 
+        # with regard to packages.
+        # For example: if you request to install foo, bar and baz and baz is
         # installed; yum won't error out complaining that baz is already
-        # installed. 
+        # installed.
         cmd.append("-t")
-        # Determines whether or not yum prompts for confirmation 
+        # Determines whether or not yum prompts for confirmation
         # of critical actions. We don't want to prompt...
         cmd.append("-y")
         cmd.append(command)
@@ -223,8 +223,8 @@ class Distro(distros.Distro):
             cmd.extend(args)
         # Allow the output of this to flow outwards (ie not be captured)
         util.subp(cmd, capture=False)
-        
-        
+
+
 # This is a util function to translate a ubuntu /etc/network/interfaces 'blob'
 # to a rhel equiv. that can then be written to /etc/sysconfig/network-scripts/
 # TODO remove when we have python-netcf active...
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index 5a1b572e..fd7b7b8d 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -36,11 +36,11 @@ class Distro(distros.Distro):
 
     def __init__(self, name, cfg, paths):
         distros.Distro.__init__(self, name, cfg, paths)
-        # This will be used to restrict certain 
+        # This will be used to restrict certain
         # calls from repeatly happening (when they
         # should only happen say once per instance...)
         self._runner = helpers.Runners(paths)
-    
+
     def install_packages(self, pkglist):
         self._update_package_sources()
         self.package_command('install', pkglist)
@@ -131,4 +131,4 @@ class Distro(distros.Distro):
 
     def _update_package_sources(self):
         self._runner.run("update-sources", self.package_command,
-                         ["update"], freq=PER_INSTANCE)
\ No newline at end of file
+                         ["update"], freq=PER_INSTANCE)
diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index c6f2119c..d52b1cba 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -104,7 +104,7 @@ def run_part(mod, data, ctype, filename, payload, frequency):
     except:
         mod_ver = 1
     try:
-        LOG.debug("Calling handler %s (%s, %s, %s) with frequency %s", 
+        LOG.debug("Calling handler %s (%s, %s, %s) with frequency %s",
                   mod, ctype, filename, mod_ver, frequency)
         if mod_ver >= 2:
             # Treat as v. 2 which does get a frequency
@@ -114,7 +114,7 @@ def run_part(mod, data, ctype, filename, payload, frequency):
             mod.handle_part(data, ctype, filename, payload)
     except:
         util.logexc(LOG, ("Failed calling handler %s (%s, %s, %s)"
-                         " with frequency %s"), 
+                         " with frequency %s"),
                     mod, ctype, filename,
                     mod_ver, frequency)
 
@@ -178,7 +178,7 @@ def walker_callback(pdata, ctype, filename, payload):
                  payload, pdata['frequency'])
 
 
-# Callback is a function that will be called with 
+# Callback is a function that will be called with
 # (data, content_type, filename, payload)
 def walk(msg, callback, data):
     partnum = 0
@@ -226,5 +226,3 @@ def type_from_starts_with(payload, default=None):
         if payload_lc.startswith(text):
             return INCLUSION_TYPES_MAP[text]
     return default
-
-
diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 45633e0f..4447d1ee 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -84,7 +84,7 @@ class FileSemaphores(object):
         try:
             util.del_dir(self.sem_path)
         except (IOError, OSError):
-            util.logexc(LOG, "Failed deleting semaphore directory %s", 
+            util.logexc(LOG, "Failed deleting semaphore directory %s",
                         self.sem_path)
 
     def _acquire(self, name, freq):
@@ -212,7 +212,7 @@ class Paths(object):
         self.cfgs = path_cfgs
         # Populate all the initial paths
         self.cloud_dir = self.join(False,
-                                   path_cfgs.get('cloud_dir', 
+                                   path_cfgs.get('cloud_dir',
                                                  '/var/lib/cloud'))
         self.instance_link = os.path.join(self.cloud_dir, 'instance')
         self.boot_finished = os.path.join(self.instance_link, "boot-finished")
@@ -237,7 +237,7 @@ class Paths(object):
         # Set when a datasource becomes active
         self.datasource = ds
 
-    # joins the paths but also appends a read 
+    # joins the paths but also appends a read
     # or write root if available
     def join(self, read_only, *paths):
         if read_only:
diff --git a/cloudinit/log.py b/cloudinit/log.py
index 478946f8..fc1428a2 100644
--- a/cloudinit/log.py
+++ b/cloudinit/log.py
@@ -20,7 +20,6 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-
 import logging
 import logging.handlers
 import logging.config
@@ -53,7 +52,6 @@ def setupBasicLogging():
     root.setLevel(DEBUG)
 
 
-
 def setupLogging(cfg=None):
     # See if the config provides any logging conf...
     if not cfg:
diff --git a/cloudinit/settings.py b/cloudinit/settings.py
index 8a1eaeb3..fac9b862 100644
--- a/cloudinit/settings.py
+++ b/cloudinit/settings.py
@@ -47,7 +47,7 @@ CFG_BUILTIN = {
         'paths': {
             'cloud_dir': '/var/lib/cloud',
             'templates_dir': '/etc/cloud/templates/',
-        }, 
+        },
         'distro': 'ubuntu',
     },
 }
diff --git a/cloudinit/sources/DataSourceCloudStack.py b/cloudinit/sources/DataSourceCloudStack.py
index b1817654..83c577e6 100644
--- a/cloudinit/sources/DataSourceCloudStack.py
+++ b/cloudinit/sources/DataSourceCloudStack.py
@@ -121,7 +121,7 @@ class DataSourceCloudStack(sources.DataSource):
                 None, self.metadata_address)
             self.metadata = boto_utils.get_instance_metadata(self.api_ver,
                 self.metadata_address)
-            LOG.debug("Crawl of metadata service took %s seconds", 
+            LOG.debug("Crawl of metadata service took %s seconds",
                       int(time.time() - start_time))
             return True
         except Exception:
diff --git a/cloudinit/sources/DataSourceConfigDrive.py b/cloudinit/sources/DataSourceConfigDrive.py
index 5da1ffea..9905dad4 100644
--- a/cloudinit/sources/DataSourceConfigDrive.py
+++ b/cloudinit/sources/DataSourceConfigDrive.py
@@ -36,7 +36,7 @@ CFG_DRIVE_FILES = [
     "meta.js",
 ]
 DEFAULT_METADATA = {
-    "instance-id": DEFAULT_IID, 
+    "instance-id": DEFAULT_IID,
     "dsmode": DEFAULT_MODE,
 }
 CFG_DRIVE_DEV_ENV = 'CLOUD_INIT_CONFIG_DRIVE_DEVICE'
diff --git a/cloudinit/sources/DataSourceEc2.py b/cloudinit/sources/DataSourceEc2.py
index 55447102..0598dfa2 100644
--- a/cloudinit/sources/DataSourceEc2.py
+++ b/cloudinit/sources/DataSourceEc2.py
@@ -38,7 +38,7 @@ DEF_MD_URL = "http://169.254.169.254"
 DEF_MD_VERSION = '2009-04-04'
 
 # Default metadata urls that will be used if none are provided
-# They will be checked for 'resolveability' and some of the 
+# They will be checked for 'resolveability' and some of the
 # following may be discarded if they do not resolve
 DEF_MD_URLS = [DEF_MD_URL, "http://instance-data:8773"]
 
@@ -69,7 +69,7 @@ class DataSourceEc2(sources.DataSource):
                 None, self.metadata_address)
             self.metadata = boto_utils.get_instance_metadata(self.api_ver,
                 self.metadata_address)
-            LOG.debug("Crawl of metadata service took %s seconds", 
+            LOG.debug("Crawl of metadata service took %s seconds",
                        int(time.time() - start_time))
             return True
         except Exception:
@@ -201,7 +201,7 @@ class DataSourceEc2(sources.DataSource):
             return None
 
         # Example:
-        # 'block-device-mapping': 
+        # 'block-device-mapping':
         # {'ami': '/dev/sda1',
         # 'ephemeral0': '/dev/sdb',
         # 'root': '/dev/sda1'}
diff --git a/cloudinit/sources/DataSourceMAAS.py b/cloudinit/sources/DataSourceMAAS.py
index bb8fbac1..104e7a54 100644
--- a/cloudinit/sources/DataSourceMAAS.py
+++ b/cloudinit/sources/DataSourceMAAS.py
@@ -251,6 +251,7 @@ datasources = [
   (DataSourceMAAS, (sources.DEP_FILESYSTEM, sources.DEP_NETWORK)),
 ]
 
+
 # Return a list of data sources that match this set of dependencies
 def get_datasource_list(depends):
     return sources.list_from_depends(depends, datasources)
diff --git a/cloudinit/sources/DataSourceNoCloud.py b/cloudinit/sources/DataSourceNoCloud.py
index 2b016d1c..8499a97c 100644
--- a/cloudinit/sources/DataSourceNoCloud.py
+++ b/cloudinit/sources/DataSourceNoCloud.py
@@ -154,7 +154,7 @@ class DataSourceNoCloud(sources.DataSource):
             (self.dsmode in ("local", seeded_interfaces))):
             LOG.info("Updating network interfaces from %s", self)
             self.distro.apply_network(md['network-interfaces'])
-            
+
         if md['dsmode'] == self.dsmode:
             self.seed = ",".join(found)
             self.metadata = md
diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index fef3d40f..45dd5535 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -103,10 +103,10 @@ class AuthKeyLineParser(object):
             elif curc == '"':
                 quoted = not quoted
             i = i + 1
-    
+
         options = ent[0:i]
         options_lst = []
-        
+
         # Now use a csv parser to pull the options
         # out of the above string that we just found an endpoint for.
         #
@@ -211,7 +211,6 @@ def update_authorized_keys(fname, keys):
 
 
 def setup_user_keys(keys, user, key_prefix, paths):
-    
     # Make sure the users .ssh dir is setup accordingly
     pwent = pwd.getpwnam(user)
     ssh_dir = os.path.join(pwent.pw_dir, '.ssh')
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index ae6e2de5..84a965c2 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -287,7 +287,7 @@ class Init(object):
 
     def cloudify(self):
         # Form the needed options to cloudify our members
-        return cloud.Cloud(self.datasource, 
+        return cloud.Cloud(self.datasource,
                            self.paths, self.cfg,
                            self.distro, helpers.Runners(self.paths))
 
@@ -318,7 +318,7 @@ class Init(object):
     def consume(self, frequency=PER_INSTANCE):
         cdir = self.paths.get_cpath("handlers")
         idir = self.paths.get_ipath("handlers")
-    
+
         # Add the path to the plugins dir to the top of our list for import
         # instance dir should be read before cloud-dir
         if cdir and cdir not in sys.path:
@@ -417,7 +417,7 @@ class Modules(object):
             except:
                 util.logexc(LOG, ("Failed loading of datasource"
                                   " config object from %s"), self.datasource)
-        
+
         if self.base_cfg:
             t_cfgs.append(self.base_cfg)
 
diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 1c583eba..223278ce 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -47,11 +47,11 @@ class UrlResponse(object):
     @property
     def contents(self):
         return self._contents
-    
+
     @property
     def headers(self):
         return self._headers
-    
+
     def __str__(self):
         if not self.contents:
             return ''
@@ -66,7 +66,7 @@ class UrlResponse(object):
             return True
         else:
             return False
-    
+
 
 def readurl(url, data=None, timeout=None,
             retries=0, sec_between=1, headers=None):
@@ -89,8 +89,8 @@ def readurl(url, data=None, timeout=None,
 
     excepts = []
     LOG.info(("Attempting to open '%s' with %s attempts"
-                " (%s retries, timeout=%s) to be performed"), 
-             url, attempts, retries, timeout)
+              " (%s retries, timeout=%s) to be performed"),
+              url, attempts, retries, timeout)
     open_args = {}
     if timeout is not None:
         open_args['timeout'] = int(timeout)
@@ -112,7 +112,7 @@ def readurl(url, data=None, timeout=None,
             excepts.append(e)
         except urllib2.URLError as e:
             # This can be a message string or
-            # another exception instance 
+            # another exception instance
             # (socket.error for remote URLs, OSError for local URLs).
             if (isinstance(e.reason, (OSError)) and
                 e.reason.errno == errno.ENOENT):
@@ -128,7 +128,7 @@ def readurl(url, data=None, timeout=None,
 
     # Didn't work out
     LOG.warn("Failed reading from %s after %s attempts", url, attempts)
-    
+
     # It must of errored at least once for code
     # to get here so re-raise the last error
     LOG.debug("%s errors occured, re-raising the last one", len(excepts))
diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index b7902d44..4babb8e5 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -65,33 +65,33 @@ class UserDataProcessor(object):
             # multipart/* are just containers
             if part.get_content_maintype() == 'multipart':
                 continue
-    
+
             ctype = None
             ctype_orig = part.get_content_type()
             payload = part.get_payload(decode=True)
-    
+
             if not ctype_orig:
                 ctype_orig = UNDEF_TYPE
-    
+
             if ctype_orig in TYPE_NEEDED:
                 ctype = handlers.type_from_starts_with(payload)
-    
+
             if ctype is None:
                 ctype = ctype_orig
-    
+
             if ctype in INCLUDE_TYPES:
                 self._do_include(payload, append_msg)
                 continue
-    
+
             if ctype in ARCHIVE_TYPES:
                 self._explode_archive(payload, append_msg)
                 continue
-    
+
             if 'Content-Type' in base_msg:
                 base_msg.replace_header('Content-Type', ctype)
             else:
                 base_msg['Content-Type'] = ctype
-    
+
             self._attach_part(append_msg, part)
 
     def _get_include_once_filename(self, entry):
@@ -108,8 +108,8 @@ class UserDataProcessor(object):
             lc_line = line.lower()
             if lc_line.startswith("#include-once"):
                 line = line[len("#include-once"):].lstrip()
-                # Every following include will now 
-                # not be refetched.... but will be 
+                # Every following include will now
+                # not be refetched.... but will be
                 # re-read from a local urlcache (if it worked)
                 include_once_on = True
             elif lc_line.startswith("#include"):
@@ -190,10 +190,10 @@ class UserDataProcessor(object):
         """
         if ATTACHMENT_FIELD not in outer_msg:
             outer_msg[ATTACHMENT_FIELD] = '0'
-    
+
         if new_count is not None:
             outer_msg.replace_header(ATTACHMENT_FIELD, str(new_count))
-    
+
         fetched_count = 0
         try:
             fetched_count = int(outer_msg.get(ATTACHMENT_FIELD))
@@ -234,7 +234,3 @@ def convert_string(raw_data, headers=None):
         msg = MIMEBase(maintype, subtype, *headers)
         msg.set_payload(data)
     return msg
-
-
-
-
diff --git a/cloudinit/util.py b/cloudinit/util.py
index 91d20a76..56c01fab 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -35,7 +35,7 @@ import pwd
 import random
 import shutil
 import socket
-import string # pylint: disable=W0402
+import string  # pylint: disable=W0402
 import subprocess
 import sys
 import tempfile
@@ -153,13 +153,15 @@ def SilentTemporaryFile(**kwargs):
     # file to unlink has been unlinked elsewhere..
     LOG.debug("Created temporary file %s", fh.name)
     fh.unlink = del_file
-    # Add a new method that will unlink 
+
+    # Add a new method that will unlink
     # right 'now' but still lets the exit
     # method attempt to remove it (which will
     # not throw due to our del file being quiet
     # about files that are not there)
     def unlink_now():
         fh.unlink(fh.name)
+
     setattr(fh, 'unlink_now', unlink_now)
     return fh
 
@@ -199,7 +201,7 @@ def is_false_str(val, addons=None):
 
 def translate_bool(val, addons=None):
     if not val:
-        # This handles empty lists and false and 
+        # This handles empty lists and false and
         # other things that python believes are false
         return False
     # If its already a boolean skip
@@ -214,7 +216,6 @@ def rand_str(strlen=32, select_from=None):
     return "".join([random.choice(select_from) for _x in range(0, strlen)])
 
 
-
 def read_conf(fname):
     try:
         return load_yaml(load_file(fname), default={})
@@ -275,7 +276,7 @@ def is_ipv4(instr):
 
 def merge_base_cfg(cfgfile, cfg_builtin=None):
     syscfg = read_conf_with_confd(cfgfile)
-    
+
     kern_contents = read_cc_from_cmdline()
     kerncfg = {}
     if kern_contents:
@@ -575,7 +576,7 @@ def load_yaml(blob, default=None, allowed=(dict,)):
     try:
         blob = str(blob)
         LOG.debug(("Attempting to load yaml from string "
-                 "of length %s with allowed root types %s"), 
+                 "of length %s with allowed root types %s"),
                  len(blob), allowed)
         converted = yaml.load(blob)
         if not isinstance(converted, allowed):
@@ -625,7 +626,7 @@ def read_conf_d(confd):
 
     # remove anything not ending in '.cfg'
     confs = [f for f in confs if f.endswith(".cfg")]
-    
+
     # remove anything not a file
     confs = [f for f in confs if os.path.isfile(os.path.join(confd, f))]
 
@@ -726,9 +727,9 @@ def get_fqdn_from_hosts(hostname, filename="/etc/hosts"):
     """
     For each host a single line should be present with
       the following information:
-    
-	     IP_address canonical_hostname [aliases...]
-    
+
+        IP_address canonical_hostname [aliases...]
+
       Fields of the entry are separated by any number of  blanks  and/or  tab
       characters.  Text  from	a "#" character until the end of the line is a
       comment, and is ignored.	 Host  names  may  contain  only  alphanumeric
@@ -747,7 +748,7 @@ def get_fqdn_from_hosts(hostname, filename="/etc/hosts"):
             if not line:
                 continue
 
-            # If there there is less than 3 entries 
+            # If there there is less than 3 entries
             # (IP_address, canonical_hostname, alias)
             # then ignore this line
             toks = line.split()
@@ -829,7 +830,7 @@ def close_stdin():
         os.dup2(fp.fileno(), sys.stdin.fileno())
 
 
-def find_devs_with(criteria=None, oformat='device', 
+def find_devs_with(criteria=None, oformat='device',
                     tag=None, no_cache=False, path=None):
     """
     find devices matching given criteria (via blkid)
@@ -841,23 +842,23 @@ def find_devs_with(criteria=None, oformat='device',
     blk_id_cmd = ['blkid']
     options = []
     if criteria:
-        # Search for block devices with tokens named NAME that 
+        # Search for block devices with tokens named NAME that
         # have the value 'value' and display any devices which are found.
         # Common values for NAME include  TYPE, LABEL, and UUID.
         # If there are no devices specified on the command line,
-        # all block devices will be searched; otherwise, 
+        # all block devices will be searched; otherwise,
         # only search the devices specified by the user.
         options.append("-t%s" % (criteria))
     if tag:
         # For each (specified) device, show only the tags that match tag.
         options.append("-s%s" % (tag))
     if no_cache:
-        # If you want to start with a clean cache 
-        # (i.e. don't report devices previously scanned 
+        # If you want to start with a clean cache
+        # (i.e. don't report devices previously scanned
         # but not necessarily available at this time), specify /dev/null.
         options.extend(["-c", "/dev/null"])
     if oformat:
-        # Display blkid's output using the specified format. 
+        # Display blkid's output using the specified format.
         # The format parameter may be:
         # full, value, list, device, udev, export
         options.append('-o%s' % (oformat))
@@ -1104,7 +1105,7 @@ def mounts():
                 (dev, mp, fstype, opts, _freq, _passno) = mpline.split()
             except:
                 continue
-            # If the name of the mount point contains spaces these 
+            # If the name of the mount point contains spaces these
             # can be escaped as '\040', so undo that..
             mp = mp.replace("\\040", " ")
             mounted[dev] = {

From 812971e7dc5b50a4c0fb85b78dde1e91fe9b04c1 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 17:32:03 -0700
Subject: [PATCH 265/434] Use setuptools instead of distutils, this seems to be
 needed for requirements to work

---
 setup.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/setup.py b/setup.py
index d2e022f0..45207af9 100755
--- a/setup.py
+++ b/setup.py
@@ -25,7 +25,7 @@ from glob import glob
 import os
 import re
 
-from distutils.core import setup
+import setuptools
 
 
 def is_f(p):
@@ -62,7 +62,7 @@ def requires(fn='Requires'):
     return requires
 
 
-setup(name='cloud-init',
+setuptools.setup(name='cloud-init',
       version=versions()[0],
       description='EC2 initialisation magic',
       author='Scott Moser',

From 0e7181d28610abf3eb0fdc685abd2d4adb13f2d4 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 17:34:36 -0700
Subject: [PATCH 266/434] Fix secondary config subdir name

---
 setup.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/setup.py b/setup.py
index 45207af9..b55ec4ff 100755
--- a/setup.py
+++ b/setup.py
@@ -71,7 +71,7 @@ setuptools.setup(name='cloud-init',
       # This second package referencing cloudinit.conf.*
       # makes the config modules accessible to the whole
       # import system...
-      packages=['cloudinit', 'cloudinit.conf'],
+      packages=['cloudinit', 'cloudinit.config'],
       scripts=['bin/cloud-init',
                'tools/cloud-init-per',
                ],

From f70046b813d6723966fc096181e2f7033fa63137 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 17:45:45 -0700
Subject: [PATCH 267/434] Add a license and use find_packages to locate the
 needed packages

---
 setup.py | 6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

diff --git a/setup.py b/setup.py
index b55ec4ff..81468943 100755
--- a/setup.py
+++ b/setup.py
@@ -68,13 +68,11 @@ setuptools.setup(name='cloud-init',
       author='Scott Moser',
       author_email='scott.moser@canonical.com',
       url='http://launchpad.net/cloud-init/',
-      # This second package referencing cloudinit.conf.*
-      # makes the config modules accessible to the whole
-      # import system...
-      packages=['cloudinit', 'cloudinit.config'],
+      packages=setuptools.find_packages(exclude=['tests']),
       scripts=['bin/cloud-init',
                'tools/cloud-init-per',
                ],
+      license='GPLv3',
       data_files=[('/etc/cloud', glob('config/*.cfg')),
                   ('/etc/cloud/cloud.cfg.d', glob('config/cloud.cfg.d/*')),
                   ('/etc/cloud/templates', glob('templates/*')),

From 0b9a130b3875b7ba8e30cdb196dfc70e1b92d48c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 23:39:46 -0700
Subject: [PATCH 268/434] No need for this now that we have the imports done
 correctly

---
 bin/cloud-init | 6 ------
 1 file changed, 6 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index c1788ef4..c4633bdf 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -32,12 +32,6 @@ possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
 if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
     sys.path.insert(0, possible_topdir)
 
-# This is so config modules can be found
-if os.path.exists(os.path.join(possible_topdir,
-                 "cloudinit", 'config', "__init__.py")):
-    sys.path.insert(0, os.path.join(possible_topdir, 'cloudinit', 'config'))
-
-
 from cloudinit import log as logging
 from cloudinit import netinfo
 from cloudinit import settings

From 47360ed84384ae9bc648ccd7e4b76f704dc38142 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 23:40:00 -0700
Subject: [PATCH 269/434] 1. Add an importer function that will search for a
 given module in a set of search module 'prefixes'    that also has a
 potential set of required attributes. 2. Use this new importer to find the
 distro class, the userdata handler modules, the config modules    and the
 datasource modules, if none can be found error out accordingly.

---
 cloudinit/config/__init__.py   |  4 ----
 cloudinit/distros/__init__.py  | 23 ++++++++----------
 cloudinit/handlers/__init__.py |  8 -------
 cloudinit/importer.py          | 44 +++++++++++++++++++++++++++-------
 cloudinit/sources/__init__.py  | 34 +++++++++-----------------
 cloudinit/stages.py            | 22 +++++++++++++----
 6 files changed, 74 insertions(+), 61 deletions(-)

diff --git a/cloudinit/config/__init__.py b/cloudinit/config/__init__.py
index 02e32462..ab13045f 100644
--- a/cloudinit/config/__init__.py
+++ b/cloudinit/config/__init__.py
@@ -51,10 +51,6 @@ def fixup_module(mod, def_freq=PER_INSTANCE):
         freq = mod.frequency
         if freq and freq not in FREQUENCIES:
             LOG.warn("Module %s has an unknown frequency %s", mod, freq)
-    if not hasattr(mod, 'handle'):
-        def empty_handle(_name, _cfg, _cloud, _log, _args):
-            pass
-        setattr(mod, 'handle', empty_handle)
     if not hasattr(mod, 'distros'):
         setattr(mod, 'distros', None)
     return mod
diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index 25a60c52..e0ef6ee0 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -144,16 +144,13 @@ class Distro(object):
             return False
 
 
-def fetch(distro_name, mods=(__name__, )):
-    mod = None
-    for m in mods:
-        mod_name = "%s.%s" % (m, distro_name)
-        try:
-            mod = importer.import_module(mod_name)
-        except ImportError:
-            pass
-    if not mod:
-        raise RuntimeError("No distribution found for distro %s"
-                           % (distro_name))
-    distro_cls = getattr(mod, 'Distro')
-    return distro_cls
+def fetch(name):
+    locs = importer.find_module(name,
+                                ['', __name__],
+                                ['Distro'])
+    if not locs:
+        raise ImportError("No distribution found for distro %s"
+                           % (name))
+    mod = importer.import_module(locs[0])
+    cls = getattr(mod, 'Distro')
+    return cls
diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index d52b1cba..0f7432e5 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -202,20 +202,12 @@ def walk(msg, callback, data):
 def fixup_handler(mod, def_freq=PER_INSTANCE):
     if not hasattr(mod, "handler_version"):
         setattr(mod, "handler_version", 1)
-    if not hasattr(mod, 'list_types'):
-        def empty_types():
-            return []
-        setattr(mod, 'list_types', empty_types)
     if not hasattr(mod, 'frequency'):
         setattr(mod, 'frequency', def_freq)
     else:
         freq = mod.frequency
         if freq and freq not in FREQUENCIES:
             LOG.warn("Handler %s has an unknown frequency %s", mod, freq)
-    if not hasattr(mod, 'handle_part'):
-        def empty_handler(_data, _ctype, _filename, _payload):
-            pass
-        setattr(mod, 'handle_part', empty_handler)
     return mod
 
 
diff --git a/cloudinit/importer.py b/cloudinit/importer.py
index a36b87bc..71cf2726 100644
--- a/cloudinit/importer.py
+++ b/cloudinit/importer.py
@@ -23,17 +23,43 @@
 import sys
 
 from cloudinit import log as logging
-from cloudinit import util
 
 LOG = logging.getLogger(__name__)
 
 
-# Simple wrapper that allows us to add more logging in...
 def import_module(module_name):
-    try:
-        LOG.debug("Attempting to import module %s", module_name)
-        __import__(module_name)
-        return sys.modules[module_name]
-    except:
-        util.logexc(LOG, 'Failed at importing %s', module_name)
-        raise
+    __import__(module_name)
+    return sys.modules[module_name]
+
+
+def find_module(base_name, search_paths, required_attrs=None):
+    found_places = []
+    if not required_attrs:
+        required_attrs = []
+    real_paths = []
+    for path in search_paths:
+        real_path = []
+        if path:
+            real_path.extend(path.split("."))
+        real_path.append(base_name)
+        full_path = '.'.join(real_path)
+        real_paths.append(full_path)
+    LOG.debug("Looking for modules %s that have attributes %s",
+              real_paths, required_attrs)
+    for full_path in real_paths:
+        mod = None
+        try:
+            mod = import_module(full_path)
+        except ImportError:
+            pass
+        if not mod:
+            continue
+        found_attrs = 0
+        for attr in required_attrs:
+            if hasattr(mod, attr):
+                found_attrs += 1
+        if found_attrs == len(required_attrs):
+            found_places.append(full_path)
+    LOG.debug("Found %s with attributes %s in %s", base_name,
+              required_attrs, found_places)
+    return found_places
diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 8ab7cf54..42e924b0 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -191,31 +191,19 @@ def list_sources(cfg_list, depends, pkg_list):
     LOG.info(("Looking for for data source in: %s,"
               " via packages %s that matches dependencies %s"),
              cfg_list, pkg_list, depends)
-    for ds_coll in cfg_list:
-        ds_name = str(ds_coll)
+    for ds_name in cfg_list:
         if not ds_name.startswith(DS_PREFIX):
             ds_name = '%s%s' % (DS_PREFIX, ds_name)
-        for pkg in pkg_list:
-            pkg_name = []
-            if pkg:
-                # Any package name given, this affects
-                # the lookup path
-                pkg_name.append(str(pkg))
-            pkg_name.append(ds_name)
-            try:
-                mod = importer.import_module(".".join(pkg_name))
-            except ImportError:
-                continue
-            lister = getattr(mod, "get_datasource_list", None)
-            if not lister:
-                continue
-            cls_matches = lister(depends)
-            if not cls_matches:
-                continue
-            src_list.extend(cls_matches)
-            LOG.debug(("Found a match"
-                       " in %s with matches %s"), mod, cls_matches)
-            break
+        m_locs = importer.find_module(ds_name,
+                                      pkg_list,
+                                      ['get_datasource_list'])
+        for m_loc in m_locs:
+            mod = importer.import_module(m_loc)
+            lister = getattr(mod, "get_datasource_list")
+            matches = lister(depends)
+            if matches:
+                src_list.extend(matches)
+                break
     return src_list
 
 
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 84a965c2..1997301a 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -205,7 +205,7 @@ class Init(object):
         # Any config provided???
         pkg_list = self.cfg.get('datasource_pkg_list') or []
         # Add the defaults at the end
-        for n in [util.obj_name(sources), '']:
+        for n in ['', util.obj_name(sources)]:
             if n not in pkg_list:
                 pkg_list.append(n)
         cfg_list = self.cfg.get('datasource_list') or []
@@ -334,9 +334,17 @@ class Init(object):
 
         # Add handlers in cdir
         potential_handlers = util.find_modules(cdir)
-        for (fname, modname) in potential_handlers.iteritems():
+        for (fname, mod_name) in potential_handlers.iteritems():
             try:
-                mod = handlers.fixup_handler(importer.import_module(modname))
+                mod_locs = importer.find_module(mod_name, [''],
+                                                ['list_types',
+                                                 'handle_part'])
+                if not mod_locs:
+                    LOG.warn(("Could not find a valid user-data handler"
+                              " named %s in file %s"), mod_name, fname)
+                    continue
+                mod = importer.import_module(mod_locs[0])
+                mod = handlers.fixup_handler(mod)
                 types = c_handlers.register(mod)
                 LOG.debug("Added handler for %s from %s", types, fname)
             except:
@@ -482,7 +490,13 @@ class Modules(object):
                           " has an unknown frequency %s"), raw_name, freq)
                 # Reset it so when ran it will get set to a known value
                 freq = None
-            mod = config.fixup_module(importer.import_module(mod_name))
+            mod_locs = importer.find_module(mod_name,
+                                            ['', util.obj_name(config)],
+                                            ['handle'])
+            if not mod_locs:
+                LOG.warn("Could not find module named %s", mod_name)
+                continue
+            mod = config.fixup_module(importer.import_module(mod_locs[0]))
             mostly_mods.append([mod, raw_name, freq, run_args])
         return mostly_mods
 

From 795b56d98c0db707a045231d15d3d0a6c19e69a9 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 23:57:30 -0700
Subject: [PATCH 270/434] 1. Shorten the passed in name for frequency (and
 expand it later) 2. For single modules, if it doesn't run, print a warning
 and exit with a return code of 1

---
 bin/cloud-init | 25 ++++++++++++++++---------
 1 file changed, 16 insertions(+), 9 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index c4633bdf..a2f15c4b 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -52,6 +52,13 @@ QUERY_DATA_TYPES = [
     'instance_id',
 ]
 
+# Frequency shortname to full name
+FREQ_SHORT_NAMES = {
+    'instance': settings.PER_INSTANCE,
+    'always': settings.PER_ALWAYS,
+    'once': settings.PER_ONCE,
+}
+
 LOG = logging.getLogger()
 
 
@@ -294,6 +301,7 @@ def main_single(name, args):
     mod_freq = args.frequency
     if mod_freq:
         LOG.debug("Using passed in frequency %s", mod_freq)
+        mod_freq = FREQ_SHORT_NAMES.get(mod_freq)
     # Stage 3
     try:
         LOG.debug("Closing stdin")
@@ -308,15 +316,14 @@ def main_single(name, args):
         logging.resetLogging()
     logging.setupLogging(mods.cfg)
     # Stage 4
-    try:
-        (_run_am, failures) = mods.run_single(mod_name,
-                                              mod_args,
-                                              mod_freq)
-    except ImportError:
-        util.logexc(LOG, "Failed at importing module %s", mod_name)
-        return 1
+    (run_am, failures) = mods.run_single(mod_name,
+                                         mod_args,
+                                         mod_freq)
     if failures:
-        LOG.debug("Ran %s but it failed", mod_name)
+        LOG.warn("Ran %s but it failed!", mod_name)
+        return 1
+    elif run_am == 0:
+        LOG.warn("Did not run %s, does it exist?", mod_name)
         return 1
     else:
         return 0
@@ -382,7 +389,7 @@ def main():
     parser_single.add_argument("--frequency", action="store",
                               help=("frequency of the module"),
                               required=False,
-                              choices=settings.FREQUENCIES)
+                              choices=list(FREQ_SHORT_NAMES.keys()))
     parser_single.add_argument("module_args", nargs="*",
                               metavar='argument',
                               help=('any additional arguments to'

From a27179157a93bbadfe1f9cfb11cbff570ee5e6ee Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 23:58:29 -0700
Subject: [PATCH 271/434] 1. Add a dummy lock object + a file lock object 2.
 Use this object when returning semaphores 3. Adjust the debug statement to
 show this object

---
 cloudinit/helpers.py | 17 +++++++++++++----
 1 file changed, 13 insertions(+), 4 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 4447d1ee..b6974f3c 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -40,13 +40,17 @@ class LockFailure(Exception):
     pass
 
 
+class DummyLock(object):
+    pass
+
+
 class DummySemaphores(object):
     def __init__(self):
         pass
 
     @contextlib.contextmanager
     def lock(self, _name, _freq, _clear_on_fail=False):
-        yield True
+        yield DummyLock()
 
     def has_run(self, _name, _freq):
         return False
@@ -58,6 +62,11 @@ class DummySemaphores(object):
         pass
 
 
+class FileLock(object):
+    def __init__(self, fn):
+        self.fn = fn
+
+
 class FileSemaphores(object):
     def __init__(self, sem_path):
         self.sem_path = sem_path
@@ -101,7 +110,7 @@ class FileSemaphores(object):
         except (IOError, OSError):
             util.logexc(LOG, "Failed writing semaphore file %s", sem_file)
             return None
-        return sem_file
+        return FileLock(sem_file)
 
     def has_run(self, name, freq):
         if not freq or freq == PER_ALWAYS:
@@ -158,8 +167,8 @@ class Runners(object):
             if not lk:
                 raise LockFailure("Failed to acquire lock for %s" % name)
             else:
-                LOG.debug("Running %s with args %s using lock %s (%s)",
-                          functor, args, util.obj_name(lk), lk)
+                LOG.debug("Running %s with args %s using lock (%s)",
+                          functor, args, lk)
                 if isinstance(args, (dict)):
                     results = functor(**args)
                 else:

From 50c42334aac1aa6f91db27429ca4caa7f50c4412 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 20 Jun 2012 23:59:24 -0700
Subject: [PATCH 272/434] Return an empty json map as default instead of an
 empty string for unknown fields

---
 tools/mock-meta.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tools/mock-meta.py b/tools/mock-meta.py
index 019a24f2..d4677af6 100755
--- a/tools/mock-meta.py
+++ b/tools/mock-meta.py
@@ -181,7 +181,7 @@ class MetaDataHandler(object):
                 else:
                     return "%s" % (PLACEMENT_CAPABILITIES.get(pentry, ''))
         else:
-            return ''
+            return '{}'
 
 class UserDataHandler(object):
 

From a6927bbaed3c217ad76cc5d21007e2b9b1673091 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Thu, 21 Jun 2012 08:38:12 -0700
Subject: [PATCH 273/434] 1. Move all info() logging methods to debug() 2.
 Adjust comment on sources list from depends 3. For the /etc/timezone
 'writing', add a header that says created by cloud-init

---
 bin/cloud-init                             |  3 +--
 cloudinit/distros/__init__.py              |  6 +++---
 cloudinit/distros/ubuntu.py                |  6 +++++-
 cloudinit/helpers.py                       |  2 +-
 cloudinit/sources/DataSourceCloudStack.py  |  2 +-
 cloudinit/sources/DataSourceConfigDrive.py |  6 ++----
 cloudinit/sources/DataSourceEc2.py         |  2 +-
 cloudinit/sources/DataSourceMAAS.py        |  2 +-
 cloudinit/sources/DataSourceNoCloud.py     |  2 +-
 cloudinit/sources/__init__.py              | 22 +++++++++++-----------
 cloudinit/url_helper.py                    | 14 +++++++-------
 11 files changed, 34 insertions(+), 33 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index a2f15c4b..d193272e 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -73,8 +73,7 @@ def welcome(action):
     }
     welcome_msg = "%s" % (templater.render_string(msg, tpl_params))
     sys.stderr.write("%s\n" % (welcome_msg))
-    sys.stderr.flush()
-    LOG.info(welcome_msg)
+    LOG.debug(welcome_msg)
 
 
 def extract_fns(args):
diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index e0ef6ee0..6325257c 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -133,14 +133,14 @@ class Distro(object):
             raise NotImplementedError("Unknown interface action %s" % (action))
         cmd = IFACE_ACTIONS[action]
         try:
-            LOG.info("Attempting to run %s interface action using command %s",
-                     action, cmd)
+            LOG.debug("Attempting to run %s interface action using command %s",
+                      action, cmd)
             (_out, err) = util.subp(cmd)
             if len(err):
                 LOG.warn("Running %s resulted in stderr output: %s", cmd, err)
             return True
         except util.ProcessExecutionError:
-            util.logexc(LOG, "Running %s failed", cmd)
+            util.logexc(LOG, "Running interface command %s failed", cmd)
             return False
 
 
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index fd7b7b8d..15af2e7f 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -112,7 +112,11 @@ class Distro(distros.Distro):
         if not os.path.isfile(tz_file):
             raise Exception(("Invalid timezone %s,"
                              " no file found at %s") % (tz, tz_file))
-        tz_contents = "%s\n" % tz
+        tz_lines = [
+            "# Created by cloud-init",
+            str(tz),
+        ]
+        tz_contents = "\n".join(tz_lines)
         tz_fn = self._paths.join(False, "/etc/timezone")
         util.write_file(tz_fn, tz_contents)
         util.copy(tz_file, self._paths.join(False, "/etc/localtime"))
diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index b6974f3c..6751f4a5 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -161,7 +161,7 @@ class Runners(object):
         if not args:
             args = []
         if sem.has_run(name, freq):
-            LOG.info("%s already ran (freq=%s)", name, freq)
+            LOG.debug("%s already ran (freq=%s)", name, freq)
             return (False, None)
         with sem.lock(name, freq, clear_on_fail) as lk:
             if not lk:
diff --git a/cloudinit/sources/DataSourceCloudStack.py b/cloudinit/sources/DataSourceCloudStack.py
index 83c577e6..751bef4f 100644
--- a/cloudinit/sources/DataSourceCloudStack.py
+++ b/cloudinit/sources/DataSourceCloudStack.py
@@ -98,7 +98,7 @@ class DataSourceCloudStack(sources.DataSource):
                                 timeout=timeout, status_cb=LOG.warn)
 
         if url:
-            LOG.info("Using metadata source: '%s'", url)
+            LOG.debug("Using metadata source: '%s'", url)
         else:
             LOG.critical(("Giving up on waiting for the metadata from %s"
                           " after %s seconds"),
diff --git a/cloudinit/sources/DataSourceConfigDrive.py b/cloudinit/sources/DataSourceConfigDrive.py
index 9905dad4..320dd1d1 100644
--- a/cloudinit/sources/DataSourceConfigDrive.py
+++ b/cloudinit/sources/DataSourceConfigDrive.py
@@ -87,10 +87,8 @@ class DataSourceConfigDrive(sources.DataSource):
         # Update interfaces and ifup only on the local datasource
         # this way the DataSourceConfigDriveNet doesn't do it also.
         if 'network-interfaces' in md and self.dsmode == "local":
-            if md['dsmode'] == "pass":
-                LOG.info("Updating network interfaces from configdrive")
-            else:
-                LOG.debug("Updating network interfaces from configdrive")
+            LOG.debug("Updating network interfaces from config drive (%s)",
+                     md['dsmode'])
             self.distro.apply_network(md['network-interfaces'])
 
         self.seed = found
diff --git a/cloudinit/sources/DataSourceEc2.py b/cloudinit/sources/DataSourceEc2.py
index 0598dfa2..cb460de1 100644
--- a/cloudinit/sources/DataSourceEc2.py
+++ b/cloudinit/sources/DataSourceEc2.py
@@ -169,7 +169,7 @@ class DataSourceEc2(sources.DataSource):
                                 timeout=timeout, status_cb=LOG.warn)
 
         if url:
-            LOG.info("Using metadata source: '%s'", url2base[url])
+            LOG.debug("Using metadata source: '%s'", url2base[url])
         else:
             LOG.critical("Giving up on md from %s after %s seconds",
                             urls, int(time.time() - start_time))
diff --git a/cloudinit/sources/DataSourceMAAS.py b/cloudinit/sources/DataSourceMAAS.py
index 104e7a54..22c90b7c 100644
--- a/cloudinit/sources/DataSourceMAAS.py
+++ b/cloudinit/sources/DataSourceMAAS.py
@@ -128,7 +128,7 @@ class DataSourceMAAS(sources.DataSource):
                                  headers_cb=self.md_headers)
 
         if url:
-            LOG.info("Using metadata source: '%s'", url)
+            LOG.debug("Using metadata source: '%s'", url)
         else:
             LOG.critical("Giving up on md from %s after %i seconds",
                             urls, int(time.time() - starttime))
diff --git a/cloudinit/sources/DataSourceNoCloud.py b/cloudinit/sources/DataSourceNoCloud.py
index 8499a97c..bed500a2 100644
--- a/cloudinit/sources/DataSourceNoCloud.py
+++ b/cloudinit/sources/DataSourceNoCloud.py
@@ -152,7 +152,7 @@ class DataSourceNoCloud(sources.DataSource):
         # ('local' for NoCloud, 'net' for NoCloudNet')
         if ('network-interfaces' in md and
             (self.dsmode in ("local", seeded_interfaces))):
-            LOG.info("Updating network interfaces from %s", self)
+            LOG.debug("Updating network interfaces from %s", self)
             self.distro.apply_network(md['network-interfaces'])
 
         if md['dsmode'] == self.dsmode:
diff --git a/cloudinit/sources/__init__.py b/cloudinit/sources/__init__.py
index 42e924b0..b25724a5 100644
--- a/cloudinit/sources/__init__.py
+++ b/cloudinit/sources/__init__.py
@@ -166,7 +166,7 @@ class DataSource(object):
 def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
     ds_list = list_sources(cfg_list, ds_deps, pkg_list)
     ds_names = [util.obj_name(f) for f in ds_list]
-    LOG.info("Searching for data source in: %s", ds_names)
+    LOG.debug("Searching for data source in: %s", ds_names)
 
     for cls in ds_list:
         try:
@@ -188,9 +188,9 @@ def find_source(sys_cfg, distro, paths, ds_deps, cfg_list, pkg_list):
 # Return an ordered list of classes that match (if any)
 def list_sources(cfg_list, depends, pkg_list):
     src_list = []
-    LOG.info(("Looking for for data source in: %s,"
-              " via packages %s that matches dependencies %s"),
-             cfg_list, pkg_list, depends)
+    LOG.debug(("Looking for for data source in: %s,"
+               " via packages %s that matches dependencies %s"),
+              cfg_list, pkg_list, depends)
     for ds_name in cfg_list:
         if not ds_name.startswith(DS_PREFIX):
             ds_name = '%s%s' % (DS_PREFIX, ds_name)
@@ -207,17 +207,17 @@ def list_sources(cfg_list, depends, pkg_list):
     return src_list
 
 
-# depends is a list of dependencies (DEP_FILESYSTEM)
-# dslist is a list of 2 item lists
-# dslist = [
+# 'depends' is a list of dependencies (DEP_FILESYSTEM)
+# ds_list is a list of 2 item lists
+# ds_list = [
 #   ( class, ( depends-that-this-class-needs ) )
 # }
-# it returns a list of 'class' that matched these deps exactly
-# it is a helper function for DataSourceCollections
-def list_from_depends(depends, dslist):
+# It returns a list of 'class' that matched these deps exactly
+# It mainly is a helper function for DataSourceCollections
+def list_from_depends(depends, ds_list):
     ret_list = []
     depset = set(depends)
-    for (cls, deps) in dslist:
+    for (cls, deps) in ds_list:
         if depset == set(deps):
             ret_list.append(cls)
     return ret_list
diff --git a/cloudinit/url_helper.py b/cloudinit/url_helper.py
index 223278ce..dbf72392 100644
--- a/cloudinit/url_helper.py
+++ b/cloudinit/url_helper.py
@@ -88,8 +88,8 @@ def readurl(url, data=None, timeout=None,
     attempts = retries + 1
 
     excepts = []
-    LOG.info(("Attempting to open '%s' with %s attempts"
-              " (%s retries, timeout=%s) to be performed"),
+    LOG.debug(("Attempting to open '%s' with %s attempts"
+               " (%s retries, timeout=%s) to be performed"),
               url, attempts, retries, timeout)
     open_args = {}
     if timeout is not None:
@@ -105,8 +105,8 @@ def readurl(url, data=None, timeout=None,
                 headers = {}
                 if rh.headers:
                     headers = dict(rh.headers)
-                LOG.info("Read from %s (%s, %sb) after %s attempts",
-                         url, status, len(content), (i + 1))
+                LOG.debug("Read from %s (%s, %sb) after %s attempts",
+                          url, status, len(content), (i + 1))
                 return UrlResponse(status, content, headers)
         except urllib2.HTTPError as e:
             excepts.append(e)
@@ -165,7 +165,7 @@ def wait_for_url(urls, max_wait=None, timeout=None,
     start_time = time.time()
 
     def log_status_cb(msg):
-        LOG.info(msg)
+        LOG.debug(msg)
 
     if status_cb is None:
         status_cb = log_status_cb
@@ -219,8 +219,8 @@ def wait_for_url(urls, max_wait=None, timeout=None,
             break
 
         loop_n = loop_n + 1
-        LOG.info("Please wait %s seconds while we wait to try again",
-                 sleep_time)
+        LOG.debug("Please wait %s seconds while we wait to try again",
+                  sleep_time)
         time.sleep(sleep_time)
 
     return False

From 5b112badba2fd093f2eab4ce8a5141cc08ca4055 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Thu, 21 Jun 2012 08:56:36 -0700
Subject: [PATCH 274/434] Move to a writable location and, when writing, also
 write to the writable location instead of the read-only one

---
 cloudinit/config/cc_mcollective.py | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/cloudinit/config/cc_mcollective.py b/cloudinit/config/cc_mcollective.py
index ba5e13ca..3fec6729 100644
--- a/cloudinit/config/cc_mcollective.py
+++ b/cloudinit/config/cc_mcollective.py
@@ -83,7 +83,7 @@ def handle(name, cfg, cloud, log, _args):
                     mcollective_config.set(cfg_name, o, v)
         # We got all our config as wanted we'll rename
         # the previous server.cfg and create our new one
-        old_fn = "%s.old" % (server_cfg_fn)
+        old_fn = cloud.paths.join(False, '/etc/mcollective/server.cfg.old')
         util.rename(server_cfg_fn, old_fn)
         # Now we got the whole file, write to disk except the section
         # we added so that config parser won't error out when trying to read.
@@ -91,7 +91,8 @@ def handle(name, cfg, cloud, log, _args):
         # works.  Below, we remove the initial 'nullsection' header.
         contents = mcollective_config.stringify()
         contents = contents.replace("%s\n" % (section_head), "")
-        util.write_file(server_cfg_fn, contents, mode=0644)
+        server_cfg_rw = cloud.paths.join(False, '/etc/mcollective/server.cfg')
+        util.write_file(server_cfg_rw, contents, mode=0644)
 
     # Start mcollective
     util.subp(['service', 'mcollective', 'start'], capture=False)

From e6e6f84fd94d44e24363f97b056caaa197d3eeb2 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Thu, 21 Jun 2012 09:12:16 -0700
Subject: [PATCH 275/434] 1. Renames for debug message from 'transform' to
 'module' 2. Fixing up more cloud.path.joins found to use the right ro/rw
 filename

---
 cloudinit/cloud.py                          |  4 ++--
 cloudinit/config/cc_apt_pipelining.py       |  6 ++++--
 cloudinit/config/cc_bootcmd.py              |  4 ++--
 cloudinit/config/cc_byobu.py                |  2 +-
 cloudinit/config/cc_ca_certs.py             |  2 +-
 cloudinit/config/cc_chef.py                 |  2 +-
 cloudinit/config/cc_disable_ec2_metadata.py |  2 +-
 cloudinit/config/cc_foo.py                  |  2 +-
 cloudinit/config/cc_keys_to_console.py      |  2 +-
 cloudinit/config/cc_landscape.py            | 11 ++++++++---
 cloudinit/config/cc_locale.py               |  2 +-
 cloudinit/config/cc_mcollective.py          |  2 +-
 cloudinit/config/cc_mounts.py               |  3 ++-
 cloudinit/config/cc_phone_home.py           |  2 +-
 cloudinit/config/cc_puppet.py               | 12 +++++++-----
 cloudinit/config/cc_resizefs.py             |  2 +-
 cloudinit/config/cc_rightscale_userdata.py  |  6 +++---
 cloudinit/config/cc_rsyslog.py              |  2 +-
 cloudinit/config/cc_runcmd.py               |  2 +-
 cloudinit/config/cc_salt_minion.py          | 10 +++++-----
 cloudinit/config/cc_scripts_per_boot.py     |  2 +-
 cloudinit/config/cc_scripts_per_instance.py |  2 +-
 cloudinit/config/cc_scripts_per_once.py     |  2 +-
 cloudinit/config/cc_scripts_user.py         |  2 +-
 cloudinit/config/cc_set_hostname.py         |  2 +-
 cloudinit/config/cc_set_passwords.py        |  4 +++-
 cloudinit/config/cc_ssh_import_id.py        |  4 ++--
 cloudinit/config/cc_timezone.py             |  2 +-
 cloudinit/config/cc_update_etc_hosts.py     |  2 +-
 cloudinit/config/cc_update_hostname.py      |  2 +-
 cloudinit/stages.py                         |  2 +-
 31 files changed, 59 insertions(+), 47 deletions(-)

diff --git a/cloudinit/cloud.py b/cloudinit/cloud.py
index 6cdcb76a..22d9167e 100644
--- a/cloudinit/cloud.py
+++ b/cloudinit/cloud.py
@@ -29,7 +29,7 @@ LOG = logging.getLogger(__name__)
 
 # This class is the high level wrapper that provides
 # access to cloud-init objects without exposing the stage objects
-# to handler and or transform manipulation. It allows for cloud
+# to handler and or module manipulation. It allows for cloud
 # init to restrict what those types of user facing code may see
 # and or adjust (which helps avoid code messing with each other)
 #
@@ -47,7 +47,7 @@ class Cloud(object):
         self._cfg = cfg
         self._runners = runners
 
-    # If a transform manipulates logging or logging services
+    # If a 'user' manipulates logging or logging services
     # it is typically useful to cause the logging to be
     # setup again.
     def cycle_logging(self):
diff --git a/cloudinit/config/cc_apt_pipelining.py b/cloudinit/config/cc_apt_pipelining.py
index f460becb..3426099e 100644
--- a/cloudinit/config/cc_apt_pipelining.py
+++ b/cloudinit/config/cc_apt_pipelining.py
@@ -25,6 +25,9 @@ distros = ['ubuntu', 'debian']
 
 DEFAULT_FILE = "/etc/apt/apt.conf.d/90cloud-init-pipelining"
 
+APT_PIPE_TPL = ("//Written by cloud-init per 'apt_pipelining'\n"
+                'Acquire::http::Pipeline-Depth "%s";\n')
+
 # Acquire::http::Pipeline-Depth can be a value
 # from 0 to 5 indicating how many outstanding requests APT should send.
 # A value of zero MUST be specified if the remote host does not properly linger
@@ -49,8 +52,7 @@ def handle(_name, cfg, cloud, log, _args):
 def write_apt_snippet(cloud, setting, log, f_name):
     """ Writes f_name with apt pipeline depth 'setting' """
 
-    file_contents = ("//Written by cloud-init per 'apt_pipelining'\n"
-                     'Acquire::http::Pipeline-Depth "%s";\n') % (setting)
+    file_contents = APT_PIPE_TPL % (setting)
 
     util.write_file(cloud.paths.join(False, f_name), file_contents)
 
diff --git a/cloudinit/config/cc_bootcmd.py b/cloudinit/config/cc_bootcmd.py
index 635e3a1f..89ccf3f1 100644
--- a/cloudinit/config/cc_bootcmd.py
+++ b/cloudinit/config/cc_bootcmd.py
@@ -30,7 +30,7 @@ frequency = PER_ALWAYS
 def handle(name, cfg, cloud, log, _args):
 
     if "bootcmd" not in cfg:
-        log.debug(("Skipping transform named %s,"
+        log.debug(("Skipping module named %s,"
                    " no 'bootcmd' key in configuration"), name)
         return
 
@@ -52,5 +52,5 @@ def handle(name, cfg, cloud, log, _args):
             util.subp(cmd, env=env, capture=False)
         except:
             util.logexc(log,
-                        ("Failed to run bootcmd transform %s"), name)
+                        ("Failed to run bootcmd module %s"), name)
             raise
diff --git a/cloudinit/config/cc_byobu.py b/cloudinit/config/cc_byobu.py
index 741aa934..38586174 100644
--- a/cloudinit/config/cc_byobu.py
+++ b/cloudinit/config/cc_byobu.py
@@ -30,7 +30,7 @@ def handle(name, cfg, _cloud, log, args):
         value = util.get_cfg_option_str(cfg, "byobu_by_default", "")
 
     if not value:
-        log.debug("Skipping transform named %s, no 'byobu' values found", name)
+        log.debug("Skipping module named %s, no 'byobu' values found", name)
         return
 
     if value == "user" or value == "system":
diff --git a/cloudinit/config/cc_ca_certs.py b/cloudinit/config/cc_ca_certs.py
index 56c41561..3221a587 100644
--- a/cloudinit/config/cc_ca_certs.py
+++ b/cloudinit/config/cc_ca_certs.py
@@ -75,7 +75,7 @@ def handle(name, cfg, cloud, log, _args):
     """
     # If there isn't a ca-certs section in the configuration don't do anything
     if "ca-certs" not in cfg:
-        log.debug(("Skipping transform named %s,"
+        log.debug(("Skipping module named %s,"
                    " no 'ca-certs' key in configuration"), name)
         return
 
diff --git a/cloudinit/config/cc_chef.py b/cloudinit/config/cc_chef.py
index 74af2a7e..d8bd85f8 100644
--- a/cloudinit/config/cc_chef.py
+++ b/cloudinit/config/cc_chef.py
@@ -31,7 +31,7 @@ def handle(name, cfg, cloud, log, _args):
 
     # If there isn't a chef key in the configuration don't do anything
     if 'chef' not in cfg:
-        log.debug(("Skipping transform named %s,"
+        log.debug(("Skipping module named %s,"
                   " no 'chef' key in configuration"), name)
         return
     chef_cfg = cfg['chef']
diff --git a/cloudinit/config/cc_disable_ec2_metadata.py b/cloudinit/config/cc_disable_ec2_metadata.py
index 62cca7cc..a7c6a75b 100644
--- a/cloudinit/config/cc_disable_ec2_metadata.py
+++ b/cloudinit/config/cc_disable_ec2_metadata.py
@@ -32,5 +32,5 @@ def handle(name, cfg, _cloud, log, _args):
     if disabled:
         util.subp(REJECT_CMD)
     else:
-        log.debug(("Skipping transform named %s,"
+        log.debug(("Skipping module named %s,"
                    " disabling the ec2 route not enabled"), name)
diff --git a/cloudinit/config/cc_foo.py b/cloudinit/config/cc_foo.py
index e81e7faa..95aab4dd 100644
--- a/cloudinit/config/cc_foo.py
+++ b/cloudinit/config/cc_foo.py
@@ -49,4 +49,4 @@ frequency = PER_INSTANCE
 
 
 def handle(name, _cfg, _cloud, log, _args):
-    log.debug("Hi from transform %s", name)
+    log.debug("Hi from module %s", name)
diff --git a/cloudinit/config/cc_keys_to_console.py b/cloudinit/config/cc_keys_to_console.py
index a8fb3ba7..d4c877f7 100644
--- a/cloudinit/config/cc_keys_to_console.py
+++ b/cloudinit/config/cc_keys_to_console.py
@@ -31,7 +31,7 @@ HELPER_TOOL = '/usr/lib/cloud-init/write-ssh-key-fingerprints'
 
 def handle(name, cfg, cloud, log, _args):
     if not os.path.exists(HELPER_TOOL):
-        log.warn(("Unable to activate transform %s,"
+        log.warn(("Unable to activate module %s,"
                   " helper tool not found at %s"), name, HELPER_TOOL)
         return
 
diff --git a/cloudinit/config/cc_landscape.py b/cloudinit/config/cc_landscape.py
index 599276a7..d45c9203 100644
--- a/cloudinit/config/cc_landscape.py
+++ b/cloudinit/config/cc_landscape.py
@@ -56,7 +56,7 @@ def handle(name, cfg, cloud, log, _args):
     """
     if not ConfigObj:
         log.warn(("'ConfigObj' support not available,"
-                  " running transform %s disabled"), name)
+                  " running module %s disabled"), name)
         return
 
     ls_cloudcfg = cfg.get("landscape", {})
@@ -66,9 +66,14 @@ def handle(name, cfg, cloud, log, _args):
                          " but not a dictionary type,"
                          " is a %s instead"), util.obj_name(ls_cloudcfg))
 
-    lsc_client_fn = cloud.paths.join(True, LSC_CLIENT_CFG_FILE)
-    merged = merge_together([LSC_BUILTIN_CFG, lsc_client_fn, ls_cloudcfg])
+    merge_data = [
+        LSC_BUILTIN_CFG,
+        cloud.paths.join(True, LSC_CLIENT_CFG_FILE),
+        ls_cloudcfg,
+    ]
+    merged = merge_together(merge_data)
 
+    lsc_client_fn = cloud.paths.join(False, LSC_CLIENT_CFG_FILE)
     lsc_dir = cloud.paths.join(False, os.path.dirname(lsc_client_fn))
     if not os.path.isdir(lsc_dir):
         util.ensure_dir(lsc_dir)
diff --git a/cloudinit/config/cc_locale.py b/cloudinit/config/cc_locale.py
index 7f273123..3fb4c5d9 100644
--- a/cloudinit/config/cc_locale.py
+++ b/cloudinit/config/cc_locale.py
@@ -49,7 +49,7 @@ def handle(name, cfg, cloud, log, args):
                                              "/etc/default/locale")
 
     if not locale:
-        log.debug(("Skipping transform named %s, "
+        log.debug(("Skipping module named %s, "
                    "no 'locale' configuration found"), name)
         return
 
diff --git a/cloudinit/config/cc_mcollective.py b/cloudinit/config/cc_mcollective.py
index 3fec6729..36a4cade 100644
--- a/cloudinit/config/cc_mcollective.py
+++ b/cloudinit/config/cc_mcollective.py
@@ -32,7 +32,7 @@ def handle(name, cfg, cloud, log, _args):
 
     # If there isn't a mcollective key in the configuration don't do anything
     if 'mcollective' not in cfg:
-        log.debug(("Skipping transform named %s, "
+        log.debug(("Skipping module named %s, "
                    "no 'mcollective' key in configuration"), name)
         return
 
diff --git a/cloudinit/config/cc_mounts.py b/cloudinit/config/cc_mounts.py
index ab097c2a..d3dcf7af 100644
--- a/cloudinit/config/cc_mounts.py
+++ b/cloudinit/config/cc_mounts.py
@@ -188,8 +188,9 @@ def handle(_name, cfg, cloud, log, _args):
             util.logexc(log, "Activating swap via 'swapon -a' failed")
 
     for d in dirs:
+        real_dir = cloud.paths.join(False, d)
         try:
-            util.ensure_dir(cloud.paths.join(False, d))
+            util.ensure_dir(real_dir)
         except:
             util.logexc(log, "Failed to make '%s' config-mount", d)
 
diff --git a/cloudinit/config/cc_phone_home.py b/cloudinit/config/cc_phone_home.py
index dcb07b66..d929eb64 100644
--- a/cloudinit/config/cc_phone_home.py
+++ b/cloudinit/config/cc_phone_home.py
@@ -53,7 +53,7 @@ def handle(name, cfg, cloud, log, args):
         ph_cfg = cfg['phone_home']
 
     if 'url' not in ph_cfg:
-        log.warn(("Skipping transform named %s, "
+        log.warn(("Skipping module named %s, "
                   "no 'url' found in 'phone_home' configuration"), name)
         return
 
diff --git a/cloudinit/config/cc_puppet.py b/cloudinit/config/cc_puppet.py
index 5154efba..467c1496 100644
--- a/cloudinit/config/cc_puppet.py
+++ b/cloudinit/config/cc_puppet.py
@@ -31,7 +31,7 @@ from cloudinit import util
 def handle(name, cfg, cloud, log, _args):
     # If there isn't a puppet key in the configuration don't do anything
     if 'puppet' not in cfg:
-        log.debug(("Skipping transform named %s,"
+        log.debug(("Skipping module named %s,"
                    " no 'puppet' configuration found"), name)
         return
 
@@ -43,7 +43,7 @@ def handle(name, cfg, cloud, log, _args):
     # ... and then update the puppet configuration
     if 'conf' in puppet_cfg:
         # Add all sections from the conf object to puppet.conf
-        puppet_conf_fn = cloud.paths.join(False, '/etc/puppet/puppet.conf')
+        puppet_conf_fn = cloud.paths.join(True, '/etc/puppet/puppet.conf')
         contents = util.load_file(puppet_conf_fn)
         # Create object for reading puppet.conf values
         puppet_config = helpers.DefaultingConfigParser()
@@ -89,9 +89,11 @@ def handle(name, cfg, cloud, log, _args):
                     puppet_config.set(cfg_name, o, v)
             # We got all our config as wanted we'll rename
             # the previous puppet.conf and create our new one
-            puppet_conf_old_fn = "%s.old" % (puppet_conf_fn)
-            util.rename(puppet_conf_fn, puppet_conf_old_fn)
-            util.write_file(puppet_conf_fn, puppet_config.stringify())
+            conf_old_fn = cloud.paths.join(False,
+                                           '/etc/puppet/puppet.conf.old')
+            util.rename(puppet_conf_fn, conf_old_fn)
+            puppet_conf_rw = cloud.paths.join(False, '/etc/puppet/puppet.conf')
+            util.write_file(puppet_conf_rw, puppet_config.stringify())
 
     # Set puppet to automatically start
     if os.path.exists('/etc/default/puppet'):
diff --git a/cloudinit/config/cc_resizefs.py b/cloudinit/config/cc_resizefs.py
index c019989e..7e1428e9 100644
--- a/cloudinit/config/cc_resizefs.py
+++ b/cloudinit/config/cc_resizefs.py
@@ -69,7 +69,7 @@ def handle(name, cfg, cloud, log, args):
         resize_root = util.get_cfg_option_str(cfg, "resize_rootfs", True)
 
     if not util.translate_bool(resize_root):
-        log.debug("Skipping transform named %s, resizing disabled", name)
+        log.debug("Skipping module named %s, resizing disabled", name)
         return
 
     # TODO is the directory ok to be used??
diff --git a/cloudinit/config/cc_rightscale_userdata.py b/cloudinit/config/cc_rightscale_userdata.py
index 8385e281..7a134569 100644
--- a/cloudinit/config/cc_rightscale_userdata.py
+++ b/cloudinit/config/cc_rightscale_userdata.py
@@ -53,13 +53,13 @@ def handle(name, _cfg, cloud, log, _args):
     try:
         ud = cloud.get_userdata_raw()
     except:
-        log.warn("Failed to get raw userdata in transform %s", name)
+        log.warn("Failed to get raw userdata in module %s", name)
         return
 
     try:
         mdict = parse_qs(ud)
         if not mdict or not MY_HOOKNAME in mdict:
-            log.debug(("Skipping transform %s, "
+            log.debug(("Skipping module %s, "
                        "did not find %s in parsed"
                        " raw userdata"), name, MY_HOOKNAME)
             return
@@ -73,7 +73,7 @@ def handle(name, _cfg, cloud, log, _args):
 
     # These will eventually be then ran by the cc_scripts_user
     # TODO: maybe this should just be a new user data handler??
-    # Instead of a late transform that acts like a user data handler?
+    # Instead of a late module that acts like a user data handler?
     scripts_d = cloud.get_ipath_cur('scripts')
     urls = mdict[MY_HOOKNAME]
     for (i, url) in enumerate(urls):
diff --git a/cloudinit/config/cc_rsyslog.py b/cloudinit/config/cc_rsyslog.py
index f2c1de1e..78327526 100644
--- a/cloudinit/config/cc_rsyslog.py
+++ b/cloudinit/config/cc_rsyslog.py
@@ -36,7 +36,7 @@ def handle(name, cfg, cloud, log, _args):
 
     # process 'rsyslog'
     if not 'rsyslog' in cfg:
-        log.debug(("Skipping transform named %s,"
+        log.debug(("Skipping module named %s,"
                    " no 'rsyslog' key in configuration"), name)
         return
 
diff --git a/cloudinit/config/cc_runcmd.py b/cloudinit/config/cc_runcmd.py
index f121484b..65064cfb 100644
--- a/cloudinit/config/cc_runcmd.py
+++ b/cloudinit/config/cc_runcmd.py
@@ -25,7 +25,7 @@ from cloudinit import util
 
 def handle(name, cfg, cloud, log, _args):
     if "runcmd" not in cfg:
-        log.debug(("Skipping transform named %s,"
+        log.debug(("Skipping module named %s,"
                    " no 'runcmd' key in configuration"), name)
         return
 
diff --git a/cloudinit/config/cc_salt_minion.py b/cloudinit/config/cc_salt_minion.py
index 986e6db6..ff90d07a 100644
--- a/cloudinit/config/cc_salt_minion.py
+++ b/cloudinit/config/cc_salt_minion.py
@@ -24,7 +24,7 @@ from cloudinit import util
 def handle(name, cfg, cloud, log, _args):
     # If there isn't a salt key in the configuration don't do anything
     if 'salt_minion' not in cfg:
-        log.debug(("Skipping transform named %s,"
+        log.debug(("Skipping module named %s,"
                    " no 'salt_minion' key in configuration"), name)
         return
 
@@ -34,8 +34,8 @@ def handle(name, cfg, cloud, log, _args):
     cloud.distro.install_packages(["salt"])
 
     # Ensure we can configure files at the right dir
-    config_dir = salt_cfg.get("config_dir", '/etc/salt')
-    config_dir = cloud.paths.join(False, config_dir)
+    config_dir = cloud.paths.join(False, salt_cfg.get("config_dir",
+                                                      '/etc/salt'))
     util.ensure_dir(config_dir)
 
     # ... and then update the salt configuration
@@ -47,8 +47,8 @@ def handle(name, cfg, cloud, log, _args):
 
     # ... copy the key pair if specified
     if 'public_key' in salt_cfg and 'private_key' in salt_cfg:
-        pki_dir = salt_cfg.get('pki_dir', '/etc/salt/pki')
-        pki_dir = cloud.paths.join(pki_dir)
+        pki_dir = cloud.paths.join(False, salt_cfg.get('pki_dir',
+                                                       '/etc/salt/pki'))
         with util.umask(077):
             util.ensure_dir(pki_dir)
             pub_name = os.path.join(pki_dir, 'minion.pub')
diff --git a/cloudinit/config/cc_scripts_per_boot.py b/cloudinit/config/cc_scripts_per_boot.py
index d3c47442..42b987eb 100644
--- a/cloudinit/config/cc_scripts_per_boot.py
+++ b/cloudinit/config/cc_scripts_per_boot.py
@@ -36,6 +36,6 @@ def handle(name, _cfg, cloud, log, _args):
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("Failed to run transform %s (%s in %s)",
+        log.warn("Failed to run module %s (%s in %s)",
                  name, SCRIPT_SUBDIR, runparts_path)
         raise
diff --git a/cloudinit/config/cc_scripts_per_instance.py b/cloudinit/config/cc_scripts_per_instance.py
index 8e428ac2..b5d71c13 100644
--- a/cloudinit/config/cc_scripts_per_instance.py
+++ b/cloudinit/config/cc_scripts_per_instance.py
@@ -36,6 +36,6 @@ def handle(name, _cfg, cloud, log, _args):
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("Failed to run transform %s (%s in %s)",
+        log.warn("Failed to run module %s (%s in %s)",
                  name, SCRIPT_SUBDIR, runparts_path)
         raise
diff --git a/cloudinit/config/cc_scripts_per_once.py b/cloudinit/config/cc_scripts_per_once.py
index e7a29a44..d77d36d5 100644
--- a/cloudinit/config/cc_scripts_per_once.py
+++ b/cloudinit/config/cc_scripts_per_once.py
@@ -36,6 +36,6 @@ def handle(name, _cfg, cloud, log, _args):
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("Failed to run transform %s (%s in %s)",
+        log.warn("Failed to run module %s (%s in %s)",
                  name, SCRIPT_SUBDIR, runparts_path)
         raise
diff --git a/cloudinit/config/cc_scripts_user.py b/cloudinit/config/cc_scripts_user.py
index 1ff05aae..5c53014f 100644
--- a/cloudinit/config/cc_scripts_user.py
+++ b/cloudinit/config/cc_scripts_user.py
@@ -37,6 +37,6 @@ def handle(name, _cfg, cloud, log, _args):
     try:
         util.runparts(runparts_path)
     except:
-        log.warn("Failed to run transform %s (%s in %s)",
+        log.warn("Failed to run module %s (%s in %s)",
                  name, SCRIPT_SUBDIR, runparts_path)
         raise
diff --git a/cloudinit/config/cc_set_hostname.py b/cloudinit/config/cc_set_hostname.py
index 3ac8a8fa..b0f27ebf 100644
--- a/cloudinit/config/cc_set_hostname.py
+++ b/cloudinit/config/cc_set_hostname.py
@@ -24,7 +24,7 @@ from cloudinit import util
 def handle(name, cfg, cloud, log, _args):
     if util.get_cfg_option_bool(cfg, "preserve_hostname", False):
         log.debug(("Configuration option 'preserve_hostname' is set,"
-                    " not setting the hostname in transform %s"), name)
+                    " not setting the hostname in module %s"), name)
         return
 
     (hostname, _fqdn) = util.get_hostname_fqdn(cfg, cloud)
diff --git a/cloudinit/config/cc_set_passwords.py b/cloudinit/config/cc_set_passwords.py
index ce17f357..eb68ddfe 100644
--- a/cloudinit/config/cc_set_passwords.py
+++ b/cloudinit/config/cc_set_passwords.py
@@ -106,7 +106,9 @@ def handle(_name, cfg, cloud, log, args):
         replacement = "PasswordAuthentication %s" % (pw_auth)
 
         # See http://linux.die.net/man/5/sshd_config
-        old_lines = util.load_file('/etc/ssh/sshd_config').splitlines()
+        conf_fn = cloud.paths.join(True, '/etc/ssh/sshd_config')
+        # Todo: use the common ssh_util function for this parsing...
+        old_lines = util.load_file(conf_fn).splitlines()
         for i, line in enumerate(old_lines):
             if not line.strip() or line.startswith("#"):
                 new_lines.append(line)
diff --git a/cloudinit/config/cc_ssh_import_id.py b/cloudinit/config/cc_ssh_import_id.py
index d57e4665..c58b28ec 100644
--- a/cloudinit/config/cc_ssh_import_id.py
+++ b/cloudinit/config/cc_ssh_import_id.py
@@ -36,11 +36,11 @@ def handle(name, cfg, _cloud, log, args):
         ids = util.get_cfg_option_list(cfg, "ssh_import_id", [])
 
     if len(ids) == 0:
-        log.debug("Skipping transform named %s, no ids found to import", name)
+        log.debug("Skipping module named %s, no ids found to import", name)
         return
 
     if not user:
-        log.debug("Skipping transform named %s, no user found to import", name)
+        log.debug("Skipping module named %s, no user found to import", name)
         return
 
     cmd = ["sudo", "-Hu", user, "ssh-import-id"] + ids
diff --git a/cloudinit/config/cc_timezone.py b/cloudinit/config/cc_timezone.py
index 747c436c..b9eb85b2 100644
--- a/cloudinit/config/cc_timezone.py
+++ b/cloudinit/config/cc_timezone.py
@@ -32,7 +32,7 @@ def handle(name, cfg, cloud, log, args):
         timezone = util.get_cfg_option_str(cfg, "timezone", False)
 
     if not timezone:
-        log.debug("Skipping transform named %s, no 'timezone' specified", name)
+        log.debug("Skipping module named %s, no 'timezone' specified", name)
         return
 
     # Let the distro handle settings its timezone
diff --git a/cloudinit/config/cc_update_etc_hosts.py b/cloudinit/config/cc_update_etc_hosts.py
index 75615db1..6820ac4f 100644
--- a/cloudinit/config/cc_update_etc_hosts.py
+++ b/cloudinit/config/cc_update_etc_hosts.py
@@ -57,4 +57,4 @@ def handle(name, cfg, cloud, log, _args):
         cloud.distro.update_etc_hosts(hostname, fqdn)
     else:
         log.debug(("Configuration option 'manage_etc_hosts' is not set,"
-                    " not managing /etc/hosts in transform %s"), name)
+                    " not managing /etc/hosts in module %s"), name)
diff --git a/cloudinit/config/cc_update_hostname.py b/cloudinit/config/cc_update_hostname.py
index 58444fab..b84a1a06 100644
--- a/cloudinit/config/cc_update_hostname.py
+++ b/cloudinit/config/cc_update_hostname.py
@@ -29,7 +29,7 @@ frequency = PER_ALWAYS
 def handle(name, cfg, cloud, log, _args):
     if util.get_cfg_option_bool(cfg, "preserve_hostname", False):
         log.debug(("Configuration option 'preserve_hostname' is set,"
-                    " not updating the hostname in transform %s"), name)
+                    " not updating the hostname in module %s"), name)
         return
 
     (hostname, _fqdn) = util.get_hostname_fqdn(cfg, cloud)
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 1997301a..9f28c2e8 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -518,7 +518,7 @@ class Modules(object):
                               " but not on %s distro. It may or may not work"
                               " correctly."), name, worked_distros, d_name)
                 # Deep copy the config so that modules can't alter it
-                # Use the transforms logger and not our own
+                # Use the configs logger and not our own
                 func_args = [name, copy.deepcopy(self.cfg),
                              cc, config.LOG, args]
                 # Mark it as having started running

From 4014179a6cd7c502b55e09271ef6d2179efbaf90 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 10:54:01 -0700
Subject: [PATCH 276/434] Use yaml safe_load just in case

---
 cloudinit/util.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 56c01fab..9c3d7fc7 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -578,7 +578,7 @@ def load_yaml(blob, default=None, allowed=(dict,)):
         LOG.debug(("Attempting to load yaml from string "
                  "of length %s with allowed root types %s"),
                  len(blob), allowed)
-        converted = yaml.load(blob)
+        converted = yaml.safe_load(blob)
         if not isinstance(converted, allowed):
             # Yes this will just be caught, but thats ok for now...
             raise TypeError(("Yaml load allows %s root types,"

From 56c86071645e42a03a1df3fd7f57c03d09cf4fd5 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 12:30:32 -0700
Subject: [PATCH 277/434] Simplify sshd config loading to make it use one set
 of functions/objects/classes

---
 cloudinit/config/cc_set_passwords.py | 43 ++++++++++--------------
 cloudinit/ssh_util.py                | 49 ++++++++++++++++++++++++----
 2 files changed, 61 insertions(+), 31 deletions(-)

diff --git a/cloudinit/config/cc_set_passwords.py b/cloudinit/config/cc_set_passwords.py
index eb68ddfe..5b72224b 100644
--- a/cloudinit/config/cc_set_passwords.py
+++ b/cloudinit/config/cc_set_passwords.py
@@ -20,6 +20,7 @@
 
 import sys
 
+from cloudinit import ssh_util
 from cloudinit import util
 
 from string import letters, digits  # pylint: disable=W0402
@@ -101,39 +102,31 @@ def handle(_name, cfg, cloud, log, args):
             pw_auth = 'no'
 
     if change_pwauth:
-        new_lines = []
         replaced_auth = False
-        replacement = "PasswordAuthentication %s" % (pw_auth)
 
-        # See http://linux.die.net/man/5/sshd_config
-        conf_fn = cloud.paths.join(True, '/etc/ssh/sshd_config')
-        # Todo: use the common ssh_util function for this parsing...
-        old_lines = util.load_file(conf_fn).splitlines()
-        for i, line in enumerate(old_lines):
-            if not line.strip() or line.startswith("#"):
-                new_lines.append(line)
-                continue
-            splitup = line.split(None, 1)
-            if len(splitup) <= 1:
-                new_lines.append(line)
-                continue
-            (cmd, args) = splitup
+        # See: man sshd_config
+        conf_fn = cloud.paths.join(True, ssh_util.DEF_SSHD_CFG)
+        old_lines = ssh_util.parse_ssh_config(conf_fn)
+        new_lines = []
+        i = 0
+        for (i, line) in enumerate(old_lines):
             # Keywords are case-insensitive and arguments are case-sensitive
-            cmd = cmd.lower().strip()
-            if cmd == 'passwordauthentication':
-                log.debug("Replacing auth line %s with %s", i + 1, replacement)
+            if line.key == 'passwordauthentication':
+                log.debug("Replacing auth line %s with %s", i + 1, pw_auth)
                 replaced_auth = True
-                new_lines.append(replacement)
-            else:
-                new_lines.append(line)
+                line.value = pw_auth
+            new_lines.append(line)
 
         if not replaced_auth:
-            log.debug("Adding new auth line %s", replacement)
+            log.debug("Adding new auth line %s", i + 1)
             replaced_auth = True
-            new_lines.append(replacement)
+            new_lines.append(ssh_util.SshdConfigLine('',
+                                                     'PasswordAuthentication',
+                                                     pw_auth))
 
-        util.write_file(cloud.paths.join(False, '/etc/ssh/sshd_config'),
-                        "\n".join(new_lines))
+        lines = [str(e) for e in new_lines]
+        ssh_rw_fn = cloud.paths.join(False, ssh_util.DEF_SSHD_CFG)
+        util.write_file(ssh_rw_fn, "\n".join(lines))
 
         try:
             cmd = ['service']
diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index 45dd5535..fc8b9b3d 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -29,6 +29,8 @@ from cloudinit import log as logging
 from cloudinit import util
 
 LOG = logging.getLogger(__name__)
+
+# See: man sshd_config
 DEF_SSHD_CFG = "/etc/ssh/sshd_config"
 
 
@@ -233,7 +235,7 @@ def setup_user_keys(keys, user, key_prefix, paths):
             # The following tokens are defined: %% is replaced by a literal
             # '%', %h is replaced by the home directory of the user being
             # authenticated and %u is replaced by the username of that user.
-            ssh_cfg = parse_ssh_config(sshd_conf_fn)
+            ssh_cfg = parse_ssh_config_map(sshd_conf_fn)
             akeys = ssh_cfg.get("authorizedkeysfile", '')
             akeys = akeys.strip()
             if not akeys:
@@ -258,19 +260,54 @@ def setup_user_keys(keys, user, key_prefix, paths):
         util.chownbyid(authorized_keys, pwent.pw_uid, pwent.pw_gid)
 
 
+class SshdConfigLine(object):
+    def __init__(self, line, k=None, v=None):
+        self.line = line
+        self._key = k
+        self.value = v
+
+    @property
+    def key(self):
+        if self._key is None:
+            return None
+        # Keywords are case-insensitive
+        return self._key.lower()
+
+    def __str__(self):
+        if self._key is None:
+            return str(self.line)
+        else:
+            v = str(self._key)
+            if self.value:
+                v += " " + str(self.value)
+            return v
+
+
 def parse_ssh_config(fname):
+    # See: man sshd_config
     # The file contains keyword-argument pairs, one per line.
     # Lines starting with '#' and empty lines are interpreted as comments.
     # Note: key-words are case-insensitive and arguments are case-sensitive
-    ret = {}
+    lines = []
     if not os.path.isfile(fname):
-        return ret
+        return lines
     for line in util.load_file(fname).splitlines():
         line = line.strip()
         if not line or line.startswith("#"):
+            lines.append(SshdConfigLine(line))
             continue
         (key, val) = line.split(None, 1)
-        key = key.strip().lower()
-        if key:
-            ret[key] = val
+        lines.append(SshdConfigLine(line, key, val))
+    return lines
+
+
+def parse_ssh_config_map(fname):
+    lines = parse_ssh_config(fname)
+    if not lines:
+        return {}
+    ret = {}
+    for line in lines:
+        if not line.key:
+            continue
+        ret[line.key] = line.value
     return ret

From f7ee6ab23a7fb8c9d0c0afd17a4e967d269c247c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 12:33:53 -0700
Subject: [PATCH 278/434] Remove an unused import.

---
 cloudinit/handlers/__init__.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index 0f7432e5..94cb699e 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -27,7 +27,6 @@ from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE, FREQUENCIES)
 
 from cloudinit import importer
 from cloudinit import log as logging
-from cloudinit import url_helper
 from cloudinit import util
 
 LOG = logging.getLogger(__name__)

From fa284be90c812b6b13a0362092c8c0ef354452dc Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 12:34:25 -0700
Subject: [PATCH 279/434] Remove another unused import

---
 cloudinit/distros/__init__.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index 6325257c..f9a97da7 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -23,7 +23,6 @@
 from StringIO import StringIO
 
 import abc
-import copy
 
 from cloudinit import importer
 from cloudinit import log as logging

From 389a0f3275be19dff20a2acf0842a10825daec36 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 13:13:19 -0700
Subject: [PATCH 280/434] Pass along any environment settings via the variable
 'noseopts'

---
 Makefile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Makefile b/Makefile
index 82c5dedb..ab23bf1f 100644
--- a/Makefile
+++ b/Makefile
@@ -11,7 +11,7 @@ pyflakes:
 	pyflakes $(PY_FILES)
 
 test:
-	nosetests tests/unittests/
+	nosetests $(noseopts) tests/unittests/
 
 2to3:
 	2to3 $(PY_FILES)

From 431b287e9df61f3cd2e5dbdfbfe1f4e770f5a67e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 13:36:33 -0700
Subject: [PATCH 281/434] This is now functional and all passing again

---
 tests/unittests/test_util.py | 91 +++++++++++++++++++-----------------
 1 file changed, 49 insertions(+), 42 deletions(-)

diff --git a/tests/unittests/test_util.py b/tests/unittests/test_util.py
index e8f5885c..27c0fbd6 100644
--- a/tests/unittests/test_util.py
+++ b/tests/unittests/test_util.py
@@ -1,13 +1,13 @@
-from unittest import TestCase
-from mocker import MockerTestCase
-from tempfile import mkdtemp
 from shutil import rmtree
+from tempfile import mkdtemp
+
 import os
 import stat
 
-from cloudinit.util import (mergedict, get_cfg_option_list_or_str, write_file,
-                            delete_dir_contents, get_cmdline,
-                            keyval_str_to_dict)
+from unittest import TestCase
+from mocker import MockerTestCase
+
+from cloudinit import util
 
 
 class TestMergeDict(TestCase):
@@ -15,14 +15,14 @@ class TestMergeDict(TestCase):
         """Test simple non-conflict merge."""
         source = {"key1": "value1"}
         candidate = {"key2": "value2"}
-        result = mergedict(source, candidate)
+        result = util.mergedict(source, candidate)
         self.assertEqual({"key1": "value1", "key2": "value2"}, result)
 
     def test_nested_merge(self):
         """Test nested merge."""
         source = {"key1": {"key1.1": "value1.1"}}
         candidate = {"key1": {"key1.2": "value1.2"}}
-        result = mergedict(source, candidate)
+        result = util.mergedict(source, candidate)
         self.assertEqual(
             {"key1": {"key1.1": "value1.1", "key1.2": "value1.2"}}, result)
 
@@ -30,42 +30,42 @@ class TestMergeDict(TestCase):
         """Test that candidate doesn't override source."""
         source = {"key1": "value1", "key2": "value2"}
         candidate = {"key1": "value2", "key2": "NEW VALUE"}
-        result = mergedict(source, candidate)
+        result = util.mergedict(source, candidate)
         self.assertEqual(source, result)
 
     def test_empty_candidate(self):
         """Test empty candidate doesn't change source."""
         source = {"key": "value"}
         candidate = {}
-        result = mergedict(source, candidate)
+        result = util.mergedict(source, candidate)
         self.assertEqual(source, result)
 
     def test_empty_source(self):
         """Test empty source is replaced by candidate."""
         source = {}
         candidate = {"key": "value"}
-        result = mergedict(source, candidate)
+        result = util.mergedict(source, candidate)
         self.assertEqual(candidate, result)
 
     def test_non_dict_candidate(self):
         """Test non-dict candidate is discarded."""
         source = {"key": "value"}
         candidate = "not a dict"
-        result = mergedict(source, candidate)
+        result = util.mergedict(source, candidate)
         self.assertEqual(source, result)
 
     def test_non_dict_source(self):
         """Test non-dict source is not modified with a dict candidate."""
         source = "not a dict"
         candidate = {"key": "value"}
-        result = mergedict(source, candidate)
+        result = util.mergedict(source, candidate)
         self.assertEqual(source, result)
 
     def test_neither_dict(self):
         """Test if neither candidate or source is dict source wins."""
         source = "source"
         candidate = "candidate"
-        result = mergedict(source, candidate)
+        result = util.mergedict(source, candidate)
         self.assertEqual(source, result)
 
 
@@ -73,31 +73,31 @@ class TestGetCfgOptionListOrStr(TestCase):
     def test_not_found_no_default(self):
         """None is returned if key is not found and no default given."""
         config = {}
-        result = get_cfg_option_list_or_str(config, "key")
+        result = util.get_cfg_option_list(config, "key")
         self.assertIsNone(result)
 
     def test_not_found_with_default(self):
         """Default is returned if key is not found."""
         config = {}
-        result = get_cfg_option_list_or_str(config, "key", default=["DEFAULT"])
+        result = util.get_cfg_option_list(config, "key", default=["DEFAULT"])
         self.assertEqual(["DEFAULT"], result)
 
     def test_found_with_default(self):
         """Default is not returned if key is found."""
         config = {"key": ["value1"]}
-        result = get_cfg_option_list_or_str(config, "key", default=["DEFAULT"])
+        result = util.get_cfg_option_list(config, "key", default=["DEFAULT"])
         self.assertEqual(["value1"], result)
 
     def test_found_convert_to_list(self):
         """Single string is converted to one element list."""
         config = {"key": "value1"}
-        result = get_cfg_option_list_or_str(config, "key")
+        result = util.get_cfg_option_list(config, "key")
         self.assertEqual(["value1"], result)
 
     def test_value_is_none(self):
         """If value is None empty list is returned."""
         config = {"key": None}
-        result = get_cfg_option_list_or_str(config, "key")
+        result = util.get_cfg_option_list(config, "key")
         self.assertEqual([], result)
 
 
@@ -117,7 +117,7 @@ class TestWriteFile(MockerTestCase):
         path = os.path.join(self.tmp, "NewFile.txt")
         contents = "Hey there"
 
-        write_file(path, contents)
+        util.write_file(path, contents)
 
         self.assertTrue(os.path.exists(path))
         self.assertTrue(os.path.isfile(path))
@@ -133,7 +133,7 @@ class TestWriteFile(MockerTestCase):
         path = os.path.join(dirname, "NewFile.txt")
         contents = "Hey there"
 
-        write_file(path, contents)
+        util.write_file(path, contents)
 
         self.assertTrue(os.path.isdir(dirname))
         self.assertTrue(os.path.isfile(path))
@@ -143,7 +143,7 @@ class TestWriteFile(MockerTestCase):
         path = os.path.join(self.tmp, "NewFile.txt")
         contents = "Hey there"
 
-        write_file(path, contents, mode=0666)
+        util.write_file(path, contents, mode=0666)
 
         self.assertTrue(os.path.exists(path))
         self.assertTrue(os.path.isfile(path))
@@ -158,7 +158,7 @@ class TestWriteFile(MockerTestCase):
         # Create file first with basic content
         with open(path, "wb") as f:
             f.write("LINE1\n")
-        write_file(path, contents, omode="a")
+        util.write_file(path, contents, omode="a")
 
         self.assertTrue(os.path.exists(path))
         self.assertTrue(os.path.isfile(path))
@@ -167,17 +167,24 @@ class TestWriteFile(MockerTestCase):
             self.assertEqual("LINE1\nHey there", create_contents)
 
     def test_restorecon_if_possible_is_called(self):
-        """Make sure the restorecon_if_possible is called correctly."""
-        path = os.path.join(self.tmp, "NewFile.txt")
-        contents = "Hey there"
-
-        # Mock out the restorecon_if_possible call to test if it's called.
-        mock_restorecon = self.mocker.replace(
-            "cloudinit.util.restorecon_if_possible", passthrough=False)
-        mock_restorecon(path)
-        self.mocker.replay()
-
-        write_file(path, contents)
+        """Make sure the selinux guard is called correctly."""
+        try:
+            # We can only mock these out if selinux actually
+            # exists, so thats why we catch the import
+            mock_restorecon = self.mocker.replace(
+                "selinux.restorecon", passthrough=False)
+            mock_is_selinux_enabled = self.mocker.replace(
+                "selinux.is_selinux_enabled", passthrough=False)
+            mock_is_selinux_enabled.result(True)
+            mock_restorecon(path)
+            self.mocker.replay()
+            old = util.HAVE_LIBSELINUX
+            util.HAVE_LIBSELINUX = True
+            with util.SeLinuxGuard(self.tmp) as is_on:
+                self.assertTrue(is_on)
+            util.HAVE_LIBSELINUX = old
+        except ImportError:
+            pass
 
 
 class TestDeleteDirContents(TestCase):
@@ -196,7 +203,7 @@ class TestDeleteDirContents(TestCase):
 
     def test_does_not_delete_dir(self):
         """Ensure directory itself is not deleted."""
-        delete_dir_contents(self.tmp)
+        util.delete_dir_contents(self.tmp)
 
         self.assertTrue(os.path.isdir(self.tmp))
         self.assertDirEmpty(self.tmp)
@@ -206,7 +213,7 @@ class TestDeleteDirContents(TestCase):
         with open(os.path.join(self.tmp, "new_file.txt"), "wb") as f:
             f.write("DELETE ME")
 
-        delete_dir_contents(self.tmp)
+        util.delete_dir_contents(self.tmp)
 
         self.assertDirEmpty(self.tmp)
 
@@ -214,7 +221,7 @@ class TestDeleteDirContents(TestCase):
         """Empty directories should be deleted."""
         os.mkdir(os.path.join(self.tmp, "new_dir"))
 
-        delete_dir_contents(self.tmp)
+        util.delete_dir_contents(self.tmp)
 
         self.assertDirEmpty(self.tmp)
 
@@ -223,7 +230,7 @@ class TestDeleteDirContents(TestCase):
         os.mkdir(os.path.join(self.tmp, "new_dir"))
         os.mkdir(os.path.join(self.tmp, "new_dir", "new_subdir"))
 
-        delete_dir_contents(self.tmp)
+        util.delete_dir_contents(self.tmp)
 
         self.assertDirEmpty(self.tmp)
 
@@ -234,7 +241,7 @@ class TestDeleteDirContents(TestCase):
         with open(f_name, "wb") as f:
             f.write("DELETE ME")
 
-        delete_dir_contents(self.tmp)
+        util.delete_dir_contents(self.tmp)
 
         self.assertDirEmpty(self.tmp)
 
@@ -246,7 +253,7 @@ class TestDeleteDirContents(TestCase):
             f.write("DELETE ME")
         os.symlink(file_name, link_name)
 
-        delete_dir_contents(self.tmp)
+        util.delete_dir_contents(self.tmp)
 
         self.assertDirEmpty(self.tmp)
 
@@ -255,12 +262,12 @@ class TestKeyValStrings(TestCase):
     def test_keyval_str_to_dict(self):
         expected = {'1': 'one', '2': 'one+one', 'ro': True}
         cmdline = "1=one ro 2=one+one"
-        self.assertEqual(expected, keyval_str_to_dict(cmdline))
+        self.assertEqual(expected, util.keyval_str_to_dict(cmdline))
 
 
 class TestGetCmdline(TestCase):
     def test_cmdline_reads_debug_env(self):
         os.environ['DEBUG_PROC_CMDLINE'] = 'abcd 123'
-        self.assertEqual(os.environ['DEBUG_PROC_CMDLINE'], get_cmdline())
+        self.assertEqual(os.environ['DEBUG_PROC_CMDLINE'], util.get_cmdline())
 
 # vi: ts=4 expandtab

From 1751a121f98ee514ed4a7d19623fcca84905e0d9 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 13:38:06 -0700
Subject: [PATCH 282/434] Returning whether it was enabled, useful for unit
 testing

---
 cloudinit/util.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 9c3d7fc7..f0a65fa3 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -133,7 +133,7 @@ class SeLinuxGuard(object):
 
     def __enter__(self):
         # TODO: Should we try to engage selinux here??
-        return None
+        return self.enabled
 
     def __exit__(self, excp_type, excp_value, excp_traceback):
         if self.enabled:

From a9933e3def7647fd7696f3246ec854b475062c33 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 15:56:31 -0700
Subject: [PATCH 283/434] 1. Got this test working again using the new code. 2.
 Adjusted so that instead of capturing all logging, only a certain level is
 captured (now that we have lots more logging)

---
 tests/unittests/test_userdata.py | 145 +++++++++++++++++++------------
 1 file changed, 91 insertions(+), 54 deletions(-)

diff --git a/tests/unittests/test_userdata.py b/tests/unittests/test_userdata.py
index 8eb7b259..eeddde7d 100644
--- a/tests/unittests/test_userdata.py
+++ b/tests/unittests/test_userdata.py
@@ -1,107 +1,144 @@
 """Tests for handling of userdata within cloud init"""
 
-import logging
 import StringIO
 
+import logging
+import os
+import shutil
+import tempfile
+
 from email.mime.base import MIMEBase
 
 from mocker import MockerTestCase
 
-import cloudinit
-from cloudinit.DataSource import DataSource
+from cloudinit import helpers
+from cloudinit import log
+from cloudinit import sources
+from cloudinit import stages
+from cloudinit import util
+
+INSTANCE_ID = "i-testing"
 
 
-instance_id = "i-testing"
-
-
-class FakeDataSource(DataSource):
+class FakeDataSource(sources.DataSource):
 
     def __init__(self, userdata):
-        DataSource.__init__(self)
-        self.metadata = {'instance-id': instance_id}
+        sources.DataSource.__init__(self, {}, None, None)
+        self.metadata = {'instance-id': INSTANCE_ID}
         self.userdata_raw = userdata
 
 
+# FIXME: these tests shouldn't be checking log output??
+# Weirddddd...
+
+
 class TestConsumeUserData(MockerTestCase):
 
-    _log_handler = None
-    _log = None
-    log_file = None
-
     def setUp(self):
+        MockerTestCase.setUp(self)
+        # Replace the write so no actual files
+        # get written out...
         self.mock_write = self.mocker.replace("cloudinit.util.write_file",
             passthrough=False)
-        self.mock_write(self.get_ipath("cloud_config"), "", 0600)
-        self.capture_log()
+        self._log = None
+        self._log_file = None
+        self._log_handler = None
 
     def tearDown(self):
-        self._log.removeHandler(self._log_handler)
+        MockerTestCase.tearDown(self)
+        if self._log_handler and self._log:
+            self._log.removeHandler(self._log_handler)
 
-    @staticmethod
-    def get_ipath(name):
-        return "%s/instances/%s%s" % (cloudinit.varlibdir, instance_id,
-            cloudinit.pathmap[name])
-
-    def capture_log(self):
-        self.log_file = StringIO.StringIO()
-        self._log_handler = logging.StreamHandler(self.log_file)
-        self._log_handler.setLevel(logging.DEBUG)
-        self._log = logging.getLogger(cloudinit.logger_name)
+    def capture_log(self, lvl=logging.DEBUG):
+        log_file = StringIO.StringIO()
+        self._log_handler = logging.StreamHandler(log_file)
+        self._log_handler.setLevel(lvl)
+        self._log = log.getLogger()
         self._log.addHandler(self._log_handler)
+        return log_file
 
     def test_unhandled_type_warning(self):
         """Raw text without magic is ignored but shows warning"""
+        ci = stages.Init()
+        data = "arbitrary text\n"
+        ci.datasource = FakeDataSource(data)
+
+        self.mock_write(ci.paths.get_ipath("cloud_config"), "", 0600)
         self.mocker.replay()
-        ci = cloudinit.CloudInit()
-        ci.datasource = FakeDataSource("arbitrary text\n")
-        ci.consume_userdata()
-        self.assertEqual(
-            "Unhandled non-multipart userdata starting 'arbitrary text...'\n",
-            self.log_file.getvalue())
+
+        log_file = self.capture_log(logging.WARNING)
+        ci.fetch()
+        ci.consume()
+        self.assertIn(
+            "Unhandled non-multipart (text/x-not-multipart) userdata:",
+            log_file.getvalue())
 
     def test_mime_text_plain(self):
-        """Mime message of type text/plain is ignored without warning"""
-        self.mocker.replay()
-        ci = cloudinit.CloudInit()
+        """Mime message of type text/plain is ignored but shows warning"""
+        ci = stages.Init()
         message = MIMEBase("text", "plain")
         message.set_payload("Just text")
         ci.datasource = FakeDataSource(message.as_string())
-        ci.consume_userdata()
-        self.assertEqual("", self.log_file.getvalue())
 
+        self.mock_write(ci.paths.get_ipath("cloud_config"), "", 0600)
+        self.mocker.replay()
+
+        log_file = self.capture_log(logging.WARNING)
+        ci.fetch()
+        ci.consume()
+        self.assertIn(
+            "Unhandled unknown content-type (text/plain)",
+            log_file.getvalue())
+
+    
     def test_shellscript(self):
         """Raw text starting #!/bin/sh is treated as script"""
+        ci = stages.Init()
         script = "#!/bin/sh\necho hello\n"
-        outpath = cloudinit.get_ipath_cur("scripts") + "/part-001"
+        ci.datasource = FakeDataSource(script)
+
+        outpath = os.path.join(ci.paths.get_ipath_cur("scripts"), "part-001")
+        self.mock_write(ci.paths.get_ipath("cloud_config"), "", 0600)
         self.mock_write(outpath, script, 0700)
         self.mocker.replay()
-        ci = cloudinit.CloudInit()
-        ci.datasource = FakeDataSource(script)
-        ci.consume_userdata()
-        self.assertEqual("", self.log_file.getvalue())
+
+        log_file = self.capture_log(logging.WARNING)
+        ci.fetch()
+        ci.consume()
+        self.assertEqual("", log_file.getvalue())
 
     def test_mime_text_x_shellscript(self):
         """Mime message of type text/x-shellscript is treated as script"""
+        ci = stages.Init()
         script = "#!/bin/sh\necho hello\n"
-        outpath = cloudinit.get_ipath_cur("scripts") + "/part-001"
-        self.mock_write(outpath, script, 0700)
-        self.mocker.replay()
-        ci = cloudinit.CloudInit()
         message = MIMEBase("text", "x-shellscript")
         message.set_payload(script)
         ci.datasource = FakeDataSource(message.as_string())
-        ci.consume_userdata()
-        self.assertEqual("", self.log_file.getvalue())
+
+        outpath = os.path.join(ci.paths.get_ipath_cur("scripts"), "part-001")
+        self.mock_write(ci.paths.get_ipath("cloud_config"), "", 0600)
+        self.mock_write(outpath, script, 0700)
+        self.mocker.replay()
+
+        log_file = self.capture_log(logging.WARNING)
+        ci.fetch()
+        ci.consume()
+        self.assertEqual("", log_file.getvalue())
 
     def test_mime_text_plain_shell(self):
         """Mime type text/plain starting #!/bin/sh is treated as script"""
+        ci = stages.Init()
         script = "#!/bin/sh\necho hello\n"
-        outpath = cloudinit.get_ipath_cur("scripts") + "/part-001"
-        self.mock_write(outpath, script, 0700)
-        self.mocker.replay()
-        ci = cloudinit.CloudInit()
         message = MIMEBase("text", "plain")
         message.set_payload(script)
         ci.datasource = FakeDataSource(message.as_string())
-        ci.consume_userdata()
-        self.assertEqual("", self.log_file.getvalue())
+
+        outpath = os.path.join(ci.paths.get_ipath_cur("scripts"), "part-001")
+        self.mock_write(outpath, script, 0700)
+        self.mock_write(ci.paths.get_ipath("cloud_config"), "", 0600)
+        self.mocker.replay()
+
+        log_file = self.capture_log(logging.WARNING)
+        ci.fetch()
+        ci.consume()
+        self.assertEqual("", log_file.getvalue())

From a505aa0c52ec728e2bb27ef268aabc30391ef115 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 15:57:09 -0700
Subject: [PATCH 284/434] Use the mocker built-in method for creating temporary
 dirs (which it will clean up)

---
 tests/unittests/test_util.py | 9 ++-------
 1 file changed, 2 insertions(+), 7 deletions(-)

diff --git a/tests/unittests/test_util.py b/tests/unittests/test_util.py
index 27c0fbd6..aea1aabb 100644
--- a/tests/unittests/test_util.py
+++ b/tests/unittests/test_util.py
@@ -1,6 +1,3 @@
-from shutil import rmtree
-from tempfile import mkdtemp
-
 import os
 import stat
 
@@ -10,7 +7,7 @@ from mocker import MockerTestCase
 from cloudinit import util
 
 
-class TestMergeDict(TestCase):
+class TestMergeDict(MockerTestCase):
     def test_simple_merge(self):
         """Test simple non-conflict merge."""
         source = {"key1": "value1"}
@@ -105,12 +102,10 @@ class TestWriteFile(MockerTestCase):
     def setUp(self):
         super(TestWriteFile, self).setUp()
         # Make a temp directoy for tests to use.
-        self.tmp = mkdtemp(prefix="unittest_")
+        self.tmp = self.makeDir(prefix="unittest_")
 
     def tearDown(self):
         super(TestWriteFile, self).tearDown()
-        # Clean up temp directory
-        rmtree(self.tmp)
 
     def test_basic_usage(self):
         """Verify basic usage with default args."""

From 2e83d545a7189802bb3e41d2d1816f7a8fa7c471 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 15:59:57 -0700
Subject: [PATCH 285/434] Missed some other mkdtemp and rmtree calls no longer
 needed

---
 tests/unittests/test_util.py | 14 ++------------
 1 file changed, 2 insertions(+), 12 deletions(-)

diff --git a/tests/unittests/test_util.py b/tests/unittests/test_util.py
index aea1aabb..ba565b29 100644
--- a/tests/unittests/test_util.py
+++ b/tests/unittests/test_util.py
@@ -101,12 +101,8 @@ class TestGetCfgOptionListOrStr(TestCase):
 class TestWriteFile(MockerTestCase):
     def setUp(self):
         super(TestWriteFile, self).setUp()
-        # Make a temp directoy for tests to use.
         self.tmp = self.makeDir(prefix="unittest_")
 
-    def tearDown(self):
-        super(TestWriteFile, self).tearDown()
-
     def test_basic_usage(self):
         """Verify basic usage with default args."""
         path = os.path.join(self.tmp, "NewFile.txt")
@@ -182,16 +178,10 @@ class TestWriteFile(MockerTestCase):
             pass
 
 
-class TestDeleteDirContents(TestCase):
+class TestDeleteDirContents(MockerTestCase):
     def setUp(self):
         super(TestDeleteDirContents, self).setUp()
-        # Make a temp directoy for tests to use.
-        self.tmp = mkdtemp(prefix="unittest_")
-
-    def tearDown(self):
-        super(TestDeleteDirContents, self).tearDown()
-        # Clean up temp directory
-        rmtree(self.tmp)
+        self.tmp = self.makeDir(prefix="unittest_")
 
     def assertDirEmpty(self, dirname):
         self.assertEqual([], os.listdir(dirname))

From 8069ce83abd825b812aa466cc45b63053c487437 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 17:15:45 -0700
Subject: [PATCH 286/434] 1. Only register and increment the handler count
 after we have ensured it imports and call_begin passes. 2. Fix up the
 'test__init__.py' file so that it works again.

---
 cloudinit/handlers/__init__.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/cloudinit/handlers/__init__.py b/cloudinit/handlers/__init__.py
index 94cb699e..20a822bd 100644
--- a/cloudinit/handlers/__init__.py
+++ b/cloudinit/handlers/__init__.py
@@ -135,12 +135,15 @@ def walker_handle_handler(pdata, _ctype, _filename, payload):
         modfname = "%s.py" % (modfname)
     # TODO: Check if path exists??
     util.write_file(modfname, payload, 0600)
-    pdata['handlercount'] = curcount + 1
     handlers = pdata['handlers']
     try:
         mod = fixup_handler(importer.import_module(modname))
-        handlers.register(mod)
         call_begin(mod, pdata['data'], frequency)
+        # Only register and increment
+        # after the above have worked (so we don't if it
+        # fails)
+        handlers.register(mod)
+        pdata['handlercount'] = curcount + 1
     except:
         util.logexc(LOG, ("Failed at registering python file: %s"
                           " (part handler %s)"), modfname, curcount)

From 236c293e53d43ed88724395d82cc07e0476fdea2 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 17:36:09 -0700
Subject: [PATCH 287/434] Testing is easier if we just pass the paths object,
 instead of the full cloud object here.

---
 cloudinit/config/cc_ca_certs.py | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/cloudinit/config/cc_ca_certs.py b/cloudinit/config/cc_ca_certs.py
index 3221a587..266a2d84 100644
--- a/cloudinit/config/cc_ca_certs.py
+++ b/cloudinit/config/cc_ca_certs.py
@@ -33,7 +33,7 @@ def update_ca_certs():
     util.subp(["update-ca-certificates"])
 
 
-def add_ca_certs(cloud, certs):
+def add_ca_certs(paths, certs):
     """
     Adds certificates to the system. To actually apply the new certificates
     you must also call L{update_ca_certs}.
@@ -44,21 +44,21 @@ def add_ca_certs(cloud, certs):
         # First ensure they are strings...
         cert_file_contents = "\n".join([str(c) for c in certs])
         cert_file_fullpath = os.path.join(CA_CERT_PATH, CA_CERT_FILENAME)
-        cert_file_fullpath = cloud.paths.join(False, cert_file_fullpath)
+        cert_file_fullpath = paths.join(False, cert_file_fullpath)
         util.write_file(cert_file_fullpath, cert_file_contents, mode=0644)
         # Append cert filename to CA_CERT_CONFIG file.
-        util.write_file(cloud.paths.join(False, CA_CERT_CONFIG),
+        util.write_file(paths.join(False, CA_CERT_CONFIG),
                         "\n%s" % CA_CERT_FILENAME, omode="ab")
 
 
-def remove_default_ca_certs(cloud):
+def remove_default_ca_certs(paths):
     """
     Removes all default trusted CA certificates from the system. To actually
     apply the change you must also call L{update_ca_certs}.
     """
-    util.delete_dir_contents(cloud.paths.join(False, CA_CERT_PATH))
-    util.delete_dir_contents(cloud.paths.join(False, CA_CERT_SYSTEM_PATH))
-    util.write_file(cloud.paths.join(False, CA_CERT_CONFIG), "", mode=0644)
+    util.delete_dir_contents(paths.join(False, CA_CERT_PATH))
+    util.delete_dir_contents(paths.join(False, CA_CERT_SYSTEM_PATH))
+    util.write_file(paths.join(False, CA_CERT_CONFIG), "", mode=0644)
     debconf_sel = "ca-certificates ca-certificates/trust_new_crts select no"
     util.subp(('debconf-set-selections', '-'), debconf_sel)
 
@@ -85,14 +85,14 @@ def handle(name, cfg, cloud, log, _args):
     # default trusted CA certs first.
     if ca_cert_cfg.get("remove-defaults", False):
         log.debug("Removing default certificates")
-        remove_default_ca_certs(cloud)
+        remove_default_ca_certs(cloud.paths)
 
     # If we are given any new trusted CA certs to add, add them.
     if "trusted" in ca_cert_cfg:
         trusted_certs = util.get_cfg_option_list(ca_cert_cfg, "trusted")
         if trusted_certs:
             log.debug("Adding %d certificates" % len(trusted_certs))
-            add_ca_certs(cloud, trusted_certs)
+            add_ca_certs(cloud.paths, trusted_certs)
 
     # Update the system with the new cert configuration.
     log.debug("Updating certificates")

From 539a05e141b2d84dd12b32b275399c8ceb1a3d72 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 17:37:00 -0700
Subject: [PATCH 288/434] Get both of these tests back in working shape.

---
 tests/unittests/test__init__.py               | 162 ++++++++----------
 .../test_handler/test_handler_ca_certs.py     | 101 ++++++-----
 2 files changed, 131 insertions(+), 132 deletions(-)

diff --git a/tests/unittests/test__init__.py b/tests/unittests/test__init__.py
index 4f60f0ea..af18955d 100644
--- a/tests/unittests/test__init__.py
+++ b/tests/unittests/test__init__.py
@@ -1,18 +1,42 @@
-from mocker import MockerTestCase, ANY, ARGS, KWARGS
+import StringIO
+import logging
 import os
+import sys
 
-from cloudinit import (partwalker_handle_handler, handler_handle_part,
-                       handler_register, get_cmdline_url)
-from cloudinit.util import write_file, logexc, readurl
+from mocker import MockerTestCase, ANY, ARGS, KWARGS
+
+from cloudinit import handlers
+from cloudinit import helpers
+from cloudinit import importer
+from cloudinit import log
+from cloudinit import settings
+from cloudinit import url_helper
+from cloudinit import util
 
 
-class TestPartwalkerHandleHandler(MockerTestCase):
+class FakeModule(handlers.Handler):
+    def __init__(self):
+        handlers.Handler.__init__(self, settings.PER_ALWAYS)
+        self.types = []
+
+    def list_types(self):
+        return self.types
+
+    def _handle_part(self, data, ctype, filename, payload, frequency):
+        pass
+
+
+class TestWalkerHandleHandler(MockerTestCase):
+
     def setUp(self):
+
+        MockerTestCase.setUp(self)
+
         self.data = {
             "handlercount": 0,
-            "frequency": "?",
-            "handlerdir": "?",
-            "handlers": [],
+            "frequency": "",
+            "handlerdir": self.makeDir(),
+            "handlers": helpers.ContentHandlers(),
             "data": None}
 
         self.expected_module_name = "part-handler-%03d" % (
@@ -20,179 +44,138 @@ class TestPartwalkerHandleHandler(MockerTestCase):
         expected_file_name = "%s.py" % self.expected_module_name
         expected_file_fullname = os.path.join(self.data["handlerdir"],
                                               expected_file_name)
-        self.module_fake = "fake module handle"
+        self.module_fake = FakeModule()
         self.ctype = None
         self.filename = None
         self.payload = "dummy payload"
 
         # Mock the write_file function
-        write_file_mock = self.mocker.replace(write_file, passthrough=False)
+        write_file_mock = self.mocker.replace(util.write_file, passthrough=False)
         write_file_mock(expected_file_fullname, self.payload, 0600)
 
     def test_no_errors(self):
         """Payload gets written to file and added to C{pdata}."""
-        # Mock the __import__ builtin
-        import_mock = self.mocker.replace("__builtin__.__import__")
+        import_mock = self.mocker.replace(importer.import_module, passthrough=False)
         import_mock(self.expected_module_name)
         self.mocker.result(self.module_fake)
-        # Mock the handle_register function
-        handle_reg_mock = self.mocker.replace(handler_register,
-                                              passthrough=False)
-        handle_reg_mock(self.module_fake, self.data["handlers"],
-                        self.data["data"], self.data["frequency"])
-        # Activate mocks
         self.mocker.replay()
-
-        partwalker_handle_handler(self.data, self.ctype, self.filename,
-                                  self.payload)
-
+ 
+        handlers.walker_handle_handler(self.data, self.ctype, self.filename,
+                                       self.payload)
+ 
         self.assertEqual(1, self.data["handlercount"])
-
+ 
     def test_import_error(self):
         """Module import errors are logged. No handler added to C{pdata}"""
-        # Mock the __import__ builtin
-        import_mock = self.mocker.replace("__builtin__.__import__")
+        import_mock = self.mocker.replace(importer.import_module, passthrough=False)
         import_mock(self.expected_module_name)
         self.mocker.throw(ImportError())
-        # Mock log function
-        logexc_mock = self.mocker.replace(logexc, passthrough=False)
-        logexc_mock(ANY)
-        # Mock the print_exc function
-        print_exc_mock = self.mocker.replace("traceback.print_exc",
-                                             passthrough=False)
-        print_exc_mock(ARGS, KWARGS)
-        # Activate mocks
         self.mocker.replay()
 
-        partwalker_handle_handler(self.data, self.ctype, self.filename,
-                                  self.payload)
+        handlers.walker_handle_handler(self.data, self.ctype, self.filename,
+                                       self.payload)
 
         self.assertEqual(0, self.data["handlercount"])
 
     def test_attribute_error(self):
         """Attribute errors are logged. No handler added to C{pdata}"""
-        # Mock the __import__ builtin
-        import_mock = self.mocker.replace("__builtin__.__import__")
+        import_mock = self.mocker.replace(importer.import_module, passthrough=False)
         import_mock(self.expected_module_name)
         self.mocker.result(self.module_fake)
-        # Mock the handle_register function
-        handle_reg_mock = self.mocker.replace(handler_register,
-                                              passthrough=False)
-        handle_reg_mock(self.module_fake, self.data["handlers"],
-                        self.data["data"], self.data["frequency"])
         self.mocker.throw(AttributeError())
-        # Mock log function
-        logexc_mock = self.mocker.replace(logexc, passthrough=False)
-        logexc_mock(ANY)
-        # Mock the print_exc function
-        print_exc_mock = self.mocker.replace("traceback.print_exc",
-                                             passthrough=False)
-        print_exc_mock(ARGS, KWARGS)
-        # Activate mocks
         self.mocker.replay()
 
-        partwalker_handle_handler(self.data, self.ctype, self.filename,
-                                  self.payload)
+        handlers.walker_handle_handler(self.data, self.ctype, self.filename,
+                                       self.payload)
 
         self.assertEqual(0, self.data["handlercount"])
 
 
 class TestHandlerHandlePart(MockerTestCase):
+
     def setUp(self):
         self.data = "fake data"
         self.ctype = "fake ctype"
         self.filename = "fake filename"
         self.payload = "fake payload"
-        self.frequency = "once-per-instance"
+        self.frequency = settings.PER_INSTANCE
 
     def test_normal_version_1(self):
         """
         C{handle_part} is called without C{frequency} for
         C{handler_version} == 1.
         """
-        # Build a mock part-handler module
         mod_mock = self.mocker.mock()
         getattr(mod_mock, "frequency")
-        self.mocker.result("once-per-instance")
+        self.mocker.result(settings.PER_INSTANCE)
         getattr(mod_mock, "handler_version")
         self.mocker.result(1)
         mod_mock.handle_part(self.data, self.ctype, self.filename,
                              self.payload)
         self.mocker.replay()
 
-        handler_handle_part(mod_mock, self.data, self.ctype, self.filename,
-                            self.payload, self.frequency)
+        handlers.run_part(mod_mock, self.data, self.ctype, self.filename,
+                          self.payload, self.frequency)
 
     def test_normal_version_2(self):
         """
         C{handle_part} is called with C{frequency} for
         C{handler_version} == 2.
         """
-        # Build a mock part-handler module
         mod_mock = self.mocker.mock()
         getattr(mod_mock, "frequency")
-        self.mocker.result("once-per-instance")
+        self.mocker.result(settings.PER_INSTANCE)
         getattr(mod_mock, "handler_version")
         self.mocker.result(2)
         mod_mock.handle_part(self.data, self.ctype, self.filename,
                              self.payload, self.frequency)
         self.mocker.replay()
 
-        handler_handle_part(mod_mock, self.data, self.ctype, self.filename,
-                            self.payload, self.frequency)
+        handlers.run_part(mod_mock, self.data, self.ctype, self.filename,
+                          self.payload, self.frequency)
 
     def test_modfreq_per_always(self):
         """
         C{handle_part} is called regardless of frequency if nofreq is always.
         """
         self.frequency = "once"
-        # Build a mock part-handler module
         mod_mock = self.mocker.mock()
         getattr(mod_mock, "frequency")
-        self.mocker.result("always")
+        self.mocker.result(settings.PER_ALWAYS)
         getattr(mod_mock, "handler_version")
         self.mocker.result(1)
         mod_mock.handle_part(self.data, self.ctype, self.filename,
                              self.payload)
         self.mocker.replay()
 
-        handler_handle_part(mod_mock, self.data, self.ctype, self.filename,
-                            self.payload, self.frequency)
+        handlers.run_part(mod_mock, self.data, self.ctype, self.filename,
+                          self.payload, self.frequency)
 
     def test_no_handle_when_modfreq_once(self):
         """C{handle_part} is not called if frequency is once"""
         self.frequency = "once"
-        # Build a mock part-handler module
         mod_mock = self.mocker.mock()
         getattr(mod_mock, "frequency")
-        self.mocker.result("once-per-instance")
+        self.mocker.result(settings.PER_ONCE)
         self.mocker.replay()
 
-        handler_handle_part(mod_mock, self.data, self.ctype, self.filename,
-                            self.payload, self.frequency)
+        handlers.run_part(mod_mock, self.data, self.ctype, self.filename,
+                          self.payload, self.frequency)
 
     def test_exception_is_caught(self):
         """Exceptions within C{handle_part} are caught and logged."""
-        # Build a mock part-handler module
         mod_mock = self.mocker.mock()
         getattr(mod_mock, "frequency")
-        self.mocker.result("once-per-instance")
+        self.mocker.result(settings.PER_INSTANCE)
         getattr(mod_mock, "handler_version")
         self.mocker.result(1)
         mod_mock.handle_part(self.data, self.ctype, self.filename,
                              self.payload)
         self.mocker.throw(Exception())
-        # Mock log function
-        logexc_mock = self.mocker.replace(logexc, passthrough=False)
-        logexc_mock(ANY)
-        # Mock the print_exc function
-        print_exc_mock = self.mocker.replace("traceback.print_exc",
-                                             passthrough=False)
-        print_exc_mock(ARGS, KWARGS)
         self.mocker.replay()
 
-        handler_handle_part(mod_mock, self.data, self.ctype, self.filename,
-                            self.payload, self.frequency)
+        handlers.run_part(mod_mock, self.data, self.ctype, self.filename,
+                          self.payload, self.frequency)
 
 
 class TestCmdlineUrl(MockerTestCase):
@@ -202,14 +185,13 @@ class TestCmdlineUrl(MockerTestCase):
         payload = "0"
         cmdline = "ro %s=%s bar=1" % (key, url)
 
-        mock_readurl = self.mocker.replace(readurl, passthrough=False)
+        mock_readurl = self.mocker.replace(url_helper.readurl, passthrough=False)
         mock_readurl(url)
-        self.mocker.result(payload)
-
+        self.mocker.result(url_helper.UrlResponse(200, payload))
         self.mocker.replay()
 
         self.assertEqual((key, url, None),
-            get_cmdline_url(names=[key], starts="xxxxxx", cmdline=cmdline))
+            util.get_cmdline_url(names=[key], starts="xxxxxx", cmdline=cmdline))
 
     def test_valid_content(self):
         url = "http://example.com/foo"
@@ -217,14 +199,13 @@ class TestCmdlineUrl(MockerTestCase):
         payload = "xcloud-config\nmydata: foo\nbar: wark\n"
         cmdline = "ro %s=%s bar=1" % (key, url)
 
-        mock_readurl = self.mocker.replace(readurl, passthrough=False)
+        mock_readurl = self.mocker.replace(url_helper.readurl, passthrough=False)
         mock_readurl(url)
-        self.mocker.result(payload)
-
+        self.mocker.result(url_helper.UrlResponse(200, payload))
         self.mocker.replay()
 
         self.assertEqual((key, url, payload),
-            get_cmdline_url(names=[key], starts="xcloud-config",
+            util.get_cmdline_url(names=[key], starts="xcloud-config",
                             cmdline=cmdline))
 
     def test_no_key_found(self):
@@ -232,11 +213,12 @@ class TestCmdlineUrl(MockerTestCase):
         key = "mykey"
         cmdline = "ro %s=%s bar=1" % (key, url)
 
-        self.mocker.replace(readurl, passthrough=False)
+        self.mocker.replace(url_helper.readurl, passthrough=False)
+        self.mocker.result(url_helper.UrlResponse(400))
         self.mocker.replay()
 
         self.assertEqual((None, None, None),
-            get_cmdline_url(names=["does-not-appear"],
+            util.get_cmdline_url(names=["does-not-appear"],
                 starts="#cloud-config", cmdline=cmdline))
 
 # vi: ts=4 expandtab
diff --git a/tests/unittests/test_handler/test_handler_ca_certs.py b/tests/unittests/test_handler/test_handler_ca_certs.py
index 21d2442f..8d85d331 100644
--- a/tests/unittests/test_handler/test_handler_ca_certs.py
+++ b/tests/unittests/test_handler/test_handler_ca_certs.py
@@ -1,9 +1,12 @@
 from mocker import MockerTestCase
 
-from cloudinit.util import write_file, delete_dir_contents
-from cloudinit.CloudConfig.cc_ca_certs import (
-    handle, update_ca_certs, add_ca_certs, remove_default_ca_certs)
-from logging import getLogger
+from cloudinit import util
+from cloudinit import cloud
+from cloudinit import helpers
+
+from cloudinit.config import cc_ca_certs
+
+import logging
 
 
 class TestNoConfig(MockerTestCase):
@@ -11,36 +14,37 @@ class TestNoConfig(MockerTestCase):
         super(TestNoConfig, self).setUp()
         self.name = "ca-certs"
         self.cloud_init = None
-        self.log = getLogger("TestNoConfig")
+        self.log = logging.getLogger("TestNoConfig")
         self.args = []
 
     def test_no_config(self):
         """
         Test that nothing is done if no ca-certs configuration is provided.
         """
-        config = {"unknown-key": "value"}
-
-        self.mocker.replace(write_file, passthrough=False)
-        self.mocker.replace(update_ca_certs, passthrough=False)
+        config = util.get_builtin_cfg()
+        self.mocker.replace(util.write_file, passthrough=False)
+        self.mocker.replace(cc_ca_certs.update_ca_certs, passthrough=False)
         self.mocker.replay()
 
-        handle(self.name, config, self.cloud_init, self.log, self.args)
+        cc_ca_certs.handle(self.name, config, self.cloud_init, self.log, self.args)
 
 
 class TestConfig(MockerTestCase):
     def setUp(self):
         super(TestConfig, self).setUp()
         self.name = "ca-certs"
-        self.cloud_init = None
-        self.log = getLogger("TestNoConfig")
+        self.paths = None
+        self.cloud = cloud.Cloud(None, self.paths, None, None, None)
+        self.log = logging.getLogger("TestNoConfig")
         self.args = []
 
         # Mock out the functions that actually modify the system
-        self.mock_add = self.mocker.replace(add_ca_certs, passthrough=False)
-        self.mock_update = self.mocker.replace(update_ca_certs,
+        self.mock_add = self.mocker.replace(cc_ca_certs.add_ca_certs, passthrough=False)
+        self.mock_update = self.mocker.replace(cc_ca_certs.update_ca_certs,
                                                passthrough=False)
-        self.mock_remove = self.mocker.replace(remove_default_ca_certs,
+        self.mock_remove = self.mocker.replace(cc_ca_certs.remove_default_ca_certs,
                                                passthrough=False)
+
         # Order must be correct
         self.mocker.order()
 
@@ -55,7 +59,7 @@ class TestConfig(MockerTestCase):
         self.mock_update()
         self.mocker.replay()
 
-        handle(self.name, config, self.cloud_init, self.log, self.args)
+        cc_ca_certs.handle(self.name, config, self.cloud, self.log, self.args)
 
     def test_empty_trusted_list(self):
         """Test that no certificate are written if 'trusted' list is empty"""
@@ -65,37 +69,37 @@ class TestConfig(MockerTestCase):
         self.mock_update()
         self.mocker.replay()
 
-        handle(self.name, config, self.cloud_init, self.log, self.args)
+        cc_ca_certs.handle(self.name, config, self.cloud, self.log, self.args)
 
     def test_single_trusted(self):
         """Test that a single cert gets passed to add_ca_certs"""
         config = {"ca-certs": {"trusted": ["CERT1"]}}
 
-        self.mock_add(["CERT1"])
+        self.mock_add(self.paths, ["CERT1"])
         self.mock_update()
         self.mocker.replay()
 
-        handle(self.name, config, self.cloud_init, self.log, self.args)
+        cc_ca_certs.handle(self.name, config, self.cloud, self.log, self.args)
 
     def test_multiple_trusted(self):
         """Test that multiple certs get passed to add_ca_certs"""
         config = {"ca-certs": {"trusted": ["CERT1", "CERT2"]}}
 
-        self.mock_add(["CERT1", "CERT2"])
+        self.mock_add(self.paths, ["CERT1", "CERT2"])
         self.mock_update()
         self.mocker.replay()
 
-        handle(self.name, config, self.cloud_init, self.log, self.args)
+        cc_ca_certs.handle(self.name, config, self.cloud, self.log, self.args)
 
     def test_remove_default_ca_certs(self):
         """Test remove_defaults works as expected"""
         config = {"ca-certs": {"remove-defaults": True}}
 
-        self.mock_remove()
+        self.mock_remove(self.paths)
         self.mock_update()
         self.mocker.replay()
 
-        handle(self.name, config, self.cloud_init, self.log, self.args)
+        cc_ca_certs.handle(self.name, config, self.cloud, self.log, self.args)
 
     def test_no_remove_defaults_if_false(self):
         """Test remove_defaults is not called when config value is False"""
@@ -104,72 +108,85 @@ class TestConfig(MockerTestCase):
         self.mock_update()
         self.mocker.replay()
 
-        handle(self.name, config, self.cloud_init, self.log, self.args)
+        cc_ca_certs.handle(self.name, config, self.cloud, self.log, self.args)
 
     def test_correct_order_for_remove_then_add(self):
         """Test remove_defaults is not called when config value is False"""
         config = {"ca-certs": {"remove-defaults": True, "trusted": ["CERT1"]}}
 
-        self.mock_remove()
-        self.mock_add(["CERT1"])
+        self.mock_remove(self.paths)
+        self.mock_add(self.paths, ["CERT1"])
         self.mock_update()
         self.mocker.replay()
 
-        handle(self.name, config, self.cloud_init, self.log, self.args)
+        cc_ca_certs.handle(self.name, config, self.cloud, self.log, self.args)
 
 
 class TestAddCaCerts(MockerTestCase):
+
+    def setUp(self):
+        super(TestAddCaCerts, self).setUp()
+        self.paths = helpers.Paths({
+            'cloud_dir': self.makeDir()
+        })
+
     def test_no_certs_in_list(self):
         """Test that no certificate are written if not provided."""
-        self.mocker.replace(write_file, passthrough=False)
+        self.mocker.replace(util.write_file, passthrough=False)
         self.mocker.replay()
-
-        add_ca_certs([])
+        cc_ca_certs.add_ca_certs(self.paths, [])
 
     def test_single_cert(self):
         """Test adding a single certificate to the trusted CAs"""
         cert = "CERT1\nLINE2\nLINE3"
 
-        mock_write = self.mocker.replace(write_file, passthrough=False)
+        mock_write = self.mocker.replace(util.write_file, passthrough=False)
         mock_write("/usr/share/ca-certificates/cloud-init-ca-certs.crt",
                    cert, mode=0644)
         mock_write("/etc/ca-certificates.conf",
-                   "\ncloud-init-ca-certs.crt", omode="a")
+                   "\ncloud-init-ca-certs.crt", omode="ab")
         self.mocker.replay()
 
-        add_ca_certs([cert])
+        cc_ca_certs.add_ca_certs(self.paths, [cert])
 
     def test_multiple_certs(self):
         """Test adding multiple certificates to the trusted CAs"""
         certs = ["CERT1\nLINE2\nLINE3", "CERT2\nLINE2\nLINE3"]
         expected_cert_file = "\n".join(certs)
 
-        mock_write = self.mocker.replace(write_file, passthrough=False)
+        mock_write = self.mocker.replace(util.write_file, passthrough=False)
         mock_write("/usr/share/ca-certificates/cloud-init-ca-certs.crt",
                    expected_cert_file, mode=0644)
         mock_write("/etc/ca-certificates.conf",
-                   "\ncloud-init-ca-certs.crt", omode="a")
+                   "\ncloud-init-ca-certs.crt", omode="ab")
         self.mocker.replay()
 
-        add_ca_certs(certs)
+        cc_ca_certs.add_ca_certs(self.paths, certs)
 
 
 class TestUpdateCaCerts(MockerTestCase):
     def test_commands(self):
-        mock_check_call = self.mocker.replace("subprocess.check_call",
+        mock_check_call = self.mocker.replace(util.subp,
                                               passthrough=False)
         mock_check_call(["update-ca-certificates"])
         self.mocker.replay()
 
-        update_ca_certs()
+        cc_ca_certs.update_ca_certs()
 
 
 class TestRemoveDefaultCaCerts(MockerTestCase):
+
+    def setUp(self):
+        super(TestRemoveDefaultCaCerts, self).setUp()
+        self.paths = helpers.Paths({
+            'cloud_dir': self.makeDir()
+        })
+
     def test_commands(self):
-        mock_delete_dir_contents = self.mocker.replace(delete_dir_contents,
+        mock_delete_dir_contents = self.mocker.replace(util.delete_dir_contents,
                                                        passthrough=False)
-        mock_write = self.mocker.replace(write_file, passthrough=False)
-        mock_subp = self.mocker.replace("cloudinit.util.subp",
+        mock_write = self.mocker.replace(util.write_file, passthrough=False)
+        mock_subp = self.mocker.replace(util.subp,
                                         passthrough=False)
 
         mock_delete_dir_contents("/usr/share/ca-certificates/")
@@ -179,4 +196,4 @@ class TestRemoveDefaultCaCerts(MockerTestCase):
                   "ca-certificates ca-certificates/trust_new_crts select no")
         self.mocker.replay()
 
-        remove_default_ca_certs()
+        cc_ca_certs.remove_default_ca_certs(self.paths)

From f60d2e26aaa962257328ddbfa707e48e879d9934 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 17:54:42 -0700
Subject: [PATCH 289/434] Ensure that calling the urls happens in a specified
 order.

---
 cloudinit/sources/DataSourceMAAS.py | 9 ++++++++-
 1 file changed, 8 insertions(+), 1 deletion(-)

diff --git a/cloudinit/sources/DataSourceMAAS.py b/cloudinit/sources/DataSourceMAAS.py
index 22c90b7c..f16d5c21 100644
--- a/cloudinit/sources/DataSourceMAAS.py
+++ b/cloudinit/sources/DataSourceMAAS.py
@@ -172,6 +172,12 @@ def read_maas_seed_url(seed_url, header_cb=None, timeout=None,
       * <seed_url>/<version>/user-data
     """
     base_url = "%s/%s" % (seed_url, version)
+    file_order = [
+        'local-hostname',
+        'instance-id',
+        'public-keys',
+        'user-data',
+    ]
     files = {
         'local-hostname': "%s/%s" % (base_url, 'meta-data/local-hostname'),
         'instance-id': "%s/%s" % (base_url, 'meta-data/instance-id'),
@@ -179,7 +185,8 @@ def read_maas_seed_url(seed_url, header_cb=None, timeout=None,
         'user-data': "%s/%s" % (base_url, 'user-data'),
     }
     md = {}
-    for (name, url) in files:
+    for name in file_order:
+        url = files.get(name)
         if header_cb:
             headers = header_cb(url)
         else:

From 052605c0f111fe9e26a6ac9451ff48eed5e81c05 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 17:54:53 -0700
Subject: [PATCH 290/434] Get this test working again.

---
 tests/unittests/test_datasource/test_maas.py | 64 +++++++++-----------
 1 file changed, 30 insertions(+), 34 deletions(-)

diff --git a/tests/unittests/test_datasource/test_maas.py b/tests/unittests/test_datasource/test_maas.py
index 7659dd03..261c410a 100644
--- a/tests/unittests/test_datasource/test_maas.py
+++ b/tests/unittests/test_datasource/test_maas.py
@@ -1,14 +1,11 @@
-from tempfile import mkdtemp
-from shutil import rmtree
 import os
 from StringIO import StringIO
 from copy import copy
-from cloudinit.DataSourceMAAS import (
-    MAASSeedDirNone,
-    MAASSeedDirMalformed,
-    read_maas_seed_dir,
-    read_maas_seed_url,
-)
+
+from cloudinit import util
+from cloudinit import url_helper
+from cloudinit.sources import DataSourceMAAS
+
 from mocker import MockerTestCase
 
 
@@ -17,12 +14,7 @@ class TestMAASDataSource(MockerTestCase):
     def setUp(self):
         super(TestMAASDataSource, self).setUp()
         # Make a temp directoy for tests to use.
-        self.tmp = mkdtemp(prefix="unittest_")
-
-    def tearDown(self):
-        super(TestMAASDataSource, self).tearDown()
-        # Clean up temp directory
-        rmtree(self.tmp)
+        self.tmp = self.makeDir()
 
     def test_seed_dir_valid(self):
         """Verify a valid seeddir is read as such"""
@@ -35,7 +27,7 @@ class TestMAASDataSource(MockerTestCase):
         my_d = os.path.join(self.tmp, "valid")
         populate_dir(my_d, data)
 
-        (userdata, metadata) = read_maas_seed_dir(my_d)
+        (userdata, metadata) = DataSourceMAAS.read_maas_seed_dir(my_d)
 
         self.assertEqual(userdata, data['user-data'])
         for key in ('instance-id', 'local-hostname'):
@@ -54,7 +46,7 @@ class TestMAASDataSource(MockerTestCase):
         my_d = os.path.join(self.tmp, "valid_extra")
         populate_dir(my_d, data)
 
-        (userdata, metadata) = read_maas_seed_dir(my_d)
+        (userdata, metadata) = DataSourceMAAS.read_maas_seed_dir(my_d)
 
         self.assertEqual(userdata, data['user-data'])
         for key in ('instance-id', 'local-hostname'):
@@ -76,24 +68,28 @@ class TestMAASDataSource(MockerTestCase):
         invalid_data = copy(valid)
         del invalid_data['local-hostname']
         populate_dir(my_d, invalid_data)
-        self.assertRaises(MAASSeedDirMalformed, read_maas_seed_dir, my_d)
+        self.assertRaises(DataSourceMAAS.MAASSeedDirMalformed,
+                          DataSourceMAAS.read_maas_seed_dir, my_d)
 
         # missing 'instance-id'
         my_d = "%s-02" % my_based
         invalid_data = copy(valid)
         del invalid_data['instance-id']
         populate_dir(my_d, invalid_data)
-        self.assertRaises(MAASSeedDirMalformed, read_maas_seed_dir, my_d)
+        self.assertRaises(DataSourceMAAS.MAASSeedDirMalformed,
+                          DataSourceMAAS.read_maas_seed_dir, my_d)
 
     def test_seed_dir_none(self):
         """Verify that empty seed_dir raises MAASSeedDirNone"""
 
         my_d = os.path.join(self.tmp, "valid_empty")
-        self.assertRaises(MAASSeedDirNone, read_maas_seed_dir, my_d)
+        self.assertRaises(DataSourceMAAS.MAASSeedDirNone,
+                          DataSourceMAAS.read_maas_seed_dir, my_d)
 
     def test_seed_dir_missing(self):
         """Verify that missing seed_dir raises MAASSeedDirNone"""
-        self.assertRaises(MAASSeedDirNone, read_maas_seed_dir,
+        self.assertRaises(DataSourceMAAS.MAASSeedDirNone, 
+            DataSourceMAAS.read_maas_seed_dir,
             os.path.join(self.tmp, "nonexistantdirectory"))
 
     def test_seed_url_valid(self):
@@ -102,30 +98,30 @@ class TestMAASDataSource(MockerTestCase):
             'meta-data/local-hostname': 'test-hostname',
             'meta-data/public-keys': 'test-hostname',
             'user-data': 'foodata'}
-
+        valid_order = [
+            'meta-data/local-hostname',
+            'meta-data/instance-id',
+            'meta-data/public-keys',
+            'user-data',
+        ]
         my_seed = "http://example.com/xmeta"
         my_ver = "1999-99-99"
         my_headers = {'header1': 'value1', 'header2': 'value2'}
 
         def my_headers_cb(url):
-            return(my_headers)
+            return my_headers
 
-        mock_request = self.mocker.replace("urllib2.Request",
-            passthrough=False)
-        mock_urlopen = self.mocker.replace("urllib2.urlopen",
+        mock_request = self.mocker.replace(url_helper.readurl,
             passthrough=False)
 
-        for (key, val) in valid.iteritems():
-            mock_request("%s/%s/%s" % (my_seed, my_ver, key),
-                data=None, headers=my_headers)
-            self.mocker.nospec()
-            self.mocker.result("fake-request-%s" % key)
-            mock_urlopen("fake-request-%s" % key, timeout=None)
-            self.mocker.result(StringIO(val))
-
+        for key in valid_order:
+            url = "%s/%s/%s" % (my_seed, my_ver, key)
+            mock_request(url, headers=my_headers, timeout=None)
+            resp = valid.get(key)
+            self.mocker.result(url_helper.UrlResponse(200, resp))
         self.mocker.replay()
 
-        (userdata, metadata) = read_maas_seed_url(my_seed,
+        (userdata, metadata) = DataSourceMAAS.read_maas_seed_url(my_seed,
             header_cb=my_headers_cb, version=my_ver)
 
         self.assertEqual("foodata", userdata)

From 5f586faf9898e9f24a23feb6a60eb098d60b5df5 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 19:46:16 -0700
Subject: [PATCH 291/434] Updated so that the locale that is being written out
 currently in 'cc_locale' now will be done by the distro classes (since it's
 not the same for rhel and ubuntu).

Also remove the template, since it will just be created by the ubuntu distro class (it's just one line).
---
 cloudinit/config/cc_locale.py | 25 ++-----------------------
 cloudinit/distros/__init__.py |  4 ++++
 cloudinit/distros/rhel.py     | 31 +++++++++++++++++++++++++++++++
 cloudinit/distros/ubuntu.py   | 11 +++++++++++
 templates/default-locale.tmpl |  1 -
 5 files changed, 48 insertions(+), 24 deletions(-)
 delete mode 100644 templates/default-locale.tmpl

diff --git a/cloudinit/config/cc_locale.py b/cloudinit/config/cc_locale.py
index 3fb4c5d9..6feaae9d 100644
--- a/cloudinit/config/cc_locale.py
+++ b/cloudinit/config/cc_locale.py
@@ -18,41 +18,20 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import os
-
-from cloudinit import templater
 from cloudinit import util
 
 
-def apply_locale(locale, cfgfile, cloud, log):
-    # TODO this command might not work on RH...
-    if os.path.exists('/usr/sbin/locale-gen'):
-        util.subp(['locale-gen', locale], capture=False)
-    if os.path.exists('/usr/sbin/update-locale'):
-        util.subp(['update-locale', locale], capture=False)
-    if not cfgfile:
-        return
-    template_fn = cloud.get_template_filename('default-locale')
-    if not template_fn:
-        log.warn("No template filename found to write to %s", cfgfile)
-    else:
-        templater.render_to_file(template_fn, cfgfile, {'locale': locale})
-
-
 def handle(name, cfg, cloud, log, args):
     if len(args) != 0:
         locale = args[0]
     else:
         locale = util.get_cfg_option_str(cfg, "locale", cloud.get_locale())
 
-    locale_cfgfile = util.get_cfg_option_str(cfg, "locale_configfile",
-                                             "/etc/default/locale")
-
     if not locale:
         log.debug(("Skipping module named %s, "
                    "no 'locale' configuration found"), name)
         return
 
     log.debug("Setting locale to %s", locale)
-
-    apply_locale(locale, locale_cfgfile, cloud, log)
+    locale_cfgfile = util.get_cfg_option_str(cfg, "locale_configfile")
+    cloud.distro.apply_locale(locale, locale_cfgfile)
diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index f9a97da7..c324ddf6 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -82,6 +82,10 @@ class Distro(object):
             return self._interface_action('up')
         return False
 
+    @abc.abstractmethod
+    def apply_locale(self, locale, out_fn=None):
+        raise NotImplementedError()
+
     @abc.abstractmethod
     def set_timezone(self, tz):
         raise NotImplementedError()
diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index 5cbefa6e..df63d559 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -30,6 +30,10 @@ LOG = logging.getLogger(__name__)
 
 NETWORK_FN_TPL = '/etc/sysconfig/network-scripts/ifcfg-%s'
 
+# See: http://tiny.cc/6r99fw
+# For what alot of these files that are being written
+# are and the format of them
+
 
 class Distro(distros.Distro):
 
@@ -83,6 +87,33 @@ class Distro(distros.Distro):
             LOG.debug("Setting hostname to %s", hostname)
             util.subp(['hostname', hostname])
 
+    def apply_locale(self, locale, out_fn=None):
+        if not out_fn:
+            out_fn = self._paths.join(False, '/etc/sysconfig/i18n')
+        ro_fn = self._paths.join(True, '/etc/sysconfig/i18n')
+        # Update the 'LANG' if it exists instead of appending
+        old_contents = self._read_conf(ro_fn)
+        adjusted = False
+        new_contents = []
+        for entry in old_contents:
+            if not entry:
+                continue
+            if len(entry) == 1:
+                new_contents.append(entry[0])
+                continue
+            (cmd, args) = entry
+            cmd_c = cmd.strip().lower()
+            if cmd_c == 'lang':
+                args = "%s" % (locale)
+                adjusted = True
+            new_contents.append("=".join([cmd, args]))
+        # Guess not found, append it
+        if not adjusted:
+            new_contents.append("# Added by cloud-init")
+            new_contents.append('LANG="%s"' % (locale))
+        contents = "\n".join(new_contents)
+        util.write_file(out_fn, contents, 0644)
+
     def _write_hostname(self, hostname, out_fn):
         old_contents = []
         if os.path.isfile(out_fn):
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index 15af2e7f..e8b95374 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -41,6 +41,17 @@ class Distro(distros.Distro):
         # should only happen say once per instance...)
         self._runner = helpers.Runners(paths)
 
+    def apply_locale(self, locale, out_fn=None):
+        if not out_fn:
+            out_fn = self._paths.join(False, '/etc/default/locale')
+        util.subp(['locale-gen', locale], capture=False)
+        util.subp(['update-locale', locale], capture=False)
+        contents = [
+            "# Created by cloud-init",
+            'LANG="%s"' % (locale),
+        ]
+        util.write_file(out_fn, "\n".join(contents))
+
     def install_packages(self, pkglist):
         self._update_package_sources()
         self.package_command('install', pkglist)
diff --git a/templates/default-locale.tmpl b/templates/default-locale.tmpl
deleted file mode 100644
index 5ee7e454..00000000
--- a/templates/default-locale.tmpl
+++ /dev/null
@@ -1 +0,0 @@
-LANG="{{locale}}"

From a3514b63d6557ac587a36d8cb8f8dcd965896194 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 19:47:27 -0700
Subject: [PATCH 292/434] 1. Update the comment about fstab to just point to
 'man fstab' 2. Update the mount point adding of '/' to just add it in one
 place if it does not already exist

---
 cloudinit/util.py | 13 ++++++++-----
 1 file changed, 8 insertions(+), 5 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index f0a65fa3..3aa4e462 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -1100,7 +1100,7 @@ def mounts():
         # Go through mounts to see what is already mounted
         mount_locs = load_file("/proc/mounts").splitlines()
         for mpline in mount_locs:
-            # Format at: http://linux.die.net/man/5/fstab
+            # Format at: man fstab
             try:
                 (dev, mp, fstype, opts, _freq, _passno) = mpline.split()
             except:
@@ -1129,7 +1129,7 @@ def mount_cb(device, callback, data=None, rw=False, mtype=None, sync=True):
     with tempdir() as tmpd:
         umount = False
         if device in mounted:
-            mountpoint = "%s/" % mounted[device]['mountpoint']
+            mountpoint = mounted[device]['mountpoint']
         else:
             try:
                 mountcmd = ['mount']
@@ -1140,7 +1140,7 @@ def mount_cb(device, callback, data=None, rw=False, mtype=None, sync=True):
                     mountopts.append('ro')
                 if sync:
                     # This seems like the safe approach to do
-                    # (where this is on by default)
+                    # (ie where this is on by default)
                     mountopts.append("sync")
                 if mountopts:
                     mountcmd.extend(["-o", ",".join(mountopts)])
@@ -1149,12 +1149,15 @@ def mount_cb(device, callback, data=None, rw=False, mtype=None, sync=True):
                 mountcmd.append(device)
                 mountcmd.append(tmpd)
                 subp(mountcmd)
-                umount = tmpd
+                umount = tmpd  # This forces it to be unmounted (when set)
+                mountpoint = tmpd
             except (IOError, OSError) as exc:
                 raise MountFailedError(("Failed mounting %s "
                                         "to %s due to: %s") %
                                        (device, tmpd, exc))
-            mountpoint = "%s/" % tmpd
+        # Be nice and ensure it ends with a slash
+        if not mountpoint.endswith("/"):
+            mountpoint += "/"
         with unmounter(umount):
             if data is None:
                 ret = callback(mountpoint)

From 5edb13be9545ce109247e68935f082a014c0cda7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 19:48:06 -0700
Subject: [PATCH 293/434] Comment cleanups and remove unneeded quotes.

---
 config/cloud.cfg | 13 +++++++------
 1 file changed, 7 insertions(+), 6 deletions(-)

diff --git a/config/cloud.cfg b/config/cloud.cfg
index a87b613d..5dae4047 100644
--- a/config/cloud.cfg
+++ b/config/cloud.cfg
@@ -1,4 +1,4 @@
-# The top level settings are used as transforms
+# The top level settings are used as module
 # and system configuration.
 
 # This user will have its password adjusted
@@ -60,14 +60,15 @@ cloud_final_modules:
  - final-message
 
 # System and/or distro specific settings
+# (not accessible to handlers/transforms)
 system_info:
    # This will affect which distro class gets used
    distro: ubuntu
    # Other config here will be given to the distro class and/or path classes
    paths:
-      cloud_dir: "/var/lib/cloud/"
-      templates_dir: "/etc/cloud/templates/"
-      upstart_dir: "/etc/init/"
-   package_mirror: "http://archive.ubuntu.com/ubuntu"
-   availability_zone_template: "http://%(zone)s.ec2.archive.ubuntu.com/ubuntu/"
+      cloud_dir: /var/lib/cloud/
+      templates_dir: /etc/cloud/templates/
+      upstart_dir: /etc/init/
+   package_mirror: http://archive.ubuntu.com/ubuntu
+   availability_zone_template: http://%(zone)s.ec2.archive.ubuntu.com/ubuntu/
    ssh_svcname: ssh

From 78a6e2f55b66dfa685a1c1e49e248d5d0d7ba873 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 20:14:04 -0700
Subject: [PATCH 294/434] 1. Update comment about ipath returning None when no
 datasource is active 2. Fix pylint warning on set method of config parser.

---
 cloudinit/helpers.py | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 6751f4a5..7a2ac6b8 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -286,7 +286,7 @@ class Paths(object):
             cpath = os.path.join(cpath, add_on)
         return cpath
 
-    # get_ipath : get the instance path for a name in pathmap
+    # _get_ipath : get the instance path for a name in pathmap
     # (/var/lib/cloud/instances/<instance>/<name>)
     def _get_ipath(self, name=None):
         if not self.datasource:
@@ -302,6 +302,7 @@ class Paths(object):
 
     # get_ipath : get the instance path for a name in pathmap
     # (/var/lib/cloud/instances/<instance>/<name>)
+    # returns None + warns if no active datasource....
     def get_ipath(self, name=None):
         ipath = self._get_ipath(name)
         if not ipath:
@@ -337,7 +338,7 @@ class DefaultingConfigParser(RawConfigParser):
             pass
         return value
 
-    def set(self, section, option, value):
+    def set(self, section, option, value=None):
         if not self.has_section(section) and section.lower() != 'default':
             self.add_section(section)
         RawConfigParser.set(self, section, option, value)

From 38d516f2ec788fb0d0d2e5274e46dee9ed165923 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 20:14:50 -0700
Subject: [PATCH 295/434] 1. Go through a single protected get ipath method
 that will throw if there    is not an active datasource (ie the user has done
 an out of order call to    a function that needs the datasource to exist) 2.
 Add in a '_get_instance_subdirs' method that can be over-ridden    in the
 future if more subdirs are needed.

---
 cloudinit/stages.py | 26 ++++++++++++++++++++------
 1 file changed, 20 insertions(+), 6 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 9f28c2e8..25f13fd4 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -234,15 +234,29 @@ class Init(object):
             self.paths.datasource = ds
         return ds
 
+    def _get_instance_subdirs(self):
+        return ['handlers', 'scripts', 'sems']
+
+    def _get_ipath(self, subname=None):
+        # Force a check to see if anything
+        # actually comes back, if not
+        # then a datasource has not been assigned...
+        instance_dir = self.paths.get_ipath(subname)
+        if not instance_dir:
+            raise RuntimeError(("No instance directory is available."
+                                " Has a datasource been fetched??"))
+        return instance_dir
+
     def _reflect_cur_instance(self):
-        # Ensure we are hooked into the right symlink for the current instance
-        idir = self.paths.get_ipath()
+        # Remove the old symlink and attach a new one so
+        # that further reads/writes connect into the right location
+        idir = self._get_ipath()
         util.del_file(self.paths.instance_link)
         util.sym_link(idir, self.paths.instance_link)
 
         # Ensures these dirs exist
         dir_list = []
-        for d in ["handlers", "scripts", "sem"]:
+        for d in self._get_instance_subdirs():
             dir_list.append(os.path.join(idir, d))
         util.ensure_dirs(dir_list)
 
@@ -297,9 +311,9 @@ class Init(object):
 
     def _store_userdata(self):
         raw_ud = "%s" % (self.datasource.get_userdata_raw())
-        util.write_file(self.paths.get_ipath('userdata_raw'), raw_ud, 0600)
+        util.write_file(self._get_ipath('userdata_raw'), raw_ud, 0600)
         processed_ud = "%s" % (self.datasource.get_userdata())
-        util.write_file(self.paths.get_ipath('userdata'), processed_ud, 0600)
+        util.write_file(self._get_ipath('userdata'), processed_ud, 0600)
 
     def _default_userdata_handlers(self):
         opts = {
@@ -317,7 +331,7 @@ class Init(object):
 
     def consume(self, frequency=PER_INSTANCE):
         cdir = self.paths.get_cpath("handlers")
-        idir = self.paths.get_ipath("handlers")
+        idir = self._get_ipath("handlers")
 
         # Add the path to the plugins dir to the top of our list for import
         # instance dir should be read before cloud-dir

From 8f4786a3ba0d7ca8e9bd80f116ffd7ee5f7c255b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 21 Jun 2012 20:28:21 -0700
Subject: [PATCH 296/434] Use RuntimeError subclass instead of top level
 Exception

---
 cloudinit/config/cc_landscape.py        | 8 ++++----
 cloudinit/config/cc_update_etc_hosts.py | 4 ++--
 cloudinit/distros/rhel.py               | 4 ++--
 cloudinit/distros/ubuntu.py             | 4 ++--
 4 files changed, 10 insertions(+), 10 deletions(-)

diff --git a/cloudinit/config/cc_landscape.py b/cloudinit/config/cc_landscape.py
index d45c9203..99a958b0 100644
--- a/cloudinit/config/cc_landscape.py
+++ b/cloudinit/config/cc_landscape.py
@@ -61,10 +61,10 @@ def handle(name, cfg, cloud, log, _args):
 
     ls_cloudcfg = cfg.get("landscape", {})
 
-    if not isinstance(ls_cloudcfg, dict):
-        raise Exception(("'landscape' key existed in config,"
-                         " but not a dictionary type,"
-                         " is a %s instead"), util.obj_name(ls_cloudcfg))
+    if not isinstance(ls_cloudcfg, (dict)):
+        raise RuntimeError(("'landscape' key existed in config,"
+                            " but not a dictionary type,"
+                            " is a %s instead"), util.obj_name(ls_cloudcfg))
 
     merge_data = [
         LSC_BUILTIN_CFG,
diff --git a/cloudinit/config/cc_update_etc_hosts.py b/cloudinit/config/cc_update_etc_hosts.py
index 6820ac4f..c148b12e 100644
--- a/cloudinit/config/cc_update_etc_hosts.py
+++ b/cloudinit/config/cc_update_etc_hosts.py
@@ -39,8 +39,8 @@ def handle(name, cfg, cloud, log, _args):
         distro_n = cloud.distro.name
         tpl_fn_name = cloud.get_template_filename("hosts.%s" % (distro_n))
         if not tpl_fn_name:
-            raise Exception(("No hosts template could be"
-                             " found for distro %s") % (distro_n))
+            raise RuntimeError(("No hosts template could be"
+                                " found for distro %s") % (distro_n))
 
         out_fn = cloud.paths.join(False, '/etc/hosts')
         templater.render_to_file(tpl_fn_name, out_fn,
diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index df63d559..dff76075 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -208,8 +208,8 @@ class Distro(distros.Distro):
     def set_timezone(self, tz):
         tz_file = os.path.join("/usr/share/zoneinfo", tz)
         if not os.path.isfile(tz_file):
-            raise Exception(("Invalid timezone %s,"
-                             " no file found at %s") % (tz, tz_file))
+            raise RuntimeError(("Invalid timezone %s,"
+                                " no file found at %s") % (tz, tz_file))
         # Adjust the sysconfig clock zone setting
         read_fn = self._paths.join(True, "/etc/sysconfig/clock")
         old_contents = self._read_conf(read_fn)
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index e8b95374..b23945d8 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -121,8 +121,8 @@ class Distro(distros.Distro):
     def set_timezone(self, tz):
         tz_file = os.path.join("/usr/share/zoneinfo", tz)
         if not os.path.isfile(tz_file):
-            raise Exception(("Invalid timezone %s,"
-                             " no file found at %s") % (tz, tz_file))
+            raise RuntimeError(("Invalid timezone %s,"
+                                " no file found at %s") % (tz, tz_file))
         tz_lines = [
             "# Created by cloud-init",
             str(tz),

From 017529db0b914b39084cd11971f7c873b07a0a9a Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Thu, 21 Jun 2012 23:35:07 -0700
Subject: [PATCH 297/434] Fixup python selinux guards, only try to restore
 after we check if it's useful to restore, fix test to work with selinux
 enabled systems

---
 cloudinit/stages.py          | 20 ++++++++++++--------
 cloudinit/util.py            | 26 +++++++++++++++++---------
 tests/unittests/test_util.py | 13 ++++++-------
 3 files changed, 35 insertions(+), 24 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 25f13fd4..cf5e6924 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -221,11 +221,12 @@ class Init(object):
             (cfg_list, pkg_list) = self._get_datasources()
             # Deep copy so that user-data handlers can not modify
             # (which will affect user-data handlers down the line...)
-            sys_cfg = copy.deepcopy(self.cfg)
-            ds_deps = copy.deepcopy(self.ds_deps)
-            (ds, dsname) = sources.find_source(sys_cfg, self.distro,
+            (ds, dsname) = sources.find_source(self.cfg,
+                                               self.distro,
                                                self.paths,
-                                               ds_deps, cfg_list, pkg_list)
+                                               copy.deepcopy(self.ds_deps),
+                                               cfg_list,
+                                               pkg_list)
             LOG.debug("Loaded datasource %s - %s", dsname, ds)
         if ds:
             self.datasource = ds
@@ -408,7 +409,7 @@ class Modules(object):
     def __init__(self, init, cfg_files=None):
         self.datasource = init.datasource
         self.cfg_files = cfg_files
-        self.base_cfg = copy.deepcopy(init.cfg)
+        self.base_cfg = init.cfg
         self.init = init
         # Created on first use
         self._cached_cfg = None
@@ -419,7 +420,8 @@ class Modules(object):
         if self._cached_cfg is None:
             self._cached_cfg = self._get_config()
             LOG.debug("Loading 'module' config %s", self._cached_cfg)
-        return self._cached_cfg
+        # Only give out a copy so that others can't modify this...
+        return copy.deepcopy(self._cached_cfg)
 
     def _get_config(self):
         t_cfgs = []
@@ -531,9 +533,11 @@ class Modules(object):
                     LOG.warn(("Module %s is verified on %s distros"
                               " but not on %s distro. It may or may not work"
                               " correctly."), name, worked_distros, d_name)
-                # Deep copy the config so that modules can't alter it
                 # Use the configs logger and not our own
-                func_args = [name, copy.deepcopy(self.cfg),
+                # TODO: possibly check the module
+                # for having a LOG attr and just give it back
+                # its own logger?
+                func_args = [name, self.cfg,
                              cc, config.LOG, args]
                 # Mark it as having started running
                 am_ran += 1
diff --git a/cloudinit/util.py b/cloudinit/util.py
index 3aa4e462..332b8379 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -35,6 +35,7 @@ import pwd
 import random
 import shutil
 import socket
+import stat
 import string  # pylint: disable=W0402
 import subprocess
 import sys
@@ -132,14 +133,24 @@ class SeLinuxGuard(object):
             self.enabled = True
 
     def __enter__(self):
-        # TODO: Should we try to engage selinux here??
         return self.enabled
 
     def __exit__(self, excp_type, excp_value, excp_traceback):
         if self.enabled:
-            LOG.debug("Restoring selinux mode for %s (recursive=%s)",
-                      self.path, self.recursive)
-            selinux.restorecon(self.path, recursive=self.recursive)
+            path = os.path.realpath(os.path.expanduser(self.path))
+            do_restore = False
+            try:
+                # See if even worth restoring??
+                stats = os.lstat(path)
+                if stat.ST_MODE in stats:
+                    selinux.matchpathcon(path, stats[stat.ST_MODE])
+                    do_restore = True
+            except OSError:
+                pass
+            if do_restore:
+                LOG.debug("Restoring selinux mode for %s (recursive=%s)",
+                          path, self.recursive)
+                selinux.restorecon(path, recursive=self.recursive)
 
 
 class MountFailedError(Exception):
@@ -1067,8 +1078,7 @@ def ensure_dir(path, mode=None):
     if not os.path.isdir(path):
         # Make the dir and adjust the mode
         LOG.debug("Ensuring directory exists at path %s", path)
-        # TODO: check if guard needed??
-        with SeLinuxGuard(path=os.path.dirname(path)):
+        with SeLinuxGuard(os.path.dirname(path), recursive=True):
             os.makedirs(path)
         chmod(path, mode)
     else:
@@ -1222,8 +1232,7 @@ def chmod(path, mode):
     if path and real_mode:
         LOG.debug("Adjusting the permissions of %s (perms=%o)",
                  path, real_mode)
-        # TODO: check if guard needed??
-        with SeLinuxGuard(path=path):
+        with SeLinuxGuard(path):
             os.chmod(path, real_mode)
 
 
@@ -1239,7 +1248,6 @@ def write_file(filename, content, mode=0644, omode="wb"):
     """
     ensure_dir(os.path.dirname(filename))
     LOG.debug("Writing to %s - %s, %s bytes", filename, omode, len(content))
-    # TODO: check if guard needed??
     with SeLinuxGuard(path=filename):
         with open(filename, omode) as fh:
             fh.write(content)
diff --git a/tests/unittests/test_util.py b/tests/unittests/test_util.py
index ba565b29..3be6e186 100644
--- a/tests/unittests/test_util.py
+++ b/tests/unittests/test_util.py
@@ -71,7 +71,7 @@ class TestGetCfgOptionListOrStr(TestCase):
         """None is returned if key is not found and no default given."""
         config = {}
         result = util.get_cfg_option_list(config, "key")
-        self.assertIsNone(result)
+        self.assertEqual(None, result)
 
     def test_not_found_with_default(self):
         """Default is returned if key is not found."""
@@ -166,14 +166,13 @@ class TestWriteFile(MockerTestCase):
                 "selinux.restorecon", passthrough=False)
             mock_is_selinux_enabled = self.mocker.replace(
                 "selinux.is_selinux_enabled", passthrough=False)
-            mock_is_selinux_enabled.result(True)
-            mock_restorecon(path)
+            mock_is_selinux_enabled()
+            self.mocker.result(True)
+            mock_restorecon("/etc/hosts", recursive=False)
+            self.mocker.result(True)
             self.mocker.replay()
-            old = util.HAVE_LIBSELINUX
-            util.HAVE_LIBSELINUX = True
-            with util.SeLinuxGuard(self.tmp) as is_on:
+            with util.SeLinuxGuard("/etc/hosts") as is_on:
                 self.assertTrue(is_on)
-            util.HAVE_LIBSELINUX = old
         except ImportError:
             pass
 

From 64db95904d61df834dc2ebb605e5fa753c14eb4b Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Thu, 21 Jun 2012 23:57:52 -0700
Subject: [PATCH 298/434] Ensure that nothing was run by checking the total
 count

---
 bin/cloud-init | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index d193272e..aff8f967 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -92,7 +92,8 @@ def extract_fns(args):
 def run_module_section(mods, action_name, section):
     full_section_name = MOD_SECTION_TPL % (section)
     (ran_am, failures) = mods.run_section(full_section_name)
-    if not ran_am:
+    total_attempted = ran_am + len(failures)
+    if total_attempted == 0:
         msg = ("No '%s' modules to run"
                " under section '%s'") % (action_name, full_section_name)
         sys.stderr.write("%s\n" % (msg))

From ca046a8e33d27cc6111e7602988ddc3d5a9dce8a Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 22 Jun 2012 00:04:07 -0700
Subject: [PATCH 299/434] 1. Return which modules ran from the run module
 function 2. Use that list in the main binary & adjust related comparisons

---
 bin/cloud-init      | 16 +++++++++-------
 cloudinit/stages.py | 10 ++++++----
 2 files changed, 15 insertions(+), 11 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index aff8f967..68c7ba76 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -91,8 +91,8 @@ def extract_fns(args):
 
 def run_module_section(mods, action_name, section):
     full_section_name = MOD_SECTION_TPL % (section)
-    (ran_am, failures) = mods.run_section(full_section_name)
-    total_attempted = ran_am + len(failures)
+    (which_ran, failures) = mods.run_section(full_section_name)
+    total_attempted = len(which_ran) + len(failures)
     if total_attempted == 0:
         msg = ("No '%s' modules to run"
                " under section '%s'") % (action_name, full_section_name)
@@ -100,7 +100,8 @@ def run_module_section(mods, action_name, section):
         LOG.debug(msg)
         return 0
     else:
-        LOG.debug("Ran %s modules with %s failures", ran_am, len(failures))
+        LOG.debug("Ran %s modules with %s failures",
+                  len(which_ran), len(failures))
         return len(failures)
 
 
@@ -316,16 +317,17 @@ def main_single(name, args):
         logging.resetLogging()
     logging.setupLogging(mods.cfg)
     # Stage 4
-    (run_am, failures) = mods.run_single(mod_name,
-                                         mod_args,
-                                         mod_freq)
+    (which_ran, failures) = mods.run_single(mod_name,
+                                            mod_args,
+                                            mod_freq)
     if failures:
         LOG.warn("Ran %s but it failed!", mod_name)
         return 1
-    elif run_am == 0:
+    elif not which_ran:
         LOG.warn("Did not run %s, does it exist?", mod_name)
         return 1
     else:
+        # Guess it worked
         return 0
 
 
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index cf5e6924..9481db83 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -517,10 +517,12 @@ class Modules(object):
         return mostly_mods
 
     def _run_modules(self, mostly_mods):
-        failures = []
         d_name = self.init.distro.name
         cc = self.init.cloudify()
-        am_ran = 0
+        # Return which ones ran
+        # and which ones failed + the exception of why it failed
+        failures = []
+        which_ran = []
         for (mod, name, freq, args) in mostly_mods:
             try:
                 # Try the modules frequency, otherwise fallback to a known one
@@ -540,14 +542,14 @@ class Modules(object):
                 func_args = [name, self.cfg,
                              cc, config.LOG, args]
                 # Mark it as having started running
-                am_ran += 1
+                which_ran.append(name)
                 # This name will affect the semaphore name created
                 run_name = "config-%s" % (name)
                 cc.run(run_name, mod.handle, func_args, freq=freq)
             except Exception as e:
                 util.logexc(LOG, "Running %s (%s) failed", name, mod)
                 failures.append((name, e))
-        return (am_ran, failures)
+        return (which_ran, failures)
 
     def run_single(self, mod_name, args=None, freq=None):
         # Form the users module 'specs'

From da3fc8992d8be83b5c95e974ecd3a569150b5dfe Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 22 Jun 2012 08:47:49 -0700
Subject: [PATCH 300/434] Add comment that configobj is used for more than just
 old configs.

---
 Requires | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/Requires b/Requires
index 5a350900..bd2db00c 100644
--- a/Requires
+++ b/Requires
@@ -18,6 +18,10 @@ oauth>=1.0
 boto>=2.4
 
 # This is only needed if you have old style configurations
+# and any places where we need to support configs in a manner
+# that the built-in config parser is not sufficent (ie
+# when we need to preserve comments, or do not have a top-level
+# section)...
 configobj>=4.6
 
 # All new style configurations are in the yaml format

From 889125652632e0f0d60a5a36b0a3b5294451b20b Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 22 Jun 2012 08:48:18 -0700
Subject: [PATCH 301/434] 1. Use configobj instead of configparser   a. This
 allows us to not have to add a fake section in   b. It will also preserve
 the files initial comments 2. Adjust how the new sections are being added and
    values are being written due to this change

---
 cloudinit/config/cc_mcollective.py | 65 +++++++++++++-----------------
 1 file changed, 29 insertions(+), 36 deletions(-)

diff --git a/cloudinit/config/cc_mcollective.py b/cloudinit/config/cc_mcollective.py
index 36a4cade..2acdbc6f 100644
--- a/cloudinit/config/cc_mcollective.py
+++ b/cloudinit/config/cc_mcollective.py
@@ -21,7 +21,10 @@
 
 from StringIO import StringIO
 
-from cloudinit import helpers
+# Used since this can maintain comments
+# and doesn't need a top level section
+from configobj import ConfigObj
+
 from cloudinit import util
 
 PUBCERT_FILE = "/etc/mcollective/ssl/server-public.pem"
@@ -43,54 +46,44 @@ def handle(name, cfg, cloud, log, _args):
 
     # ... and then update the mcollective configuration
     if 'conf' in mcollective_cfg:
-        # Create object for reading server.cfg values
-        mcollective_config = helpers.DefaultingConfigParser()
-        # Read server.cfg values from original file in order to be able to mix
-        # the rest up
+        # Read server.cfg values from the
+        # original file in order to be able to mix the rest up
         server_cfg_fn = cloud.paths.join(True, '/etc/mcollective/server.cfg')
-        old_contents = util.load_file(server_cfg_fn)
-        # It doesn't contain any sections so just add one temporarily
-        # Use a hash id based off the contents,
-        # just incase of conflicts... (try to not have any...)
-        # This is so that an error won't occur when reading (and no
-        # sections exist in the file)
-        section_tpl = "[nullsection_%s]"
-        attempts = 0
-        section_head = section_tpl % (attempts)
-        while old_contents.find(section_head) != -1:
-            attempts += 1
-            section_head = section_tpl % (attempts)
-        sectioned_contents = "%s\n%s" % (section_head, old_contents)
-        mcollective_config.readfp(StringIO(sectioned_contents),
-                                  filename=server_cfg_fn)
+        mcollective_config = ConfigObj(server_cfg_fn)
+        # See: http://tiny.cc/jh9agw
         for (cfg_name, cfg) in mcollective_cfg['conf'].iteritems():
             if cfg_name == 'public-cert':
                 pubcert_fn = cloud.paths.join(True, PUBCERT_FILE)
                 util.write_file(pubcert_fn, cfg, mode=0644)
-                mcollective_config.set(cfg_name,
-                    'plugin.ssl_server_public', pubcert_fn)
-                mcollective_config.set(cfg_name, 'securityprovider', 'ssl')
+                mcollective_config['plugin.ssl_server_public'] = pubcert_fn
+                mcollective_config['securityprovider'] = 'ssl'
             elif cfg_name == 'private-cert':
                 pricert_fn = cloud.paths.join(True, PRICERT_FILE)
                 util.write_file(pricert_fn, cfg, mode=0600)
-                mcollective_config.set(cfg_name,
-                    'plugin.ssl_server_private', pricert_fn)
-                mcollective_config.set(cfg_name, 'securityprovider', 'ssl')
+                mcollective_config['plugin.ssl_server_private'] = pricert_fn
+                mcollective_config['securityprovider'] = 'ssl'
             else:
-                # Iterate throug the config items, we'll use ConfigParser.set
-                # to overwrite or create new items as needed
-                for (o, v) in cfg.iteritems():
-                    mcollective_config.set(cfg_name, o, v)
+                if isinstance(cfg, (basestring, str)):
+                    # Just set it in the 'main' section
+                    mcollective_config[cfg_name] = cfg
+                elif isinstance(cfg, (dict)):
+                    # Iterate throug the config items, create a section
+                    # if it is needed and then add/or create items as needed
+                    if cfg_name not in mcollective_config.sections:
+                        mcollective_config[cfg_name] = {}
+                    for (o, v) in cfg.iteritems():
+                        mcollective_config[cfg_name][o] = v
+                else:
+                    # Otherwise just try to convert it to a string
+                    mcollective_config[cfg_name] = str(cfg)
         # We got all our config as wanted we'll rename
         # the previous server.cfg and create our new one
         old_fn = cloud.paths.join(False, '/etc/mcollective/server.cfg.old')
         util.rename(server_cfg_fn, old_fn)
-        # Now we got the whole file, write to disk except the section
-        # we added so that config parser won't error out when trying to read.
-        # Note below, that we've just used ConfigParser because it generally
-        # works.  Below, we remove the initial 'nullsection' header.
-        contents = mcollective_config.stringify()
-        contents = contents.replace("%s\n" % (section_head), "")
+        # Now we got the whole file, write to disk...
+        contents = StringIO()
+        mcollective_config.write(contents)
+        contents = contents.getvalue()
         server_cfg_rw = cloud.paths.join(False, '/etc/mcollective/server.cfg')
         util.write_file(server_cfg_rw, contents, mode=0644)
 

From 332cd4c126e0ca8b9f2d356fb14348ac9c91429c Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 22 Jun 2012 08:50:19 -0700
Subject: [PATCH 302/434] Configobj should be a requirement now, and not
 optional, so there is no need to check the import for errors.

---
 cloudinit/config/cc_landscape.py | 11 ++---------
 1 file changed, 2 insertions(+), 9 deletions(-)

diff --git a/cloudinit/config/cc_landscape.py b/cloudinit/config/cc_landscape.py
index 99a958b0..906a6ff7 100644
--- a/cloudinit/config/cc_landscape.py
+++ b/cloudinit/config/cc_landscape.py
@@ -22,10 +22,7 @@ import os
 
 from StringIO import StringIO
 
-try:
-    from configobj import ConfigObj
-except ImportError:
-    ConfigObj = None
+from configobj import ConfigObj
 
 from cloudinit import util
 
@@ -48,16 +45,12 @@ LSC_BUILTIN_CFG = {
 }
 
 
-def handle(name, cfg, cloud, log, _args):
+def handle(_name, cfg, cloud, log, _args):
     """
     Basically turn a top level 'landscape' entry with a 'client' dict
     and render it to ConfigObj format under '[client]' section in
     /etc/landscape/client.conf
     """
-    if not ConfigObj:
-        log.warn(("'ConfigObj' support not available,"
-                  " running module %s disabled"), name)
-        return
 
     ls_cloudcfg = cfg.get("landscape", {})
 

From 20861fae0d60c6d48afccc95228192dca176a4e7 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 22 Jun 2012 08:50:51 -0700
Subject: [PATCH 303/434] ConfigObj is a requirement now, so no need to see if
 the import worked or failed.

---
 cloudinit/stages.py | 10 ++--------
 1 file changed, 2 insertions(+), 8 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 9481db83..595f7aea 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -26,10 +26,7 @@ import copy
 import os
 import sys
 
-try:
-    from configobj import ConfigObj
-except ImportError:
-    ConfigObj = None
+from configobj import ConfigObj
 
 from cloudinit.settings import (OLD_CLOUD_CONFIG)
 from cloudinit.settings import (PER_INSTANCE, FREQUENCIES)
@@ -68,10 +65,7 @@ class Init(object):
         self.datasource = None
 
     def _read_cfg_old(self):
-        # Support reading the old ConfigObj format file and merging
-        # it into the yaml dictionary
-        if not ConfigObj:
-            return {}
+        # Support reading the old ConfigObj format file
         old_cfg = ConfigObj(OLD_CLOUD_CONFIG)
         return dict(old_cfg)
 

From 07a0393106bdc3cd25a84c29f8410b297ac0f213 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 12:35:36 -0700
Subject: [PATCH 304/434] Use configobj support for now to keep the comments
 and other k/v pairs that may already exist in these files

---
 cloudinit/distros/rhel.py | 160 +++++++++++---------------------------
 1 file changed, 45 insertions(+), 115 deletions(-)

diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index dff76075..4ed9d43f 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -34,6 +34,10 @@ NETWORK_FN_TPL = '/etc/sysconfig/network-scripts/ifcfg-%s'
 # For what alot of these files that are being written
 # are and the format of them
 
+# This library is used to parse/write
+# out the various sysconfig files edited
+from configobj import ConfigObj
+
 
 class Distro(distros.Distro):
 
@@ -50,34 +54,38 @@ class Distro(distros.Distro):
                   settings, entries)
         # Make the intermediate format as the rhel format...
         for (dev, info) in entries.iteritems():
-            lines = []
-            lines.append("DEVICE=%s" % (dev))
+            net_fn = NETWORK_FN_TPL % (dev)
+            net_ro_fn = self._paths.join(True, net_fn)
+            (prev_exist, net_cfg) = self._read_conf(net_ro_fn)
+            net_cfg['DEVICE'] = dev
             boot_proto = info.get('bootproto')
             if boot_proto:
-                lines.append("BOOTPROTO=%s" % (boot_proto))
+                net_cfg['BOOTPROTO'] = boot_proto
             net_mask = info.get('netmask')
             if net_mask:
-                lines.append("NETMASK=%s" % (net_mask))
+                net_cfg["NETMASK"] = net_mask
             addr = info.get('address')
             if addr:
-                lines.append("IPADDR=%s" % (addr))
+                net_cfg["IPADDR"] = addr
             if info.get('auto'):
-                lines.append("ONBOOT=yes")
+                net_cfg['ONBOOT'] = 'yes'
             else:
-                lines.append("ONBOOT=no")
+                net_cfg['ONBOOT'] = 'no'
             gtway = info.get('gateway')
             if gtway:
-                lines.append("GATEWAY=%s" % (gtway))
+                net_cfg["GATEWAY"] = gtway
             bcast = info.get('broadcast')
             if bcast:
-                lines.append("BROADCAST=%s" % (bcast))
+                net_cfg["BROADCAST"] = bcast
             mac_addr = info.get('hwaddress')
             if mac_addr:
-                lines.append("MACADDR=%s" % (mac_addr))
-            lines.insert(0, '# Created by cloud-init')
-            contents = "\n".join(lines)
-            net_fn = NETWORK_FN_TPL % (dev)
-            util.write_file(self._paths.join(False, net_fn), contents, 0644)
+                net_cfg["MACADDR"] = mac_addr
+            lines = net_cfg.write()
+            if not prev_exist:
+                lines.insert(0, '# Created by cloud-init')
+            w_contents = "\n".join(lines)
+            net_rw_fn = self._paths.join(False, net_fn)
+            util.write_file(net_rw_fn, w_contents, 0644)
 
     def set_hostname(self, hostname):
         out_fn = self._paths.join(False, '/etc/sysconfig/network')
@@ -91,54 +99,16 @@ class Distro(distros.Distro):
         if not out_fn:
             out_fn = self._paths.join(False, '/etc/sysconfig/i18n')
         ro_fn = self._paths.join(True, '/etc/sysconfig/i18n')
-        # Update the 'LANG' if it exists instead of appending
-        old_contents = self._read_conf(ro_fn)
-        adjusted = False
-        new_contents = []
-        for entry in old_contents:
-            if not entry:
-                continue
-            if len(entry) == 1:
-                new_contents.append(entry[0])
-                continue
-            (cmd, args) = entry
-            cmd_c = cmd.strip().lower()
-            if cmd_c == 'lang':
-                args = "%s" % (locale)
-                adjusted = True
-            new_contents.append("=".join([cmd, args]))
-        # Guess not found, append it
-        if not adjusted:
-            new_contents.append("# Added by cloud-init")
-            new_contents.append('LANG="%s"' % (locale))
-        contents = "\n".join(new_contents)
-        util.write_file(out_fn, contents, 0644)
+        (_exists, contents) = self._read_conf(ro_fn)
+        contents['LANG'] = locale
+        w_contents = "\n".join(contents.write())
+        util.write_file(out_fn, w_contents, 0644)
 
     def _write_hostname(self, hostname, out_fn):
-        old_contents = []
-        if os.path.isfile(out_fn):
-            old_contents = self._read_conf(out_fn)
-        # Update the 'HOSTNAME' if it exists instead of appending
-        new_contents = []
-        adjusted = False
-        for entry in old_contents:
-            if not entry:
-                continue
-            if len(entry) == 1:
-                new_contents.append(entry[0])
-                continue
-            (cmd, args) = entry
-            cmd_c = cmd.strip().lower()
-            if cmd_c == 'hostname':
-                args = "%s" % (hostname)
-                adjusted = True
-            new_contents.append("=".join([cmd, args]))
-        # Guess not found, append it
-        if not adjusted:
-            new_contents.append("# Added by cloud-init")
-            new_contents.append("HOSTNAME=%s" % (hostname))
-        contents = "\n".join(new_contents)
-        util.write_file(out_fn, contents, 0644)
+        (_exists, contents) = self._read_conf(out_fn)
+        contents['HOSTNAME'] = hostname
+        w_contents = "\n".join(contents.write())
+        util.write_file(out_fn, w_contents, 0644)
 
     def update_hostname(self, hostname, prev_file):
         hostname_prev = self._read_hostname(prev_file)
@@ -168,42 +138,20 @@ class Distro(distros.Distro):
             util.subp(['hostname', hostname])
 
     def _read_hostname(self, filename, default=None):
-        contents = self._read_conf(filename)
-        for c in contents:
-            if len(c) != 2:
-                continue
-            (cmd, args) = c
-            cmd_c = cmd.lower().strip()
-            if cmd_c == 'hostname':
-                args_c = args.strip()
-                if args_c:
-                    return args_c
-        return default
+        (_exists, contents) = self._read_conf(filename)
+        if 'HOSTNAME' in contents:
+            return contents['HOSTNAME']
+        else:
+            return default
 
     def _read_conf(self, filename):
-        contents = util.load_file(filename, quiet=True)
-        conf_lines = []
-        for line in contents.splitlines():
-            c_line = line.strip()
-            if not c_line or c_line.startswith("#"):
-                conf_lines.append([line])
-                continue
-            # Handle inline comments
-            c_pos = c_line.find("#")
-            if c_pos != -1:
-                c_line = c_line[0:c_pos].strip()
-            if not c_line:
-                conf_lines.append([line])
-                continue
-            # Format should be CMD=ARG1 ARG2...
-            pieces = c_line.split("=", 1)
-            if not pieces or len(pieces) == 1:
-                conf_lines.append([line])
-                continue
-            (cmd, args) = pieces
-            cmd = cmd.strip()
-            conf_lines.append([cmd, args])
-        return conf_lines
+        exists = False
+        if os.path.isfile(filename):
+            contents = util.load_file(filename).splitlines()
+            exists = True
+        else:
+            contents = []
+        return (exists, ConfigObj(contents))
 
     def set_timezone(self, tz):
         tz_file = os.path.join("/usr/share/zoneinfo", tz)
@@ -212,27 +160,9 @@ class Distro(distros.Distro):
                                 " no file found at %s") % (tz, tz_file))
         # Adjust the sysconfig clock zone setting
         read_fn = self._paths.join(True, "/etc/sysconfig/clock")
-        old_contents = self._read_conf(read_fn)
-        new_contents = []
-        zone_added = False
-        # Update the 'ZONE' if it exists instead of appending
-        for entry in old_contents:
-            if not entry:
-                continue
-            if len(entry) == 1:
-                new_contents.append(entry[0])
-                continue
-            (cmd, args) = entry
-            cmd_c = cmd.lower().strip()
-            if cmd_c == 'zone':
-                args = '"%s"' % (tz)
-                zone_added = True
-            new_contents.append("=".join([cmd, args]))
-        # Guess not found, append it
-        if not zone_added:
-            new_contents.append("# Added by cloud-init")
-            new_contents.append('ZONE="%s"' % (tz))
-        tz_contents = "\n".join(new_contents)
+        (_exists, contents) = self._read_conf(read_fn)
+        contents['ZONE'] = tz
+        tz_contents = "\n".join(contents.write())
         write_fn = self._paths.join(False, "/etc/sysconfig/clock")
         util.write_file(write_fn, tz_contents)
         # This ensures that the correct tz will be used for the system

From 5b2d8db914669f2c451c562fab4bb2bf4a4cd362 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 12:35:51 -0700
Subject: [PATCH 305/434] Remove support for ec2-config

---
 cloudinit/settings.py | 4 ----
 1 file changed, 4 deletions(-)

diff --git a/cloudinit/settings.py b/cloudinit/settings.py
index fac9b862..2083cf60 100644
--- a/cloudinit/settings.py
+++ b/cloudinit/settings.py
@@ -26,10 +26,6 @@ CFG_ENV_NAME = "CLOUD_CFG"
 # This is expected to be a yaml formatted file
 CLOUD_CONFIG = '/etc/cloud/cloud.cfg'
 
-# This legacy format is expected to be readable by
-# configobj, see http://pypi.python.org/pypi/configobj
-OLD_CLOUD_CONFIG = '/etc/ec2-init/ec2-config.cfg'
-
 # What u get if no config is provided
 CFG_BUILTIN = {
     'datasource_list': [

From c53a8553b16563ca67a617c32cfdf0ed4c45cc07 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 12:36:01 -0700
Subject: [PATCH 306/434] Remove support for older ec2 configobj merging.

---
 cloudinit/stages.py | 11 +----------
 1 file changed, 1 insertion(+), 10 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 595f7aea..cfe1c071 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -26,9 +26,6 @@ import copy
 import os
 import sys
 
-from configobj import ConfigObj
-
-from cloudinit.settings import (OLD_CLOUD_CONFIG)
 from cloudinit.settings import (PER_INSTANCE, FREQUENCIES)
 
 from cloudinit import handlers
@@ -64,11 +61,6 @@ class Init(object):
         # Created only when a fetch occurs
         self.datasource = None
 
-    def _read_cfg_old(self):
-        # Support reading the old ConfigObj format file
-        old_cfg = ConfigObj(OLD_CLOUD_CONFIG)
-        return dict(old_cfg)
-
     @property
     def distro(self):
         if not self._distro:
@@ -165,13 +157,12 @@ class Init(object):
                 except:
                     util.logexc(LOG, ("Failed loading of additional"
                                       " configuration from %s"), fn)
-        # Now read in the built-in + base + old
+        # Now read in the built-in + base
         try:
             conf = util.get_base_cfg(builtin=util.get_builtin_cfg())
         except Exception:
             conf = util.get_builtin_cfg()
         i_cfgs.append(conf)
-        i_cfgs.append(self._read_cfg_old())
         return util.mergemanydict(i_cfgs)
 
     def _restore_from_cache(self):

From 275c6363813feef189beb6734b6c0ca326fc03e8 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 12:52:26 -0700
Subject: [PATCH 307/434] 1. Add a ubuntu and fedora subclass of the RH/debian
 root classes 2. Move the ubuntu class to the debian class (since that's really
 what it is)

---
 cloudinit/distros/debian.py | 149 ++++++++++++++++++++++++++++++++++++
 cloudinit/distros/fedora.py |  31 ++++++++
 cloudinit/distros/ubuntu.py | 124 +-----------------------------
 3 files changed, 183 insertions(+), 121 deletions(-)
 create mode 100644 cloudinit/distros/debian.py
 create mode 100644 cloudinit/distros/fedora.py

diff --git a/cloudinit/distros/debian.py b/cloudinit/distros/debian.py
new file mode 100644
index 00000000..b23945d8
--- /dev/null
+++ b/cloudinit/distros/debian.py
@@ -0,0 +1,149 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+import os
+
+from cloudinit import distros
+from cloudinit import helpers
+from cloudinit import log as logging
+from cloudinit import util
+
+from cloudinit.settings import PER_INSTANCE
+
+LOG = logging.getLogger(__name__)
+
+
+class Distro(distros.Distro):
+
+    def __init__(self, name, cfg, paths):
+        distros.Distro.__init__(self, name, cfg, paths)
+        # This will be used to restrict certain
+        # calls from repeatly happening (when they
+        # should only happen say once per instance...)
+        self._runner = helpers.Runners(paths)
+
+    def apply_locale(self, locale, out_fn=None):
+        if not out_fn:
+            out_fn = self._paths.join(False, '/etc/default/locale')
+        util.subp(['locale-gen', locale], capture=False)
+        util.subp(['update-locale', locale], capture=False)
+        contents = [
+            "# Created by cloud-init",
+            'LANG="%s"' % (locale),
+        ]
+        util.write_file(out_fn, "\n".join(contents))
+
+    def install_packages(self, pkglist):
+        self._update_package_sources()
+        self.package_command('install', pkglist)
+
+    def _write_network(self, settings):
+        net_fn = self._paths.join(False, "/etc/network/interfaces")
+        util.write_file(net_fn, settings)
+
+    def set_hostname(self, hostname):
+        out_fn = self._paths.join(False, "/etc/hostname")
+        self._write_hostname(hostname, out_fn)
+        if out_fn == '/etc/hostname':
+            # Only do this if we are running in non-adjusted root mode
+            LOG.debug("Setting hostname to %s", hostname)
+            util.subp(['hostname', hostname])
+
+    def _write_hostname(self, hostname, out_fn):
+        lines = []
+        lines.append("# Created by cloud-init")
+        lines.append(str(hostname))
+        contents = "\n".join(lines)
+        util.write_file(out_fn, contents, 0644)
+
+    def update_hostname(self, hostname, prev_fn):
+        hostname_prev = self._read_hostname(prev_fn)
+        read_fn = self._paths.join(True, "/etc/hostname")
+        hostname_in_etc = self._read_hostname(read_fn)
+        update_files = []
+        if not hostname_prev or hostname_prev != hostname:
+            update_files.append(prev_fn)
+        if (not hostname_in_etc or
+            (hostname_in_etc == hostname_prev and
+             hostname_in_etc != hostname)):
+            write_fn = self._paths.join(False, "/etc/hostname")
+            update_files.append(write_fn)
+        for fn in update_files:
+            try:
+                self._write_hostname(hostname, fn)
+            except:
+                util.logexc(LOG, "Failed to write hostname %s to %s",
+                            hostname, fn)
+        if (hostname_in_etc and hostname_prev and
+            hostname_in_etc != hostname_prev):
+            LOG.debug(("%s differs from /etc/hostname."
+                        " Assuming user maintained hostname."), prev_fn)
+        if "/etc/hostname" in update_files:
+            # Only do this if we are running in non-adjusted root mode
+            LOG.debug("Setting hostname to %s", hostname)
+            util.subp(['hostname', hostname])
+
+    def _read_hostname(self, filename, default=None):
+        contents = util.load_file(filename, quiet=True)
+        for line in contents.splitlines():
+            c_pos = line.find("#")
+            # Handle inline comments
+            if c_pos != -1:
+                line = line[0:c_pos]
+            line_c = line.strip()
+            if line_c:
+                return line_c
+        return default
+
+    def _get_localhost_ip(self):
+        # Note: http://www.leonardoborda.com/blog/127-0-1-1-ubuntu-debian/
+        return "127.0.1.1"
+
+    def set_timezone(self, tz):
+        tz_file = os.path.join("/usr/share/zoneinfo", tz)
+        if not os.path.isfile(tz_file):
+            raise RuntimeError(("Invalid timezone %s,"
+                                " no file found at %s") % (tz, tz_file))
+        tz_lines = [
+            "# Created by cloud-init",
+            str(tz),
+        ]
+        tz_contents = "\n".join(tz_lines)
+        tz_fn = self._paths.join(False, "/etc/timezone")
+        util.write_file(tz_fn, tz_contents)
+        util.copy(tz_file, self._paths.join(False, "/etc/localtime"))
+
+    def package_command(self, command, args=None):
+        e = os.environ.copy()
+        # See: http://tiny.cc/kg91fw
+        # Or: http://tiny.cc/mh91fw
+        e['DEBIAN_FRONTEND'] = 'noninteractive'
+        cmd = ['apt-get', '--option', 'Dpkg::Options::=--force-confold',
+               '--assume-yes', command]
+        if args:
+            cmd.extend(args)
+        # Allow the output of this to flow outwards (ie not be captured)
+        util.subp(cmd, env=e, capture=False)
+
+    def _update_package_sources(self):
+        self._runner.run("update-sources", self.package_command,
+                         ["update"], freq=PER_INSTANCE)
diff --git a/cloudinit/distros/fedora.py b/cloudinit/distros/fedora.py
new file mode 100644
index 00000000..c777845d
--- /dev/null
+++ b/cloudinit/distros/fedora.py
@@ -0,0 +1,31 @@
+# vi: ts=4 expandtab
+#
+#    Copyright (C) 2012 Canonical Ltd.
+#    Copyright (C) 2012 Hewlett-Packard Development Company, L.P.
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Scott Moser <scott.moser@canonical.com>
+#    Author: Juerg Haefliger <juerg.haefliger@hp.com>
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+from cloudinit.distros import rhel
+
+from cloudinit import log as logging
+
+LOG = logging.getLogger(__name__)
+
+
+class Distro(rhel.Distro):
+    pass
diff --git a/cloudinit/distros/ubuntu.py b/cloudinit/distros/ubuntu.py
index b23945d8..77c2aff4 100644
--- a/cloudinit/distros/ubuntu.py
+++ b/cloudinit/distros/ubuntu.py
@@ -20,130 +20,12 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import os
+from cloudinit.distros import debian
 
-from cloudinit import distros
-from cloudinit import helpers
 from cloudinit import log as logging
-from cloudinit import util
-
-from cloudinit.settings import PER_INSTANCE
 
 LOG = logging.getLogger(__name__)
 
 
-class Distro(distros.Distro):
-
-    def __init__(self, name, cfg, paths):
-        distros.Distro.__init__(self, name, cfg, paths)
-        # This will be used to restrict certain
-        # calls from repeatly happening (when they
-        # should only happen say once per instance...)
-        self._runner = helpers.Runners(paths)
-
-    def apply_locale(self, locale, out_fn=None):
-        if not out_fn:
-            out_fn = self._paths.join(False, '/etc/default/locale')
-        util.subp(['locale-gen', locale], capture=False)
-        util.subp(['update-locale', locale], capture=False)
-        contents = [
-            "# Created by cloud-init",
-            'LANG="%s"' % (locale),
-        ]
-        util.write_file(out_fn, "\n".join(contents))
-
-    def install_packages(self, pkglist):
-        self._update_package_sources()
-        self.package_command('install', pkglist)
-
-    def _write_network(self, settings):
-        net_fn = self._paths.join(False, "/etc/network/interfaces")
-        util.write_file(net_fn, settings)
-
-    def set_hostname(self, hostname):
-        out_fn = self._paths.join(False, "/etc/hostname")
-        self._write_hostname(hostname, out_fn)
-        if out_fn == '/etc/hostname':
-            # Only do this if we are running in non-adjusted root mode
-            LOG.debug("Setting hostname to %s", hostname)
-            util.subp(['hostname', hostname])
-
-    def _write_hostname(self, hostname, out_fn):
-        lines = []
-        lines.append("# Created by cloud-init")
-        lines.append(str(hostname))
-        contents = "\n".join(lines)
-        util.write_file(out_fn, contents, 0644)
-
-    def update_hostname(self, hostname, prev_fn):
-        hostname_prev = self._read_hostname(prev_fn)
-        read_fn = self._paths.join(True, "/etc/hostname")
-        hostname_in_etc = self._read_hostname(read_fn)
-        update_files = []
-        if not hostname_prev or hostname_prev != hostname:
-            update_files.append(prev_fn)
-        if (not hostname_in_etc or
-            (hostname_in_etc == hostname_prev and
-             hostname_in_etc != hostname)):
-            write_fn = self._paths.join(False, "/etc/hostname")
-            update_files.append(write_fn)
-        for fn in update_files:
-            try:
-                self._write_hostname(hostname, fn)
-            except:
-                util.logexc(LOG, "Failed to write hostname %s to %s",
-                            hostname, fn)
-        if (hostname_in_etc and hostname_prev and
-            hostname_in_etc != hostname_prev):
-            LOG.debug(("%s differs from /etc/hostname."
-                        " Assuming user maintained hostname."), prev_fn)
-        if "/etc/hostname" in update_files:
-            # Only do this if we are running in non-adjusted root mode
-            LOG.debug("Setting hostname to %s", hostname)
-            util.subp(['hostname', hostname])
-
-    def _read_hostname(self, filename, default=None):
-        contents = util.load_file(filename, quiet=True)
-        for line in contents.splitlines():
-            c_pos = line.find("#")
-            # Handle inline comments
-            if c_pos != -1:
-                line = line[0:c_pos]
-            line_c = line.strip()
-            if line_c:
-                return line_c
-        return default
-
-    def _get_localhost_ip(self):
-        # Note: http://www.leonardoborda.com/blog/127-0-1-1-ubuntu-debian/
-        return "127.0.1.1"
-
-    def set_timezone(self, tz):
-        tz_file = os.path.join("/usr/share/zoneinfo", tz)
-        if not os.path.isfile(tz_file):
-            raise RuntimeError(("Invalid timezone %s,"
-                                " no file found at %s") % (tz, tz_file))
-        tz_lines = [
-            "# Created by cloud-init",
-            str(tz),
-        ]
-        tz_contents = "\n".join(tz_lines)
-        tz_fn = self._paths.join(False, "/etc/timezone")
-        util.write_file(tz_fn, tz_contents)
-        util.copy(tz_file, self._paths.join(False, "/etc/localtime"))
-
-    def package_command(self, command, args=None):
-        e = os.environ.copy()
-        # See: http://tiny.cc/kg91fw
-        # Or: http://tiny.cc/mh91fw
-        e['DEBIAN_FRONTEND'] = 'noninteractive'
-        cmd = ['apt-get', '--option', 'Dpkg::Options::=--force-confold',
-               '--assume-yes', command]
-        if args:
-            cmd.extend(args)
-        # Allow the output of this to flow outwards (ie not be captured)
-        util.subp(cmd, env=e, capture=False)
-
-    def _update_package_sources(self):
-        self._runner.run("update-sources", self.package_command,
-                         ["update"], freq=PER_INSTANCE)
+class Distro(debian.Distro):
+    pass

From 63c9a729d4f548d7ba6581fb10fa4a95389d22e2 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 12:55:45 -0700
Subject: [PATCH 308/434] Add in debian, which should also work

---
 cloudinit/config/cc_ca_certs.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/config/cc_ca_certs.py b/cloudinit/config/cc_ca_certs.py
index 266a2d84..b4f9482a 100644
--- a/cloudinit/config/cc_ca_certs.py
+++ b/cloudinit/config/cc_ca_certs.py
@@ -23,7 +23,7 @@ CA_CERT_FILENAME = "cloud-init-ca-certs.crt"
 CA_CERT_CONFIG = "/etc/ca-certificates.conf"
 CA_CERT_SYSTEM_PATH = "/etc/ssl/certs/"
 
-distros = ['ubuntu']
+distros = ['ubuntu', 'debian']
 
 
 def update_ca_certs():

From 36ce760627cf944a8241b0dfbd130e9d6a814580 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 13:13:30 -0700
Subject: [PATCH 309/434] Remove comment about old-configs

---
 Requires | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/Requires b/Requires
index bd2db00c..bbe7baec 100644
--- a/Requires
+++ b/Requires
@@ -17,8 +17,7 @@ oauth>=1.0
 # those same fetchs and decodes and signing (...) that ec2 requires.
 boto>=2.4
 
-# This is only needed if you have old style configurations
-# and any places where we need to support configs in a manner
+# This is only needed for places where we need to support configs in a manner
 # that the built-in config parser is not sufficent (ie
 # when we need to preserve comments, or do not have a top-level
 # section)...

From a7ca4287a7fed9b7d3af71b512059bb50cbc953c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 18:07:05 -0700
Subject: [PATCH 310/434] Fix the cfgobj to make sure it handles the quoting
 of the keys and values in sysconfig specially, by ensuring that it does
 the quoting, so that the files written out can be sourced into bash
 scripts, which is typically what these files are used for.

---
 cloudinit/distros/rhel.py | 61 ++++++++++++++++++++++++++++++++++++---
 1 file changed, 57 insertions(+), 4 deletions(-)

diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index 4ed9d43f..2c5bcab9 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -36,9 +36,24 @@ NETWORK_FN_TPL = '/etc/sysconfig/network-scripts/ifcfg-%s'
 
 # This library is used to parse/write
 # out the various sysconfig files edited
+#
+# It has to be slightly modified though
+# to ensure that all values are quoted
+# since these configs are usually sourced into
+# bash scripts...
 from configobj import ConfigObj
 
 
+# See: http://tiny.cc/oezbgw
+D_QUOTE_CHARS = {
+    "\"": "\\\"",
+    "(": "\\(",
+    ")": "\\)",
+    "$": '\$',
+    '`': '\`',
+}
+
+
 class Distro(distros.Distro):
 
     def __init__(self, name, cfg, paths):
@@ -144,14 +159,14 @@ class Distro(distros.Distro):
         else:
             return default
 
-    def _read_conf(self, filename):
+    def _read_conf(self, fn):
         exists = False
-        if os.path.isfile(filename):
-            contents = util.load_file(filename).splitlines()
+        if os.path.isfile(fn):
+            contents = util.load_file(fn).splitlines()
             exists = True
         else:
             contents = []
-        return (exists, ConfigObj(contents))
+        return (exists, QuotingConfigObj(contents))
 
     def set_timezone(self, tz):
         tz_file = os.path.join("/usr/share/zoneinfo", tz)
@@ -186,6 +201,44 @@ class Distro(distros.Distro):
         util.subp(cmd, capture=False)
 
 
+# This class helps adjust the configobj
+# writing to ensure that when writing a k/v
+# on a line, that they are properly quoted
+# and have no spaces between the '=' sign.
+# - This is mainly due to the fact that
+# the sysconfig scripts are often sourced
+# directly into bash/shell scripts so ensure
+# that it works for those types of use cases.
+class QuotingConfigObj(ConfigObj):
+    def __init__(self, lines):
+        ConfigObj.__init__(self, lines,
+                           interpolation=False,
+                           write_empty_values=True)
+
+    def _quote_posix(self, text):
+        if not text:
+            return '""'
+        for (k, v) in D_QUOTE_CHARS.iteritems():
+            text = text.replace(k, v)
+        return '"%s"' % (text)
+
+    def _write_line(self, indent_string, entry, this_entry, comment):
+        # Ensure it is formatted fine for
+        # how these sysconfig scripts are used
+        val = self._decode_element(self._quote(this_entry))
+        if not val.startswith("'"):
+            # Not already quoted, double quote
+            # it for safety
+            val = self._quote_posix(val)
+        key = self._decode_element(self._quote(entry, multiline=False))
+        cmnt = self._decode_element(comment)
+        return '%s%s%s%s%s' % (indent_string,
+                               key,
+                               "=",
+                               val,
+                               cmnt)
+
+
 # This is a util function to translate a ubuntu /etc/network/interfaces 'blob'
 # to a rhel equiv. that can then be written to /etc/sysconfig/network-scripts/
 # TODO remove when we have python-netcf active...

From 8fe97d05b70e40b04a6eca71f797d81872d2db50 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 18:17:29 -0700
Subject: [PATCH 311/434] 1. Adjust for the cases of 'yes', 'no', 'true',
 'false' by leaving those unquoted. 2. Add more comments as to why we are
 leaving single quoted strings alone.

---
 cloudinit/distros/rhel.py | 16 +++++++++++-----
 1 file changed, 11 insertions(+), 5 deletions(-)

diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index 2c5bcab9..87d5b7a8 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -43,7 +43,6 @@ NETWORK_FN_TPL = '/etc/sysconfig/network-scripts/ifcfg-%s'
 # bash scripts...
 from configobj import ConfigObj
 
-
 # See: http://tiny.cc/oezbgw
 D_QUOTE_CHARS = {
     "\"": "\\\"",
@@ -217,19 +216,26 @@ class QuotingConfigObj(ConfigObj):
 
     def _quote_posix(self, text):
         if not text:
-            return '""'
+            return ''
         for (k, v) in D_QUOTE_CHARS.iteritems():
             text = text.replace(k, v)
         return '"%s"' % (text)
 
+    def _quote_special(self, text):
+        if text.lower() in ['yes', 'no', 'true', 'false']:
+            return text
+        else:
+            return self._quote_posix(text)
+
     def _write_line(self, indent_string, entry, this_entry, comment):
         # Ensure it is formatted fine for
         # how these sysconfig scripts are used
         val = self._decode_element(self._quote(this_entry))
+        # Single quoted strings should
+        # always work.
         if not val.startswith("'"):
-            # Not already quoted, double quote
-            # it for safety
-            val = self._quote_posix(val)
+            # Perform any special quoting
+            val = self._quote_special(val)
         key = self._decode_element(self._quote(entry, multiline=False))
         cmnt = self._decode_element(comment)
         return '%s%s%s%s%s' % (indent_string,

From f309098535b461bc03055feef981f90982b731d3 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 18:41:27 -0700
Subject: [PATCH 312/434] Add initial init.d script.

---
 initd/cloud-init.sh | 126 ++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 126 insertions(+)
 create mode 100755 initd/cloud-init.sh

diff --git a/initd/cloud-init.sh b/initd/cloud-init.sh
new file mode 100755
index 00000000..dd93d50f
--- /dev/null
+++ b/initd/cloud-init.sh
@@ -0,0 +1,126 @@
+#!/bin/sh
+
+#
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+#
+
+# See: http://wiki.debian.org/LSBInitScripts
+# See: http://tiny.cc/czvbgw
+# See: http://www.novell.com/coolsolutions/feature/15380.html
+# Also based on dhcpd in RHEL (for comparison)
+
+### BEGIN INIT INFO
+# Provides:          cloud-init
+# Required-Start:    $local_fs $network $named $remote_fs
+# Should-Start:      $time
+# Required-Stop:
+# Should-Stop:
+# Default-Start:     3 5
+# Default-Stop:
+# Short-Description: The initial cloud-init job (net and fs contingent)
+# Description:       Start cloud-init and runs the initialization phases
+#	and any associated initial modules as desired. Network
+#	and filesystem are required to have this script activate
+#	correctly.
+### END INIT INFO
+
+. /etc/init.d/functions
+
+# Return values acc. to LSB for all commands but status:
+# 0	  - success
+# 1       - generic or unspecified error
+# 2       - invalid or excess argument(s)
+# 3       - unimplemented feature (e.g. "reload")
+# 4       - user had insufficient privileges
+# 5       - program is not installed
+# 6       - program is not configured
+# 7       - program is not running
+# 8--199  - reserved (8--99 LSB, 100--149 distrib, 150--199 appl)
+# 
+# Note that starting an already running service, stopping
+# or restarting a not-running service as well as the restart
+# with force-reload (in case signaling is not supported) are
+# considered a success.
+
+RETVAL=0
+
+prog="cloud-init"
+cloud_init="/usr/bin/cloud-init"
+conf="/etc/cloud/cloud.cfg"
+
+# If there exists a sysconfig variable override file use it...
+[ -f /etc/sysconfig/cloud-init ] && . /etc/sysconfig/cloud-init
+
+start() {
+    [ -x $cloud_init ] || return 5
+    [ -f $conf ] || return 6
+
+    echo -n $"Starting $prog: "
+    $prog $CLOUD_INIT_ARGS init
+    RETVAL=$?
+    return $RETVAL
+}
+
+stop() {
+    echo -n $"Shutting down $prog: "
+    # No-op
+    RETVAL=7
+    return $RETVAL
+}
+
+. /etc/init.d/functions
+
+case "$1" in
+    start)
+        start
+        RETVAL=$?
+	;;
+    stop)
+        stop
+        RETVAL=$?
+	;;
+    restart|try-restart|condrestart)
+        ## Stop the service and regardless of whether it was
+        ## running or not, start it again.
+        # 
+        ## Note: try-restart is now part of LSB (as of 1.9).
+        ## RH has a similar command named condrestart.
+        stop ; start
+        RETVAL=$?
+	;;
+    reload|force-reload)
+        # It does not support reload
+        RETVAL=3
+	;;
+    status)
+        echo -n $"Checking for service $prog:"
+        # Return value is slightly different for the status command:
+        # 0 - service up and running
+        # 1 - service dead, but /var/run/  pid  file exists
+        # 2 - service dead, but /var/lock/ lock file exists
+        # 3 - service not running (unused)
+        # 4 - service status unknown :-(
+        # 5--199 reserved (5--99 LSB, 100--149 distro, 150--199 appl.)
+        RETVAL=3
+	;;
+    *)
+        echo "Usage: $0 {start|stop|status|try-restart|condrestart|restart|force-reload|reload}"
+        RETVAL=3
+	;;
+esac
+
+exit $RETVAL

From 0508c66f4ebdfa4b53ca44bb6abdfda7496d504d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 18:44:16 -0700
Subject: [PATCH 313/434] Use the full path + rename to CLOUDINITARGS

---
 initd/cloud-init.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/initd/cloud-init.sh b/initd/cloud-init.sh
index dd93d50f..5faa77f8 100755
--- a/initd/cloud-init.sh
+++ b/initd/cloud-init.sh
@@ -70,7 +70,7 @@ start() {
     [ -f $conf ] || return 6
 
     echo -n $"Starting $prog: "
-    $prog $CLOUD_INIT_ARGS init
+    $cloud_init $CLOUDINITARGS init
     RETVAL=$?
     return $RETVAL
 }

From 8b5a7958cf14e5b87aef34040b2f372c04b7c72d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 18:49:46 -0700
Subject: [PATCH 314/434] Restarting is just the same as starting, so don't
 return the exit code of the stop function

---
 initd/cloud-init.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/initd/cloud-init.sh b/initd/cloud-init.sh
index 5faa77f8..72b3bd47 100755
--- a/initd/cloud-init.sh
+++ b/initd/cloud-init.sh
@@ -99,7 +99,7 @@ case "$1" in
         # 
         ## Note: try-restart is now part of LSB (as of 1.9).
         ## RH has a similar command named condrestart.
-        stop ; start
+        start
         RETVAL=$?
 	;;
     reload|force-reload)

From 8703d31b173aa2758799c8442a8bb6cbdb3e36fb Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 18:51:10 -0700
Subject: [PATCH 315/434] Add a local only version

---
 initd/cloud-init-local.sh | 126 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 126 insertions(+)
 create mode 100755 initd/cloud-init-local.sh

diff --git a/initd/cloud-init-local.sh b/initd/cloud-init-local.sh
new file mode 100755
index 00000000..a3256d47
--- /dev/null
+++ b/initd/cloud-init-local.sh
@@ -0,0 +1,126 @@
+#!/bin/sh
+
+#
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+#
+
+# See: http://wiki.debian.org/LSBInitScripts
+# See: http://tiny.cc/czvbgw
+# See: http://www.novell.com/coolsolutions/feature/15380.html
+# Also based on dhcpd in RHEL (for comparison)
+
+### BEGIN INIT INFO
+# Provides:          cloud-init
+# Required-Start:    $local_fs $remote_fs
+# Should-Start:      $time
+# Required-Stop:
+# Should-Stop:
+# Default-Start:     3 5
+# Default-Stop:
+# Short-Description: The initial cloud-init job (local fs contingent)
+# Description:       Start cloud-init and runs the initialization phases
+#	and any associated initial modules as desired.
+#	A filesystem is required to have this script activate
+#	correctly.
+### END INIT INFO
+
+. /etc/init.d/functions
+
+# Return values acc. to LSB for all commands but status:
+# 0	  - success
+# 1       - generic or unspecified error
+# 2       - invalid or excess argument(s)
+# 3       - unimplemented feature (e.g. "reload")
+# 4       - user had insufficient privileges
+# 5       - program is not installed
+# 6       - program is not configured
+# 7       - program is not running
+# 8--199  - reserved (8--99 LSB, 100--149 distrib, 150--199 appl)
+# 
+# Note that starting an already running service, stopping
+# or restarting a not-running service as well as the restart
+# with force-reload (in case signaling is not supported) are
+# considered a success.
+
+RETVAL=0
+
+prog="cloud-init"
+cloud_init="/usr/bin/cloud-init"
+conf="/etc/cloud/cloud.cfg"
+
+# If there exists a sysconfig variable override file use it...
+[ -f /etc/sysconfig/cloud-init ] && . /etc/sysconfig/cloud-init
+
+start() {
+    [ -x $cloud_init ] || return 5
+    [ -f $conf ] || return 6
+
+    echo -n $"Starting $prog: "
+    $cloud_init $CLOUDINITARGS init --local
+    RETVAL=$?
+    return $RETVAL
+}
+
+stop() {
+    echo -n $"Shutting down $prog: "
+    # No-op
+    RETVAL=7
+    return $RETVAL
+}
+
+. /etc/init.d/functions
+
+case "$1" in
+    start)
+        start
+        RETVAL=$?
+	;;
+    stop)
+        stop
+        RETVAL=$?
+	;;
+    restart|try-restart|condrestart)
+        ## Stop the service and regardless of whether it was
+        ## running or not, start it again.
+        # 
+        ## Note: try-restart is now part of LSB (as of 1.9).
+        ## RH has a similar command named condrestart.
+        start
+        RETVAL=$?
+	;;
+    reload|force-reload)
+        # It does not support reload
+        RETVAL=3
+	;;
+    status)
+        echo -n $"Checking for service $prog:"
+        # Return value is slightly different for the status command:
+        # 0 - service up and running
+        # 1 - service dead, but /var/run/  pid  file exists
+        # 2 - service dead, but /var/lock/ lock file exists
+        # 3 - service not running (unused)
+        # 4 - service status unknown :-(
+        # 5--199 reserved (5--99 LSB, 100--149 distro, 150--199 appl.)
+        RETVAL=3
+	;;
+    *)
+        echo "Usage: $0 {start|stop|status|try-restart|condrestart|restart|force-reload|reload}"
+        RETVAL=3
+	;;
+esac
+
+exit $RETVAL

From 51ba081ded89b63c1787a0edf5fad5dbd19ca3b7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 19:08:05 -0700
Subject: [PATCH 316/434] 1. Add init.d/config and final scripts. 2. Adjust the
 comments of the cloud-init* scripts to match the long description of the
 config and final ones.

---
 initd/cloud-config.sh     | 124 ++++++++++++++++++++++++++++++++++++++
 initd/cloud-final.sh      | 124 ++++++++++++++++++++++++++++++++++++++
 initd/cloud-init-local.sh |   2 -
 initd/cloud-init.sh       |   6 +-
 4 files changed, 250 insertions(+), 6 deletions(-)
 create mode 100755 initd/cloud-config.sh
 create mode 100755 initd/cloud-final.sh

diff --git a/initd/cloud-config.sh b/initd/cloud-config.sh
new file mode 100755
index 00000000..dd0bca8b
--- /dev/null
+++ b/initd/cloud-config.sh
@@ -0,0 +1,124 @@
+#!/bin/sh
+
+#
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+#
+
+# See: http://wiki.debian.org/LSBInitScripts
+# See: http://tiny.cc/czvbgw
+# See: http://www.novell.com/coolsolutions/feature/15380.html
+# Also based on dhcpd in RHEL (for comparison)
+
+### BEGIN INIT INFO
+# Provides:          cloud-config
+# Required-Start:    cloud-init
+# Should-Start:      $time
+# Required-Stop:
+# Should-Stop:
+# Default-Start:     3 5
+# Default-Stop:
+# Short-Description: The config cloud-init job
+# Description:       Start cloud-init and runs the config phase
+#	and any associated config modules as desired.
+### END INIT INFO
+
+. /etc/init.d/functions
+
+# Return values acc. to LSB for all commands but status:
+# 0	  - success
+# 1       - generic or unspecified error
+# 2       - invalid or excess argument(s)
+# 3       - unimplemented feature (e.g. "reload")
+# 4       - user had insufficient privileges
+# 5       - program is not installed
+# 6       - program is not configured
+# 7       - program is not running
+# 8--199  - reserved (8--99 LSB, 100--149 distrib, 150--199 appl)
+# 
+# Note that starting an already running service, stopping
+# or restarting a not-running service as well as the restart
+# with force-reload (in case signaling is not supported) are
+# considered a success.
+
+RETVAL=0
+
+prog="cloud-init"
+cloud_init="/usr/bin/cloud-init"
+conf="/etc/cloud/cloud.cfg"
+
+# If there exists a sysconfig variable override file use it...
+[ -f /etc/sysconfig/cloud-init ] && . /etc/sysconfig/cloud-init
+
+start() {
+    [ -x $cloud_init ] || return 5
+    [ -f $conf ] || return 6
+
+    echo -n $"Starting $prog: "
+    $cloud_init $CLOUDINITARGS modules --mode config
+    RETVAL=$?
+    return $RETVAL
+}
+
+stop() {
+    echo -n $"Shutting down $prog: "
+    # No-op
+    RETVAL=7
+    return $RETVAL
+}
+
+. /etc/init.d/functions
+
+case "$1" in
+    start)
+        start
+        RETVAL=$?
+	;;
+    stop)
+        stop
+        RETVAL=$?
+	;;
+    restart|try-restart|condrestart)
+        ## Stop the service and regardless of whether it was
+        ## running or not, start it again.
+        # 
+        ## Note: try-restart is now part of LSB (as of 1.9).
+        ## RH has a similar command named condrestart.
+        start
+        RETVAL=$?
+	;;
+    reload|force-reload)
+        # It does not support reload
+        RETVAL=3
+	;;
+    status)
+        echo -n $"Checking for service $prog:"
+        # Return value is slightly different for the status command:
+        # 0 - service up and running
+        # 1 - service dead, but /var/run/  pid  file exists
+        # 2 - service dead, but /var/lock/ lock file exists
+        # 3 - service not running (unused)
+        # 4 - service status unknown :-(
+        # 5--199 reserved (5--99 LSB, 100--149 distro, 150--199 appl.)
+        RETVAL=3
+	;;
+    *)
+        echo "Usage: $0 {start|stop|status|try-restart|condrestart|restart|force-reload|reload}"
+        RETVAL=3
+	;;
+esac
+
+exit $RETVAL
diff --git a/initd/cloud-final.sh b/initd/cloud-final.sh
new file mode 100755
index 00000000..2e462c17
--- /dev/null
+++ b/initd/cloud-final.sh
@@ -0,0 +1,124 @@
+#!/bin/sh
+
+#
+#    Copyright (C) 2012 Yahoo! Inc.
+#
+#    Author: Joshua Harlow <harlowja@yahoo-inc.com>
+#
+#    This program is free software: you can redistribute it and/or modify
+#    it under the terms of the GNU General Public License version 3, as
+#    published by the Free Software Foundation.
+#
+#    This program is distributed in the hope that it will be useful,
+#    but WITHOUT ANY WARRANTY; without even the implied warranty of
+#    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#    GNU General Public License for more details.
+#
+#    You should have received a copy of the GNU General Public License
+#    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+#
+
+# See: http://wiki.debian.org/LSBInitScripts
+# See: http://tiny.cc/czvbgw
+# See: http://www.novell.com/coolsolutions/feature/15380.html
+# Also based on dhcpd in RHEL (for comparison)
+
+### BEGIN INIT INFO
+# Provides:          cloud-final
+# Required-Start:    $all cloud-init cloud-config
+# Should-Start:      $time
+# Required-Stop:
+# Should-Stop:
+# Default-Start:     3 5
+# Default-Stop:
+# Short-Description: The final cloud-init job
+# Description:       Start cloud-init and runs the final phase
+#	and any associated final modules as desired.
+### END INIT INFO
+
+. /etc/init.d/functions
+
+# Return values acc. to LSB for all commands but status:
+# 0	  - success
+# 1       - generic or unspecified error
+# 2       - invalid or excess argument(s)
+# 3       - unimplemented feature (e.g. "reload")
+# 4       - user had insufficient privileges
+# 5       - program is not installed
+# 6       - program is not configured
+# 7       - program is not running
+# 8--199  - reserved (8--99 LSB, 100--149 distrib, 150--199 appl)
+# 
+# Note that starting an already running service, stopping
+# or restarting a not-running service as well as the restart
+# with force-reload (in case signaling is not supported) are
+# considered a success.
+
+RETVAL=0
+
+prog="cloud-init"
+cloud_init="/usr/bin/cloud-init"
+conf="/etc/cloud/cloud.cfg"
+
+# If there exists a sysconfig variable override file use it...
+[ -f /etc/sysconfig/cloud-init ] && . /etc/sysconfig/cloud-init
+
+start() {
+    [ -x $cloud_init ] || return 5
+    [ -f $conf ] || return 6
+
+    echo -n $"Starting $prog: "
+    $cloud_init $CLOUDINITARGS modules --mode final
+    RETVAL=$?
+    return $RETVAL
+}
+
+stop() {
+    echo -n $"Shutting down $prog: "
+    # No-op
+    RETVAL=7
+    return $RETVAL
+}
+
+. /etc/init.d/functions
+
+case "$1" in
+    start)
+        start
+        RETVAL=$?
+	;;
+    stop)
+        stop
+        RETVAL=$?
+	;;
+    restart|try-restart|condrestart)
+        ## Stop the service and regardless of whether it was
+        ## running or not, start it again.
+        # 
+        ## Note: try-restart is now part of LSB (as of 1.9).
+        ## RH has a similar command named condrestart.
+        start
+        RETVAL=$?
+	;;
+    reload|force-reload)
+        # It does not support reload
+        RETVAL=3
+	;;
+    status)
+        echo -n $"Checking for service $prog:"
+        # Return value is slightly different for the status command:
+        # 0 - service up and running
+        # 1 - service dead, but /var/run/  pid  file exists
+        # 2 - service dead, but /var/lock/ lock file exists
+        # 3 - service not running (unused)
+        # 4 - service status unknown :-(
+        # 5--199 reserved (5--99 LSB, 100--149 distro, 150--199 appl.)
+        RETVAL=3
+	;;
+    *)
+        echo "Usage: $0 {start|stop|status|try-restart|condrestart|restart|force-reload|reload}"
+        RETVAL=3
+	;;
+esac
+
+exit $RETVAL
diff --git a/initd/cloud-init-local.sh b/initd/cloud-init-local.sh
index a3256d47..bf5d409a 100755
--- a/initd/cloud-init-local.sh
+++ b/initd/cloud-init-local.sh
@@ -34,8 +34,6 @@
 # Short-Description: The initial cloud-init job (local fs contingent)
 # Description:       Start cloud-init and runs the initialization phases
 #	and any associated initial modules as desired.
-#	A filesystem is required to have this script activate
-#	correctly.
 ### END INIT INFO
 
 . /etc/init.d/functions
diff --git a/initd/cloud-init.sh b/initd/cloud-init.sh
index 72b3bd47..7726c452 100755
--- a/initd/cloud-init.sh
+++ b/initd/cloud-init.sh
@@ -32,10 +32,8 @@
 # Default-Start:     3 5
 # Default-Stop:
 # Short-Description: The initial cloud-init job (net and fs contingent)
-# Description:       Start cloud-init and runs the initialization phases
-#	and any associated initial modules as desired. Network
-#	and filesystem are required to have this script activate
-#	correctly.
+# Description:       Start cloud-init and runs the initialization phase
+#	and any associated initial modules as desired.
 ### END INIT INFO
 
 . /etc/init.d/functions

From 996b9f7a2183e049fa6859bb59accf7485acc0c8 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 20:30:08 -0700
Subject: [PATCH 317/434] Disable capturing of these subp calls

---
 cloudinit/config/cc_chef.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/cloudinit/config/cc_chef.py b/cloudinit/config/cc_chef.py
index d8bd85f8..d682398a 100644
--- a/cloudinit/config/cc_chef.py
+++ b/cloudinit/config/cc_chef.py
@@ -96,7 +96,8 @@ def handle(name, cfg, cloud, log, _args):
             install_chef_from_gems(cloud.distro, ruby_version, chef_version)
             # and finally, run chef-client
             log.debug('Running chef-client')
-            util.subp(['/usr/bin/chef-client', '-d', '-i', '1800', '-s', '20'])
+            util.subp(['/usr/bin/chef-client', 
+                       '-d', '-i', '1800', '-s', '20'], capture=False)
         elif install_type == 'packages':
             # this will install and run the chef-client from packages
             cloud.distro.install_packages(('chef',))
@@ -121,8 +122,8 @@ def install_chef_from_gems(ruby_version, chef_version, distro):
     if chef_version:
         util.subp(['/usr/bin/gem', 'install', 'chef',
                   '-v %s' % chef_version, '--no-ri',
-                  '--no-rdoc', '--bindir', '/usr/bin', '-q'])
+                  '--no-rdoc', '--bindir', '/usr/bin', '-q'], capture=False)
     else:
         util.subp(['/usr/bin/gem', 'install', 'chef',
                   '--no-ri', '--no-rdoc', '--bindir',
-                  '/usr/bin', '-q'])
+                  '/usr/bin', '-q'], capture=False)

From 860b571b6e04599a1e0d2eaa0b7de057a722d186 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 20:39:21 -0700
Subject: [PATCH 318/434] Add a constant for the content type; allow the part
 filename to be overridden easily

---
 cloudinit/user_data.py | 27 +++++++++++++++++----------
 1 file changed, 17 insertions(+), 10 deletions(-)

diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index 4babb8e5..91841bb8 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -39,6 +39,9 @@ NOT_MULTIPART_TYPE = handlers.NOT_MULTIPART_TYPE
 PART_FN_TPL = handlers.PART_FN_TPL
 OCTET_TYPE = handlers.OCTET_TYPE
 
+# Saves typing errors
+CONTENT_TYPE = 'Content-Type'
+
 # Various special content types that cause special actions
 TYPE_NEEDED = ["text/plain", "text/x-not-multipart"]
 INCLUDE_TYPES = ['text/x-include-url', 'text/x-include-once-url']
@@ -87,10 +90,10 @@ class UserDataProcessor(object):
                 self._explode_archive(payload, append_msg)
                 continue
 
-            if 'Content-Type' in base_msg:
-                base_msg.replace_header('Content-Type', ctype)
+            if CONTENT_TYPE in base_msg:
+                base_msg.replace_header(CONTENT_TYPE, ctype)
             else:
-                base_msg['Content-Type'] = ctype
+                base_msg[CONTENT_TYPE] = ctype
 
             self._attach_part(append_msg, part)
 
@@ -173,8 +176,8 @@ class UserDataProcessor(object):
                 msg.set_payload(content)
 
             if 'filename' in ent:
-                msg.add_header('Content-Disposition', 'attachment',
-                                filename=ent['filename'])
+                msg.add_header('Content-Disposition',
+                               'attachment', filename=ent['filename'])
 
             for header in list(ent.keys()):
                 if header in ('content', 'filename', 'type'):
@@ -201,17 +204,21 @@ class UserDataProcessor(object):
             outer_msg.replace_header(ATTACHMENT_FIELD, str(fetched_count))
         return fetched_count
 
+    def _part_filename(self, unnamed_part, count):
+        return PART_FN_TPL % (count + 1)
+
     def _attach_part(self, outer_msg, part):
         """
         Attach an part to an outer message. outermsg must be a MIMEMultipart.
         Modifies a header in the message to keep track of number of attachments.
         """
-        cur = self._multi_part_count(outer_msg)
+        cur_c = self._multi_part_count(outer_msg)
         if not part.get_filename():
-            fn = PART_FN_TPL % (cur + 1)
-            part.add_header('Content-Disposition', 'attachment', filename=fn)
+            fn = self._part_filename(part, cur_c)
+            part.add_header('Content-Disposition',
+                            'attachment', filename=fn)
         outer_msg.attach(part)
-        self._multi_part_count(outer_msg, cur + 1)
+        self._multi_part_count(outer_msg, cur_c + 1)
 
 
 # Coverts a raw string into a mime message
@@ -229,7 +236,7 @@ def convert_string(raw_data, headers=None):
             else:
                 msg[key] = val
     else:
-        mtype = headers.get("Content-Type", NOT_MULTIPART_TYPE)
+        mtype = headers.get(CONTENT_TYPE, NOT_MULTIPART_TYPE)
         maintype, subtype = mtype.split("/", 1)
         msg = MIMEBase(maintype, subtype, *headers)
         msg.set_payload(data)

From e0167044c7ba9122c382853390284d22d6a52b60 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 20:49:30 -0700
Subject: [PATCH 319/434] Fix ma english

---
 cloudinit/config/__init__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/config/__init__.py b/cloudinit/config/__init__.py
index ab13045f..69a8cc68 100644
--- a/cloudinit/config/__init__.py
+++ b/cloudinit/config/__init__.py
@@ -26,7 +26,7 @@ from cloudinit import log as logging
 LOG = logging.getLogger(__name__)
 
 # This prefix is used to make it less
-# of a change that when importing
+# of a chance that when importing
 # we will not find something else with the same
 # name in the lookup path...
 MOD_PREFIX = "cc_"

From fa6ce05b956485cde05789d4be70304ff2ebb388 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 20:53:35 -0700
Subject: [PATCH 320/434] Use a module level constant for the filename

---
 cloudinit/config/cc_apt_update_upgrade.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/config/cc_apt_update_upgrade.py b/cloudinit/config/cc_apt_update_upgrade.py
index f5b4b58f..6719da52 100644
--- a/cloudinit/config/cc_apt_update_upgrade.py
+++ b/cloudinit/config/cc_apt_update_upgrade.py
@@ -27,6 +27,7 @@ from cloudinit import util
 distros = ['ubuntu', 'debian']
 
 PROXY_TPL = "Acquire::HTTP::Proxy \"%s\";\n"
+PROXY_FN = "/etc/apt/apt.conf.d/95cloud-init-proxy"
 
 
 def handle(_name, cfg, cloud, log, _args):
@@ -48,7 +49,7 @@ def handle(_name, cfg, cloud, log, _args):
 
     # Set up any apt proxy
     proxy = cfg.get("apt_proxy", None)
-    proxy_filename = "/etc/apt/apt.conf.d/95cloud-init-proxy"
+    proxy_filename = PROXY_FN
     if proxy:
         try:
             # See man 'apt.conf'

From 15e9b2907d2b584ed52db40d2ca3ad5c80780c61 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 20:58:50 -0700
Subject: [PATCH 321/434] Turn off capturing

---
 cloudinit/config/cc_byobu.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/config/cc_byobu.py b/cloudinit/config/cc_byobu.py
index 38586174..4e2e06bb 100644
--- a/cloudinit/config/cc_byobu.py
+++ b/cloudinit/config/cc_byobu.py
@@ -68,4 +68,4 @@ def handle(name, cfg, _cloud, log, args):
 
     log.debug("Setting byobu to %s", value)
 
-    util.subp(cmd)
+    util.subp(cmd, capture=False)

From 734f4b31cb66e2e05d52d9e665c30f2e994ce535 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 20:59:23 -0700
Subject: [PATCH 322/434] Turn off capturing

---
 cloudinit/config/cc_ca_certs.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/config/cc_ca_certs.py b/cloudinit/config/cc_ca_certs.py
index b4f9482a..dc046bda 100644
--- a/cloudinit/config/cc_ca_certs.py
+++ b/cloudinit/config/cc_ca_certs.py
@@ -30,7 +30,7 @@ def update_ca_certs():
     """
     Updates the CA certificate cache on the current machine.
     """
-    util.subp(["update-ca-certificates"])
+    util.subp(["update-ca-certificates"], capture=False)
 
 
 def add_ca_certs(paths, certs):

From 81b09ba73f9c42b80b8b6e9e9ed3f99609779613 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 21:00:30 -0700
Subject: [PATCH 323/434] Adjust test for turning off capturing

---
 tests/unittests/test_handler/test_handler_ca_certs.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/unittests/test_handler/test_handler_ca_certs.py b/tests/unittests/test_handler/test_handler_ca_certs.py
index 8d85d331..1f96e992 100644
--- a/tests/unittests/test_handler/test_handler_ca_certs.py
+++ b/tests/unittests/test_handler/test_handler_ca_certs.py
@@ -168,7 +168,7 @@ class TestUpdateCaCerts(MockerTestCase):
     def test_commands(self):
         mock_check_call = self.mocker.replace(util.subp,
                                               passthrough=False)
-        mock_check_call(["update-ca-certificates"])
+        mock_check_call(["update-ca-certificates"], capture=False)
         self.mocker.replay()
 
         cc_ca_certs.update_ca_certs()

From 67f4a0af8b26a08db894104cdd8d015e9649b5da Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 21:01:57 -0700
Subject: [PATCH 324/434] Turn off capturing

---
 cloudinit/config/cc_disable_ec2_metadata.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/config/cc_disable_ec2_metadata.py b/cloudinit/config/cc_disable_ec2_metadata.py
index a7c6a75b..8fb15e43 100644
--- a/cloudinit/config/cc_disable_ec2_metadata.py
+++ b/cloudinit/config/cc_disable_ec2_metadata.py
@@ -30,7 +30,7 @@ REJECT_CMD = ['route', 'add', '-host', '169.254.169.254', 'reject']
 def handle(name, cfg, _cloud, log, _args):
     disabled = util.get_cfg_option_bool(cfg, "disable_ec2_metadata", False)
     if disabled:
-        util.subp(REJECT_CMD)
+        util.subp(REJECT_CMD, subp=False)
     else:
         log.debug(("Skipping module named %s,"
                    " disabling the ec2 route not enabled"), name)

From 3ed847593b48ca00f55d885a962df648e72bf806 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 21:02:04 -0700
Subject: [PATCH 325/434] Turn off capturing

---
 cloudinit/config/cc_disable_ec2_metadata.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/config/cc_disable_ec2_metadata.py b/cloudinit/config/cc_disable_ec2_metadata.py
index 8fb15e43..3fd2c20f 100644
--- a/cloudinit/config/cc_disable_ec2_metadata.py
+++ b/cloudinit/config/cc_disable_ec2_metadata.py
@@ -30,7 +30,7 @@ REJECT_CMD = ['route', 'add', '-host', '169.254.169.254', 'reject']
 def handle(name, cfg, _cloud, log, _args):
     disabled = util.get_cfg_option_bool(cfg, "disable_ec2_metadata", False)
     if disabled:
-        util.subp(REJECT_CMD, subp=False)
+        util.subp(REJECT_CMD, capture=False)
     else:
         log.debug(("Skipping module named %s,"
                    " disabling the ec2 route not enabled"), name)

From 8e5a6aded8753edfcf03df9e1c6def78097e57c1 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 22 Jun 2012 22:04:37 -0700
Subject: [PATCH 326/434] 1. Adjust the logging of phone home module when it's
 not enabled 2. Fix pylint warning in userdata about unused variable

---
 cloudinit/config/cc_phone_home.py | 4 +++-
 cloudinit/user_data.py            | 2 +-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/cloudinit/config/cc_phone_home.py b/cloudinit/config/cc_phone_home.py
index d929eb64..ae1349eb 100644
--- a/cloudinit/config/cc_phone_home.py
+++ b/cloudinit/config/cc_phone_home.py
@@ -49,6 +49,8 @@ def handle(name, cfg, cloud, log, args):
         ph_cfg = util.read_conf(args[0])
     else:
         if not 'phone_home' in cfg:
+            log.debug(("Skipping module named %s, "
+                       "no 'phone_home' configuration found"), name)
             return
         ph_cfg = cfg['phone_home']
 
@@ -59,7 +61,7 @@ def handle(name, cfg, cloud, log, args):
 
     url = ph_cfg['url']
     post_list = ph_cfg.get('post', 'all')
-    tries = ph_cfg.get('tries', 10)
+    tries = ph_cfg.get('tries')
     try:
         tries = int(tries)
     except:
diff --git a/cloudinit/user_data.py b/cloudinit/user_data.py
index 91841bb8..0842594d 100644
--- a/cloudinit/user_data.py
+++ b/cloudinit/user_data.py
@@ -204,7 +204,7 @@ class UserDataProcessor(object):
             outer_msg.replace_header(ATTACHMENT_FIELD, str(fetched_count))
         return fetched_count
 
-    def _part_filename(self, unnamed_part, count):
+    def _part_filename(self, _unnamed_part, count):
         return PART_FN_TPL % (count + 1)
 
     def _attach_part(self, outer_msg, part):

From 80837d1e81d36392aea006c7f278f16dab31282a Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 22 Jun 2012 22:12:34 -0700
Subject: [PATCH 327/434] 1. Add comment about conf.d overriding input config
 2. For reading config from conf.d, collect all the configs    then call the
 mergemany function

---
 cloudinit/util.py | 13 ++++++-------
 1 file changed, 6 insertions(+), 7 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 332b8379..4c521bc3 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -641,11 +641,10 @@ def read_conf_d(confd):
     # remove anything not a file
     confs = [f for f in confs if os.path.isfile(os.path.join(confd, f))]
 
-    cfg = {}
-    for conf in confs:
-        cfg = mergedict(cfg, read_conf(os.path.join(confd, conf)))
-
-    return cfg
+    cfgs = []
+    for fn in confs:
+        cfgs.append(read_conf(os.path.join(confd, fn))
+    return mergemanydict(cfgs)
 
 
 def read_conf_with_confd(cfgfile):
@@ -667,8 +666,8 @@ def read_conf_with_confd(cfgfile):
     if not confd or not os.path.isdir(confd):
         return cfg
 
-    cfg = mergedict(read_conf_d(confd), cfg)
-    return cfg
+    # Conf.d settings override input configuration
+    return mergedict(read_conf_d(confd), cfg)
 
 
 def read_cc_from_cmdline(cmdline=None):

From 45cc6af3b6cdb9710fd8fa61d81c996fbe0b9681 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 22 Jun 2012 22:17:09 -0700
Subject: [PATCH 328/434] Fix syntax err, grrr

---
 cloudinit/util.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 4c521bc3..baa3def1 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -643,7 +643,8 @@ def read_conf_d(confd):
 
     cfgs = []
     for fn in confs:
-        cfgs.append(read_conf(os.path.join(confd, fn))
+        cfgs.append(read_conf(os.path.join(confd, fn)))
+
     return mergemanydict(cfgs)
 
 

From cf2745ebfc19fd0239059761493667ed354413ba Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 23:26:50 -0700
Subject: [PATCH 329/434] 1. Move the getkeybyid function back here but
 add some slight adjustments    a. Instead of executing a bash string, write
 out a temporary file       and then just execute '/bin/sh' on that file with
 the right arguments instead. 2. Rename util.SilentTemporaryFile to
 util.ExtendedTemporaryFile and update the usages    of the previous name
 accordingly, this better reflects what this temp file is. 3. More teenie pep8
 line length fixings

---
 cloudinit/config/cc_apt_update_upgrade.py | 27 ++++++++++++++++++++++-
 cloudinit/config/cc_bootcmd.py            |  3 +--
 cloudinit/config/cc_chef.py               |  2 +-
 cloudinit/config/cc_resizefs.py           |  4 ++--
 cloudinit/util.py                         | 22 +-----------------
 5 files changed, 31 insertions(+), 27 deletions(-)

diff --git a/cloudinit/config/cc_apt_update_upgrade.py b/cloudinit/config/cc_apt_update_upgrade.py
index 6719da52..8ecd9c94 100644
--- a/cloudinit/config/cc_apt_update_upgrade.py
+++ b/cloudinit/config/cc_apt_update_upgrade.py
@@ -29,6 +29,21 @@ distros = ['ubuntu', 'debian']
 PROXY_TPL = "Acquire::HTTP::Proxy \"%s\";\n"
 PROXY_FN = "/etc/apt/apt.conf.d/95cloud-init-proxy"
 
+# A temporary shell program to get a given gpg key
+# from a given keyserver
+EXPORT_GPG_KEYID = """
+    k=${1} ks=${2};
+    exec 2>/dev/null
+    [ -n "$k" ] || exit 1;
+    armour=$(gpg --list-keys --armour "${k}")
+    if [ -z "${armour}" ]; then
+       gpg --keyserver ${ks} --recv $k >/dev/null &&
+          armour=$(gpg --export --armour "${k}") &&
+          gpg --batch --yes --delete-keys "${k}"
+    fi
+    [ -n "${armour}" ] && echo "${armour}"
+"""
+
 
 def handle(_name, cfg, cloud, log, _args):
     update = util.get_cfg_option_bool(cfg, 'apt_update', False)
@@ -106,6 +121,16 @@ def handle(_name, cfg, cloud, log, _args):
         raise errors[-1]
 
 
+# get gpg keyid from keyserver
+def getkeybyid(keyid, keyserver):
+    with util.ExtendedTemporaryFile(suffix='.sh') as fh:
+        fh.write(EXPORT_GPG_KEYID)
+        fh.flush()
+        cmd = ['/bin/sh', fh.name, keyid, keyserver]
+        (stdout, _stderr) = util.subp(cmd)
+        return stdout.strip()
+
+
 def mirror2lists_fileprefix(mirror):
     string = mirror
     # take of http:// or ftp://
@@ -181,7 +206,7 @@ def add_sources(cloud, srclist, template_params=None):
             if 'keyserver' in ent:
                 ks = ent['keyserver']
             try:
-                ent['key'] = util.getkeybyid(ent['keyid'], ks)
+                ent['key'] = getkeybyid(ent['keyid'], ks)
             except:
                 errorlist.append([source, "failed to get key from %s" % ks])
                 continue
diff --git a/cloudinit/config/cc_bootcmd.py b/cloudinit/config/cc_bootcmd.py
index 89ccf3f1..bae1ea54 100644
--- a/cloudinit/config/cc_bootcmd.py
+++ b/cloudinit/config/cc_bootcmd.py
@@ -19,7 +19,6 @@
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
 import os
-import tempfile
 
 from cloudinit import util
 from cloudinit.settings import PER_ALWAYS
@@ -34,7 +33,7 @@ def handle(name, cfg, cloud, log, _args):
                    " no 'bootcmd' key in configuration"), name)
         return
 
-    with tempfile.NamedTemporaryFile(suffix=".sh") as tmpf:
+    with util.ExtendedTemporaryFile(suffix=".sh") as tmpf:
         try:
             content = util.shellify(cfg["bootcmd"])
             tmpf.write(content)
diff --git a/cloudinit/config/cc_chef.py b/cloudinit/config/cc_chef.py
index d682398a..6f568261 100644
--- a/cloudinit/config/cc_chef.py
+++ b/cloudinit/config/cc_chef.py
@@ -96,7 +96,7 @@ def handle(name, cfg, cloud, log, _args):
             install_chef_from_gems(cloud.distro, ruby_version, chef_version)
             # and finally, run chef-client
             log.debug('Running chef-client')
-            util.subp(['/usr/bin/chef-client', 
+            util.subp(['/usr/bin/chef-client',
                        '-d', '-i', '1800', '-s', '20'], capture=False)
         elif install_type == 'packages':
             # this will install and run the chef-client from packages
diff --git a/cloudinit/config/cc_resizefs.py b/cloudinit/config/cc_resizefs.py
index 7e1428e9..69cd8872 100644
--- a/cloudinit/config/cc_resizefs.py
+++ b/cloudinit/config/cc_resizefs.py
@@ -79,8 +79,8 @@ def handle(name, cfg, cloud, log, args):
 
     # TODO: allow what is to be resized to be configurable??
     resize_what = cloud.paths.join(False, "/")
-    with util.SilentTemporaryFile(prefix="cloudinit.resizefs.",
-                                  dir=resize_root_d, delete=True) as tfh:
+    with util.ExtendedTemporaryFile(prefix="cloudinit.resizefs.",
+                                    dir=resize_root_d, delete=True) as tfh:
         devpth = tfh.name
 
         # Delete the file so that mknod will work
diff --git a/cloudinit/util.py b/cloudinit/util.py
index baa3def1..6cdf9ff3 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -157,7 +157,7 @@ class MountFailedError(Exception):
     pass
 
 
-def SilentTemporaryFile(**kwargs):
+def ExtendedTemporaryFile(**kwargs):
     fh = tempfile.NamedTemporaryFile(**kwargs)
     # Replace its unlink with a quiet version
     # that does not raise errors when the
@@ -517,26 +517,6 @@ def del_dir(path):
     shutil.rmtree(path)
 
 
-# get gpg keyid from keyserver
-def getkeybyid(keyid, keyserver):
-    # TODO fix this...
-    shcmd = """
-    k=${1} ks=${2};
-    exec 2>/dev/null
-    [ -n "$k" ] || exit 1;
-    armour=$(gpg --list-keys --armour "${k}")
-    if [ -z "${armour}" ]; then
-       gpg --keyserver ${ks} --recv $k >/dev/null &&
-          armour=$(gpg --export --armour "${k}") &&
-          gpg --batch --yes --delete-keys "${k}"
-    fi
-    [ -n "${armour}" ] && echo "${armour}"
-    """
-    args = ['sh', '-c', shcmd, "export-gpg-keyid", keyid, keyserver]
-    (stdout, _stderr) = subp(args)
-    return stdout
-
-
 def runparts(dirp, skip_no_exist=True):
     if skip_no_exist and not os.path.isdir(dirp):
         return

From 46baea3eadc702364c9f9d2eb3a05e3557576740 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 23:36:08 -0700
Subject: [PATCH 330/434] Use os.path.join instead of custom string path
 formation

---
 cloudinit/config/cc_apt_update_upgrade.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/cloudinit/config/cc_apt_update_upgrade.py b/cloudinit/config/cc_apt_update_upgrade.py
index 8ecd9c94..42b6f3e9 100644
--- a/cloudinit/config/cc_apt_update_upgrade.py
+++ b/cloudinit/config/cc_apt_update_upgrade.py
@@ -133,7 +133,7 @@ def getkeybyid(keyid, keyserver):
 
 def mirror2lists_fileprefix(mirror):
     string = mirror
-    # take of http:// or ftp://
+    # take off http:// or ftp://
     if string.endswith("/"):
         string = string[0:-1]
     pos = string.find("://")
@@ -144,8 +144,8 @@ def mirror2lists_fileprefix(mirror):
 
 
 def rename_apt_lists(omirror, new_mirror, lists_d="/var/lib/apt/lists"):
-    oprefix = "%s/%s" % (lists_d, mirror2lists_fileprefix(omirror))
-    nprefix = "%s/%s" % (lists_d, mirror2lists_fileprefix(new_mirror))
+    oprefix = os.path.join(lists_d, mirror2lists_fileprefix(omirror))
+    nprefix = os.path.join(lists_d, mirror2lists_fileprefix(new_mirror))
     if oprefix == nprefix:
         return
     olen = len(oprefix)

From e06021a61bfe35b89b2e42db3279f43d2957027f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 22 Jun 2012 23:43:48 -0700
Subject: [PATCH 331/434] Don't complete the update if there is no datasource
 or if writing to cache fails

---
 cloudinit/stages.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index cfe1c071..3ed13009 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -178,10 +178,13 @@ class Init(object):
             return None
 
     def _write_to_cache(self):
+        if not self.datasource:
+            return False
         pickled_fn = self.paths.get_ipath_cur("obj_pkl")
         try:
             contents = pickle.dumps(self.datasource)
             util.write_file(pickled_fn, contents, mode=0400)
+            return True
         except Exception:
             util.logexc(LOG, "Failed pickling datasource to %s", pickled_fn)
             return False
@@ -292,7 +295,8 @@ class Init(object):
                            self.distro, helpers.Runners(self.paths))
 
     def update(self):
-        self._write_to_cache()
+        if not self._write_to_cache():
+            return
         self._store_userdata()
 
     def _store_userdata(self):

From 8ce86713f6b3df5717b05ced13b1393b71b24b4a Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sat, 23 Jun 2012 14:59:16 -0700
Subject: [PATCH 332/434] 1. Separate the pep8 check from the pylint check   
 a. This allows them to be run as different tools (if desired) 2. Adjust the
 makefile to have a 'make pep8' section which can run this new script

---
 Makefile       |  5 ++++-
 tools/run-pep8 | 28 ++++++++++++++++++++++++++++
 2 files changed, 32 insertions(+), 1 deletion(-)
 create mode 100755 tools/run-pep8

diff --git a/Makefile b/Makefile
index ab23bf1f..c20dfbd3 100644
--- a/Makefile
+++ b/Makefile
@@ -4,6 +4,9 @@ PY_FILES+="bin/cloud-init"
 
 all: test
 
+pep8:
+	$(CWD)/tools/run-pep8 $(PY_FILES)
+
 pylint:
 	$(CWD)/tools/run-pylint $(PY_FILES)
 
@@ -20,5 +23,5 @@ clean:
 	rm -rf /var/log/cloud-init.log \
 		   /var/lib/cloud/
 
-.PHONY: test pylint pyflakes 2to3 clean
+.PHONY: test pylint pyflakes 2to3 clean pep8
 
diff --git a/tools/run-pep8 b/tools/run-pep8
new file mode 100755
index 00000000..e7707985
--- /dev/null
+++ b/tools/run-pep8
@@ -0,0 +1,28 @@
+#!/bin/bash
+
+ci_files='cloud*.py cloudinit/*.py cloudinit/config/*.py'
+test_files=$(find tests -name "*.py")
+def_files="$ci_files $test_files"
+
+if [ $# -eq 0 ]; then
+   files=( )
+   for f in $def_files; do
+      [ -f "$f" ] || { echo "failed, $f not a file" 1>&2; exit 1; }
+      files[${#files[@]}]=${f}
+   done
+else
+   files=( "$@" );
+fi 
+
+cmd=(
+    pep8
+
+    --ignore=E501 # Line too long (these are caught by pylint)
+
+    "${files[@]}"
+)
+
+echo -e "\nRunning pep8:"
+echo "${cmd[@]}"
+"${cmd[@]}"
+

From b1f86c97b8b0a2ae65e58ad3da67d6f71254a4ba Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sat, 23 Jun 2012 15:00:06 -0700
Subject: [PATCH 333/434] Remove the pep8 tool from being run in a script that
 has a name that seems to just say it will run pylint. Put the pep8 tool in a
 'run-pep8' script.

---
 tools/run-pylint | 13 +------------
 1 file changed, 1 insertion(+), 12 deletions(-)

diff --git a/tools/run-pylint b/tools/run-pylint
index 46748ffb..dd6369aa 100755
--- a/tools/run-pylint
+++ b/tools/run-pylint
@@ -1,6 +1,6 @@
 #!/bin/bash
 
-ci_files='cloud*.py cloudinit/*.py cloudinit/CloudConfig/*.py'
+ci_files='cloud*.py cloudinit/*.py cloudinit/config/*.py'
 test_files=$(find tests -name "*.py")
 def_files="$ci_files $test_files"
 
@@ -38,14 +38,3 @@ echo -e "\nRunning pylint:"
 echo "${cmd[@]}"
 "${cmd[@]}"
 
-cmd=(
-    pep8
-
-    --ignore=E501 # Line too long (these are caught by pylint above)
-
-    "${files[@]}"
-)
-
-echo -e "\nRunning pep8:"
-echo "${cmd[@]}"
-"${cmd[@]}"

From 77a6781fc39a0551b5e8ace32a97e2ba0fcc23ec Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sat, 23 Jun 2012 15:00:41 -0700
Subject: [PATCH 334/434] 1. Use a common config merging class now in helpers  
  that will be the central point of config fetching    for both the 'init'
 stage and the 'module' stages    a. This helps those who want to understand
 exactly       what configs are fetched and how the merging occurs.

---
 cloudinit/helpers.py | 82 +++++++++++++++++++++++++++++++++++++++++++-
 cloudinit/stages.py  | 59 ++++++++-----------------------
 2 files changed, 96 insertions(+), 45 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 7a2ac6b8..0f86285f 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -28,7 +28,8 @@ import os
 
 from ConfigParser import (NoSectionError, NoOptionError, RawConfigParser)
 
-from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS, PER_ONCE)
+from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS, PER_ONCE,
+                                CFG_ENV_NAME)
 
 from cloudinit import log as logging
 from cloudinit import util
@@ -176,6 +177,85 @@ class Runners(object):
                 return (True, results)
 
 
+class ConfigMerger(object):
+    def __init__(self, paths=None, datasource=None,
+                 additional_fns=None, base_cfg=None):
+        self._paths = paths
+        self._ds = datasource
+        self._fns = additional_fns
+        self._base_cfg = base_cfg
+        # Created on first use
+        self._cfg = None
+
+    def _get_datasource_configs(self):
+        d_cfgs = []
+        if self._ds:
+            try:
+                ds_cfg = self._ds.get_config_obj()
+                if ds_cfg and isinstance(ds_cfg, (dict)):
+                    d_cfgs.append(ds_cfg)
+            except:
+                util.logexc(LOG, ("Failed loading of datasource"
+                                  " config object from %s"), self._ds)
+        return d_cfgs
+
+    def _get_env_configs(self):
+        e_cfgs = []
+        if CFG_ENV_NAME in os.environ:
+            e_fn = os.environ[CFG_ENV_NAME]
+            try:
+                e_cfgs.append(util.read_conf(e_fn))
+            except:
+                util.logexc(LOG, ('Failed loading of env. config'
+                                  ' from %s'), e_fn)
+        return e_cfgs
+
+    def _get_instance_configs(self):
+        i_cfgs = []
+        # If cloud-config was written, pick it up as
+        # a configuration file to use when running...
+        if not self._paths:
+            return i_cfgs
+        cc_fn = self._paths.get_ipath_cur('cloud_config')
+        if cc_fn and os.path.isfile(cc_fn):
+            try:
+                i_cfgs.append(util.read_conf(cc_fn))
+            except:
+                util.logexc(LOG, ('Failed loading of cloud-config'
+                                      ' from %s'), cc_fn)
+        return i_cfgs
+
+    def _read_cfg(self):
+        # Input config files override
+        # env config files which
+        # override instance configs
+        # which override datasource
+        # configs which override
+        # base configuration
+        cfgs = []
+        if self._fns:
+            for c_fn in self._fns:
+                try:
+                    cfgs.append(util.read_conf(c_fn))
+                except:
+                    util.logexc(LOG, ("Failed loading of configuration"
+                                       " from %s"), c_fn)
+
+        cfgs.extend(self._get_env_configs())
+        cfgs.extend(self._get_instance_configs())
+        cfgs.extend(self._get_datasource_configs())
+        if self._base_cfg:
+            cfgs.append(self._base_cfg)
+        return util.mergemanydict(cfgs)
+
+    @property
+    def cfg(self):
+        # None check to avoid empty case causing re-reading
+        if self._cfg is None:
+            self._cfg = self._read_cfg()
+        return self._cfg
+
+
 class ContentHandlers(object):
 
     def __init__(self):
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index cfe1c071..1846dd4d 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -147,23 +147,16 @@ class Init(object):
             LOG.debug("Loaded 'init' config %s", self._cfg)
 
     def _read_cfg(self, extra_fns):
-        # Read extra files provided (if any)
-        i_cfgs = []
-        if extra_fns:
-            for fn in extra_fns:
-                try:
-                    fn_cfg = util.read_conf(fn)
-                    i_cfgs.append(fn_cfg)
-                except:
-                    util.logexc(LOG, ("Failed loading of additional"
-                                      " configuration from %s"), fn)
-        # Now read in the built-in + base
         try:
-            conf = util.get_base_cfg(builtin=util.get_builtin_cfg())
+            base_conf = util.get_base_cfg(builtin=util.get_builtin_cfg())
         except Exception:
-            conf = util.get_builtin_cfg()
-        i_cfgs.append(conf)
-        return util.mergemanydict(i_cfgs)
+            base_conf = util.get_builtin_cfg()
+        no_cfg_pths = helpers.Paths({}, self.datasource)
+        merger = helpers.ConfigMerger(paths=no_cfg_pths,
+                                      datasource=self.datasource,
+                                      additional_fns=extra_fns,
+                                      base_cfg=base_conf)
+        return merger.cfg
 
     def _restore_from_cache(self):
         pickled_fn = self.paths.get_ipath_cur('obj_pkl')
@@ -392,46 +385,24 @@ class Init(object):
 
 class Modules(object):
     def __init__(self, init, cfg_files=None):
-        self.datasource = init.datasource
-        self.cfg_files = cfg_files
-        self.base_cfg = init.cfg
         self.init = init
+        self.cfg_files = cfg_files
         # Created on first use
         self._cached_cfg = None
 
     @property
     def cfg(self):
-        # None check to avoid empty case
+        # None check to avoid empty case causing re-reading
         if self._cached_cfg is None:
-            self._cached_cfg = self._get_config()
+            merger = helpers.ConfigMerger(paths=self.init.paths,
+                                          datasource=self.init.datasource,
+                                          fns=self.cfg_files,
+                                          base_cfg=self.init.cfg)
+            self._cached_cfg = merger.cfg
             LOG.debug("Loading 'module' config %s", self._cached_cfg)
         # Only give out a copy so that others can't modify this...
         return copy.deepcopy(self._cached_cfg)
 
-    def _get_config(self):
-        t_cfgs = []
-        if self.cfg_files:
-            for fn in self.cfg_files:
-                try:
-                    t_cfgs.append(util.read_conf(fn))
-                except:
-                    util.logexc(LOG, ("Failed loading of configuration"
-                                       " from %s"), fn)
-
-        if self.datasource:
-            try:
-                d_cfg = self.datasource.get_config_obj()
-                if d_cfg:
-                    t_cfgs.append(d_cfg)
-            except:
-                util.logexc(LOG, ("Failed loading of datasource"
-                                  " config object from %s"), self.datasource)
-
-        if self.base_cfg:
-            t_cfgs.append(self.base_cfg)
-
-        return util.mergemanydict(t_cfgs)
-
     def _read_modules(self, name):
         module_list = []
         if name not in self.cfg:

From a299fdea70b724f649ccea3899d96ba0b13a4c14 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 12:27:47 -0700
Subject: [PATCH 335/434] Removed this, since it doesn't offer any value.

---
 install.sh | 31 -------------------------------
 1 file changed, 31 deletions(-)
 delete mode 100755 install.sh

diff --git a/install.sh b/install.sh
deleted file mode 100755
index e7521bfa..00000000
--- a/install.sh
+++ /dev/null
@@ -1,31 +0,0 @@
-#!/bin/sh
-
-#                    cd $(DEB_SRCDIR) && $(call cdbs_python_binary,python$(cdbs_python_compile_version)) $(DEB_PYTHON_SETUP_CMD) install --root=$(cdbs_python_destdir) $(DEB_PYTHON_INSTALL_ARGS_ALL)
-#                    for ddir in $(cdbs_python_destdir)/usr/lib/python?.?/dist-packages; do \
-#                      [ -d $$ddir ] || continue; \
-#                      sdir=$$(dirname $$ddir)/site-packages; \
-#                      mkdir -p $$sdir; \
-#                      tar -c -f - -C $$ddir . | tar -x -f - -C $$sdir; \
-#                      rm -rf $$ddir; \
-#                    done
-
-DEB_PYTHON_INSTALL_ARGS_ALL="-O0 --install-layout=deb"
-rm -Rf build
-
-destdir=$(readlink -f ${1})
-[ -z "${destdir}" ] && { echo "give destdir"; exit 1; }
-cd $(dirname ${0})
-./setup.py install --root=${destdir} ${DEB_PYTHON_INSTALL_ARGS_ALL}
-
-#mkdir -p ${destdir}/usr/share/pyshared
-#for x in ${destdir}/usr/lib/python2.6/dist-packages/*; do
-#   [ -d "$x" ] || continue
-#   [ ! -d "${destdir}/usr/share/pyshared/${x##*/}" ] ||
-#      rm -Rf "${destdir}/usr/share/pyshared/${x##*/}"
-#   mv $x ${destdir}/usr/share/pyshared
-#done
-#rm -Rf ${destdir}/usr/lib/python2.6
-
-for x in "${destdir}/usr/bin/"*.py; do
-   [ -f "${x}" ] && mv "${x}" "${x%.py}"
-done

From bfb728fbe8f3a0a4e094804ed2c497c7ec224469 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 12:28:04 -0700
Subject: [PATCH 336/434] Add warning when hitting an unknown API.

---
 tools/mock-meta.py | 13 ++++++++++---
 1 file changed, 10 insertions(+), 3 deletions(-)

diff --git a/tools/mock-meta.py b/tools/mock-meta.py
index d4677af6..0f13acd6 100755
--- a/tools/mock-meta.py
+++ b/tools/mock-meta.py
@@ -6,10 +6,11 @@
 
 import functools
 import httplib
+import json
 import logging
-import sys
-import string
 import random
+import string
+import sys
 import yaml
 
 from optparse import OptionParser
@@ -88,6 +89,8 @@ PLACEMENT_CAPABILITIES = {
     'availability-zone': AVAILABILITY_ZONES,
 }
 
+NOT_IMPL_RESPONSE = json.dumps({})
+
 
 class WebException(Exception):
     def __init__(self, code, msg):
@@ -181,7 +184,11 @@ class MetaDataHandler(object):
                 else:
                     return "%s" % (PLACEMENT_CAPABILITIES.get(pentry, ''))
         else:
-            return '{}'
+            log.warn(("Did not implement action %s, "
+                      "returning empty response: %r"),
+                      action, NOT_IMPL_RESPONSE)
+            return NOT_IMPL_RESPONSE
+
 
 class UserDataHandler(object):
 

From 87a0c46d22c1501ffb2fb882185eba2dd5c69a5c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 12:28:59 -0700
Subject: [PATCH 337/434] 1. Moving around the packages dir. 2. Adjusting the
 bddeb shell script 3. Starting to add a brpm

---
 packages/bddeb                                | 62 +++++++++++++++++++
 packages/brpm                                 |  3 +
 .../debian.trunk}/changelog                   |  0
 .../debian.trunk}/compat                      |  0
 .../debian.trunk}/control                     |  0
 .../debian.trunk}/copyright                   |  0
 {debian.trunk => packages/debian.trunk}/dirs  |  0
 .../debian.trunk}/pycompat                    |  0
 {debian.trunk => packages/debian.trunk}/rules |  0
 {tools => packages}/make-dist-tarball         |  4 +-
 tools/bddeb                                   | 33 ----------
 11 files changed, 67 insertions(+), 35 deletions(-)
 create mode 100755 packages/bddeb
 create mode 100755 packages/brpm
 rename {debian.trunk => packages/debian.trunk}/changelog (100%)
 rename {debian.trunk => packages/debian.trunk}/compat (100%)
 rename {debian.trunk => packages/debian.trunk}/control (100%)
 rename {debian.trunk => packages/debian.trunk}/copyright (100%)
 rename {debian.trunk => packages/debian.trunk}/dirs (100%)
 rename {debian.trunk => packages/debian.trunk}/pycompat (100%)
 rename {debian.trunk => packages/debian.trunk}/rules (100%)
 rename {tools => packages}/make-dist-tarball (91%)
 delete mode 100755 tools/bddeb

diff --git a/packages/bddeb b/packages/bddeb
new file mode 100755
index 00000000..74932985
--- /dev/null
+++ b/packages/bddeb
@@ -0,0 +1,62 @@
+#!/bin/sh 
+
+# Ensure we can find the setup.py file which
+# should be at the root of the cloud-init tree
+PKG_DIR=`pwd`
+ROOT="$PKG_DIR/../"
+if [ ! -e "$ROOT/setup.py" ]; then
+    echo "No setup.py found at $ROOT"
+    exit 1
+fi
+echo "Using root directory $ROOT for building your debian package"
+
+# Ensure tempdir is cleaned and ready to go
+TEMP_D=$(mktemp -d "${TMPDIR:-/tmp}/${0##*/}.XXXXXXX")
+echo "With $TEMP_D as a temporary workspace"
+rm -Rf "${TEMP_D}"; mkdir "${TEMP_D}"
+set -e
+
+# Ensure tempdir removed if breaks...
+trap "rm -Rf '${TEMP_D}'" EXIT SIGINT SIGTERM
+
+# Go to the root and start making a package!
+cd $ROOT
+files=$(bzr ls --versioned)
+revno=$(bzr revno)
+version=$(awk -F: \
+   '$1 ~ /[0-9][.][0-9]+[.][0-9]+/ { print $1 ; exit(0); }' ChangeLog )
+
+# Ensure that the version found in 'Changelog' is the same in the python 
+# cloud-init version directory
+py_version=$(python -c 'from cloudinit import version; import sys; \
+sys.stdout.write(version.version_string())')
+
+# Canonicalize the changelog version
+ch_version=$(python -c "from distutils import version; import sys; \
+sys.stdout.write(str(version.StrictVersion('$version')));")
+
+if [ "$py_version" != "$ch_version" ]; then
+    echo "Cloud-init python version $py_version" \
+         " != changelog version $ch_version"
+    echo "Please ensure they are the same!"
+    exit 1
+fi
+
+mkdir "${TEMP_D}/cloud-init"
+otar="$TEMP_D/cloud-init_$version~bzr${revno}.orig.tar.gz"
+tar -czf - ${files} > "$otar"
+tar -C "${TEMP_D}/cloud-init" -xzf - < "$otar"
+
+if [ ! -d "${TEMP_D}/cloud-init/debian" ]; then
+   rsync -a $PKG_DIR/debian.trunk/ "${TEMP_D}/cloud-init/debian"
+fi
+
+sed -i -e "s,VERSION,$version," -e "s,REVNO,bzr$revno," \
+          "$TEMP_D/cloud-init/debian/changelog"
+
+cd "${TEMP_D}/cloud-init"
+debuild "$@"
+debname="cloud-init_${version}~bzr${revno}-1_all.deb"
+mv "../$debname" "$PKG_DIR"
+echo "Wrote $debname to $PKG_DIR"
+
diff --git a/packages/brpm b/packages/brpm
new file mode 100755
index 00000000..829303ea
--- /dev/null
+++ b/packages/brpm
@@ -0,0 +1,3 @@
+#!/bin/sh
+
+
diff --git a/debian.trunk/changelog b/packages/debian.trunk/changelog
similarity index 100%
rename from debian.trunk/changelog
rename to packages/debian.trunk/changelog
diff --git a/debian.trunk/compat b/packages/debian.trunk/compat
similarity index 100%
rename from debian.trunk/compat
rename to packages/debian.trunk/compat
diff --git a/debian.trunk/control b/packages/debian.trunk/control
similarity index 100%
rename from debian.trunk/control
rename to packages/debian.trunk/control
diff --git a/debian.trunk/copyright b/packages/debian.trunk/copyright
similarity index 100%
rename from debian.trunk/copyright
rename to packages/debian.trunk/copyright
diff --git a/debian.trunk/dirs b/packages/debian.trunk/dirs
similarity index 100%
rename from debian.trunk/dirs
rename to packages/debian.trunk/dirs
diff --git a/debian.trunk/pycompat b/packages/debian.trunk/pycompat
similarity index 100%
rename from debian.trunk/pycompat
rename to packages/debian.trunk/pycompat
diff --git a/debian.trunk/rules b/packages/debian.trunk/rules
similarity index 100%
rename from debian.trunk/rules
rename to packages/debian.trunk/rules
diff --git a/tools/make-dist-tarball b/packages/make-dist-tarball
similarity index 91%
rename from tools/make-dist-tarball
rename to packages/make-dist-tarball
index d6d53aa7..622283bd 100755
--- a/tools/make-dist-tarball
+++ b/packages/make-dist-tarball
@@ -9,7 +9,7 @@ Usage: ${0##*/} version
 EOF
 }
 
-topdir=$PWD
+topdir="../$PWD"
 tag=${1}
 
 [ -n "$tag" ] || { Usage 1>&2 ; exit 1; }
@@ -22,4 +22,4 @@ out=${topdir}/cloud-init-${tag}.tar.gz
 cd ${tmpd} && 
    bzr branch -r "tag:${tag}" "${topdir}" ./cloud-init-${tag} &&
    tar czf "${out}" cloud-init-${tag}/ --exclude cloud-init-${tag}/.bzr &&
-   echo "wrote ${out}"
+   echo "Wrote ${out}"
diff --git a/tools/bddeb b/tools/bddeb
deleted file mode 100755
index b162b06f..00000000
--- a/tools/bddeb
+++ /dev/null
@@ -1,33 +0,0 @@
-#!/bin/sh
-
-TEMP_D=$(mktemp -d "${TMPDIR:-/tmp}/${0##*/}.XXXXXXX")
-#TEMP_D=/tmp/my.d
-start=${PWD}
-rm -Rf "${TEMP_D}"; mkdir "${TEMP_D}"
-set -e
-trap "rm -Rf '${TEMP_D}'" exit
-files=$(bzr ls --versioned)
-revno=$(bzr revno)
-version=$(awk -F: \
-   '$1 ~ /[0-9][.][0-9]+[.][0-9]+/ { print $1 ; exit(0); }' ChangeLog )
-mkdir "${TEMP_D}/cloud-init"
-otar="$TEMP_D/cloud-init_$version~bzr${revno}.orig.tar.gz"
-tar -czf - ${files} > "$otar"
-tar -C "${TEMP_D}/cloud-init" -xzf - <"$otar"
-
-if [ ! -d "${TEMP_D}/cloud-init/debian" ]; then
-   rsync -a debian.trunk/ "${TEMP_D}/cloud-init/debian"
-fi
-sed -i -e "s,VERSION,$version," -e "s,REVNO,bzr$revno," \
-   "$TEMP_D/cloud-init/debian/changelog"
-cd "${TEMP_D}/cloud-init"
-debuild "$@"
-#for x in ../*.deb; do
-#   echo wrote ${x##*/}
-#done
-debname="cloud-init_${version}~bzr${revno}-1_all.deb"
-mv "../$debname" "$start"
-link="$start/cloud-init_all.deb"
-echo "wrote $debname"
-[ ! -e "$link" -o -L "$link" ] 
-   { ln -sf "$debname" "$link" && echo "linked ${link##*/}"; }

From f9bd9be426a77949411e9345036a1b8e59be0b28 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 13:07:00 -0700
Subject: [PATCH 338/434] This will be an rpm template file for the eventual
 specfile that will be created.

---
 packages/brpm.tmpl | 173 +++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 173 insertions(+)
 create mode 100644 packages/brpm.tmpl

diff --git a/packages/brpm.tmpl b/packages/brpm.tmpl
new file mode 100644
index 00000000..141578a5
--- /dev/null
+++ b/packages/brpm.tmpl
@@ -0,0 +1,173 @@
+%{!?python_sitelib: %global python_sitelib %(%{__python} -c "from distutils.sysconfig import get_python_lib; print get_python_lib()")}
+
+Name:           cloud-init
+Version:        {{version}}
+Release:        {{release}}%{?dist}
+Summary:        Cloud instance init scripts
+
+Group:          System Environment/Base
+License:        GPLv3
+URL:            http://launchpad.net/cloud-init
+
+Source0:        %{name}-%{version}-bzr532.tar.gz
+
+BuildArch:      noarch
+BuildRoot:      %{_tmppath}/%{name}-%{version}-%{release}-root-%(%{__id_u} -n)
+
+BuildRequires:  python-devel
+BuildRequires:  python-setuptools-devel
+Requires:       e2fsprogs
+Requires:       iproute
+Requires:       libselinux-python
+Requires:       net-tools
+Requires:       procps
+Requires:       python-boto
+Requires:       python-cheetah
+Requires:       python-configobj
+Requires:       PyYAML
+Requires:       rsyslog
+Requires:       shadow-utils
+Requires:       /usr/bin/run-parts
+Requires(post):   chkconfig
+Requires(preun):  chkconfig
+Requires(postun): initscripts
+
+%description
+Cloud-init is a set of init scripts for cloud instances.  Cloud instances
+need special scripts to run during initialization to retrieve and install
+ssh keys and to let the user run various scripts.
+
+
+%prep
+%setup -q -n %{name}-%{version}-bzr532
+%patch0 -p0
+%patch1 -p0
+%patch2 -p1
+%patch3 -p1
+
+cp -p %{SOURCE2} README.fedora
+
+
+%build
+%{__python} setup.py build
+
+
+%install
+rm -rf $RPM_BUILD_ROOT
+%{__python} setup.py install -O1 --skip-build --root $RPM_BUILD_ROOT
+
+for x in $RPM_BUILD_ROOT/%{_bindir}/*.py; do mv "$x" "${x%.py}"; done
+chmod +x $RPM_BUILD_ROOT/%{python_sitelib}/cloudinit/SshUtil.py
+mkdir -p $RPM_BUILD_ROOT/%{_sharedstatedir}/cloud
+
+# We supply our own config file since our software differs from Ubuntu's.
+cp -p %{SOURCE1} $RPM_BUILD_ROOT/%{_sysconfdir}/cloud/cloud.cfg
+
+# Note that /etc/rsyslog.d didn't exist by default until F15.
+# el6 request: https://bugzilla.redhat.com/show_bug.cgi?id=740420
+mkdir -p $RPM_BUILD_ROOT/%{_sysconfdir}/rsyslog.d
+cp -p tools/21-cloudinit.conf $RPM_BUILD_ROOT/%{_sysconfdir}/rsyslog.d/21-cloudinit.conf
+
+# Install the init scripts
+install -p -D -m 755 %{SOURCE3} %{buildroot}%{_initrddir}/cloud-config
+install -p -D -m 755 %{SOURCE4} %{buildroot}%{_initrddir}/cloud-final
+install -p -D -m 755 %{SOURCE5} %{buildroot}%{_initrddir}/cloud-init
+install -p -D -m 755 %{SOURCE6} %{buildroot}%{_initrddir}/cloud-init-local
+
+
+%clean
+rm -rf $RPM_BUILD_ROOT
+
+
+%post
+if [ $1 -eq 1 ] ; then
+    # Initial installation
+    # Enabled by default per "runs once then goes away" exception
+    for svc in config final init init-local; do
+        chkconfig --add cloud-$svc
+        chkconfig cloud-$svc on
+    done
+fi
+
+%preun
+if [ $1 -eq 0 ] ; then
+    # Package removal, not upgrade
+    for svc in config final init init-local; do
+        chkconfig --del cloud-$svc
+        chkconfig cloud-$svc on
+    done
+    # One-shot services -> no need to stop
+fi
+
+%postun
+# One-shot services -> no need to restart
+
+
+%files
+%doc ChangeLog LICENSE TODO README.fedora
+%config(noreplace) %{_sysconfdir}/cloud/cloud.cfg
+%dir               %{_sysconfdir}/cloud/cloud.cfg.d
+%config(noreplace) %{_sysconfdir}/cloud/cloud.cfg.d/*.cfg
+%doc               %{_sysconfdir}/cloud/cloud.cfg.d/README
+%dir               %{_sysconfdir}/cloud/templates
+%config(noreplace) %{_sysconfdir}/cloud/templates/*
+%{_initrddir}/cloud-*
+%{python_sitelib}/*
+%{_libexecdir}/%{name}
+%{_bindir}/cloud-init*
+%doc %{_datadir}/doc/%{name}
+%dir %{_sharedstatedir}/cloud
+
+%config(noreplace) %{_sysconfdir}/rsyslog.d/21-cloudinit.conf
+
+
+%changelog
+* Mon Jun 18 2012 Pádraig Brady <P@draigBrady.com> - 0.6.3-0.6.bzr532
+- Further adjustments to support EPEL 6
+
+* Fri Jun 15 2012 Tomas Karasek <tomas.karasek@cern.ch> - 0.6.3-0.5.bzr532
+- Fix cloud-init-cfg invocation in init script
+
+* Tue May 22 2012 Pádraig Brady <P@draigBrady.com> - 0.6.3-0.4.bzr532
+- Support EPEL 6
+
+* Sat Mar 31 2012 Andy Grimm <agrimm@gmail.com> - 0.6.3-0.2.bzr532
+- Fixed incorrect interpretation of relative path for
+  AuthorizedKeysFile (BZ #735521)
+
+* Mon Mar  5 2012 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.3-0.1.bzr532
+- Rebased against upstream rev 532
+- Fixed runparts() incompatibility with Fedora
+
+* Thu Jan 12 2012 Fedora Release Engineering <rel-eng@lists.fedoraproject.org> - 0.6.2-0.8.bzr457
+- Rebuilt for https://fedoraproject.org/wiki/Fedora_17_Mass_Rebuild
+
+* Wed Oct  5 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.7.bzr457
+- Disabled SSH key-deleting on startup
+
+* Wed Sep 28 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.6.bzr457
+- Consolidated selinux file context patches
+- Fixed cloud-init.service dependencies
+- Updated sshkeytypes patch
+- Dealt with differences from Ubuntu's sshd
+
+* Sat Sep 24 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.5.bzr457
+- Rebased against upstream rev 457
+- Added missing dependencies
+
+* Fri Sep 23 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.4.bzr450
+- Added more macros to the spec file
+
+* Fri Sep 23 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.3.bzr450
+- Fixed logfile permission checking
+- Fixed SSH key generation
+- Fixed a bad method call in FQDN-guessing [LP:857891]
+- Updated localefile patch
+- Disabled the grub_dpkg module
+- Fixed failures due to empty script dirs [LP:857926]
+
+* Fri Sep 23 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.2.bzr450
+- Updated tzsysconfig patch
+
+* Wed Sep 21 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.1.bzr450
+- Initial packaging

From 11860840a5e4a3eb4b2aa495800afe4de8d72ee0 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 13:07:17 -0700
Subject: [PATCH 339/434] This tool knows how to extract the current version
 from the 'ChangeLog' file.

---
 tools/read-version | 51 ++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 51 insertions(+)
 create mode 100755 tools/read-version

diff --git a/tools/read-version b/tools/read-version
new file mode 100755
index 00000000..4458c712
--- /dev/null
+++ b/tools/read-version
@@ -0,0 +1,51 @@
+#!/usr/bin/python
+# vi: ts=4 expandtab
+
+import os
+import sys
+import re
+
+def parse_versions(fn):
+    with open(fn, 'r') as fh:
+        lines = fh.read().splitlines()
+    versions = []
+    for line in lines:
+        line = line.strip()
+        if line.startswith("-") or not line:
+            continue
+        if not re.match(r"[\d]", line):
+            continue
+        line = line.strip(":")
+        if (re.match(r"^[\d+]\.[\d+]\.[\d+]$", line) or
+            re.match(r"^[\d+]\.[\d+]$", line)):
+            versions.append(line)
+    return versions
+
+def find_changelog(args):
+    p_files = []
+    if args:
+        p_files.append(args[0])
+    p_files.append(os.path.join(os.pardir, "ChangeLog"))
+    p_files.append(os.path.join(os.getcwd(), 'ChangeLog'))
+    found = None
+    for fn in p_files:
+        if os.path.isfile(fn):
+            found = fn
+            break
+    return found
+
+
+if __name__ == '__main__':
+    run_args = sys.argv[1:]
+    fn = find_changelog(run_args)
+    if not fn:
+        sys.stderr.write("'ChangeLog' file not found!\n")
+        sys.exit(1)
+    else:
+        versions = parse_versions(fn)
+        if not versions:
+            sys.stderr.write("No versions found in %s!\n" % (fn))
+            sys.exit(1)
+        else:
+            sys.stdout.write(versions[0].strip())
+            sys.exit(0)

From fa9d76421245252fbdf63eb8c0a0f80a5defbd87 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 13:07:40 -0700
Subject: [PATCH 340/434] Use the new version extraction tool to get the
 current active version.

---
 packages/bddeb | 19 +------------------
 1 file changed, 1 insertion(+), 18 deletions(-)

diff --git a/packages/bddeb b/packages/bddeb
index 74932985..2a089295 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -23,24 +23,7 @@ trap "rm -Rf '${TEMP_D}'" EXIT SIGINT SIGTERM
 cd $ROOT
 files=$(bzr ls --versioned)
 revno=$(bzr revno)
-version=$(awk -F: \
-   '$1 ~ /[0-9][.][0-9]+[.][0-9]+/ { print $1 ; exit(0); }' ChangeLog )
-
-# Ensure that the version found in 'Changelog' is the same in the python 
-# cloud-init version directory
-py_version=$(python -c 'from cloudinit import version; import sys; \
-sys.stdout.write(version.version_string())')
-
-# Canonicalize the changelog version
-ch_version=$(python -c "from distutils import version; import sys; \
-sys.stdout.write(str(version.StrictVersion('$version')));")
-
-if [ "$py_version" != "$ch_version" ]; then
-    echo "Cloud-init python version $py_version" \
-         " != changelog version $ch_version"
-    echo "Please ensure they are the same!"
-    exit 1
-fi
+version=$(tools/read-version)
 
 mkdir "${TEMP_D}/cloud-init"
 otar="$TEMP_D/cloud-init_$version~bzr${revno}.orig.tar.gz"

From be8b3cdaec23c4f33d3beecbc15b1af89892374f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 13:07:57 -0700
Subject: [PATCH 341/434] Continue working on getting a specfile generated.

---
 packages/brpm | 44 +++++++++++++++++++++++++++++++++++++++++++-
 1 file changed, 43 insertions(+), 1 deletion(-)

diff --git a/packages/brpm b/packages/brpm
index 829303ea..f2c3dac4 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -1,3 +1,45 @@
-#!/bin/sh
+#!/usr/bin/python
+# vi: ts=4 expandtab
+
+import os
+import subprocess
+import sys
+import tempfile
+import re
+
+import tempita
+
+# This is more just for running from the bin folder so that
+# cloud-init binary can find the cloudinit module
+possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
+        sys.argv[0]), os.pardir, os.pardir))
+if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
+    sys.path.insert(0, possible_topdir)
+
+PWD = os.getcwd()
+
+def info(msg):
+    sys.stderr.write("INFO: %s\n" % (msg))
 
 
+def warn(msg):
+    sys.stderr.write("WARNING: %s\n" % (msg))
+
+
+def main():
+    if not os.path.isfile(os.path.join(PWD, 'brpm.tmpl')):
+        warn("Can not find required template file 'brpm.tmpl'")
+        return 1
+    if not os.path.isfile(os.path.join(os.pardir, 'setup.py')):
+        warn("Can not find required root 'setup.py' file")
+        return 1
+
+    cmd = [os.path.join(os.pardir, 'tools', 'read-version')]
+    version = subprocess.check_Call(cmd)
+    
+    
+    return 0
+
+
+if __name__ == '__main__':
+    sys.exit(main())

From ca9c402c25580418ddcb8c05e1d3216a1154052b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 13:08:20 -0700
Subject: [PATCH 342/434] Use the new tool created to get the version.

---
 setup.py | 23 +++++++----------------
 1 file changed, 7 insertions(+), 16 deletions(-)

diff --git a/setup.py b/setup.py
index 81468943..59548a41 100755
--- a/setup.py
+++ b/setup.py
@@ -27,26 +27,17 @@ import re
 
 import setuptools
 
+import subprocess
+
 
 def is_f(p):
     return os.path.isfile(p)
 
 
-def versions(fn="ChangeLog"):
-    with open(fn, 'r') as fh:
-        lines = fh.read().splitlines()
-    versions = []
-    for line in lines:
-        line = line.strip()
-        if line.startswith("-") or not line:
-            continue
-        if not re.match(r"[\d]", line):
-            continue
-        line = line.strip(":")
-        if (re.match(r"^[\d+]\.[\d+]\.[\d+]$", line) or
-            re.match(r"^[\d+]\.[\d+]$", line)):
-            versions.append(line)
-    return versions
+def get_version():
+    cmd = ['tools/read-version']
+    ver = subprocess.check_output(cmd)
+    return ver.strip()
 
 
 def requires(fn='Requires'):
@@ -63,7 +54,7 @@ def requires(fn='Requires'):
 
 
 setuptools.setup(name='cloud-init',
-      version=versions()[0],
+      version=get_version(),
       description='EC2 initialisation magic',
       author='Scott Moser',
       author_email='scott.moser@canonical.com',

From 80eb005650346c48ef0d91ec20dc2d279853de1d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 16:59:15 -0700
Subject: [PATCH 343/434] Add a simple tool that will parse the requires file

---
 tools/read-dependencies | 45 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 45 insertions(+)
 create mode 100755 tools/read-dependencies

diff --git a/tools/read-dependencies b/tools/read-dependencies
new file mode 100755
index 00000000..72e1e095
--- /dev/null
+++ b/tools/read-dependencies
@@ -0,0 +1,45 @@
+#!/usr/bin/python
+# vi: ts=4 expandtab
+
+import os
+import sys
+import re
+
+
+def parse_requires(fn):
+    requires = []
+    with open(fn, 'r') as fh:
+        lines = fh.read().splitlines()
+    for line in lines:
+        line = line.strip()
+        if not line or line[0] == '#':
+            continue
+        else:
+            requires.append(line)
+    return requires
+
+
+def find_requires(args):
+    p_files = []
+    if args:
+        p_files.append(args[0])
+    p_files.append(os.path.join(os.pardir, "Requires"))
+    p_files.append(os.path.join(os.getcwd(), 'Requires'))
+    found = None
+    for fn in p_files:
+        if os.path.isfile(fn):
+            found = fn
+            break
+    return found
+
+
+if __name__ == '__main__':
+    run_args = sys.argv[1:]
+    fn = find_requires(run_args)
+    if not fn:
+        sys.stderr.write("'Requires' file not found!\n")
+        sys.exit(1)
+    else:
+        deps = parse_requires(fn)
+        for entry in deps:
+            print entry

From 6a2ffea82bd337dc727d6b1178c21d6b42d54f4f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 16:59:39 -0700
Subject: [PATCH 344/434] Get rpm building working with a template.

---
 packages/brpm      | 276 ++++++++++++++++++++++++++++++++++++++++++---
 packages/brpm.tmpl | 165 +++++----------------------
 2 files changed, 294 insertions(+), 147 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index f2c3dac4..5feade24 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -6,9 +6,19 @@ import subprocess
 import sys
 import tempfile
 import re
+import textwrap
+import shutil
+import zipfile
+
+import glob
 
 import tempita
 
+from datetime import datetime
+from datetime import date
+
+from distutils import version as ver
+
 # This is more just for running from the bin folder so that
 # cloud-init binary can find the cloudinit module
 possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
@@ -16,28 +26,268 @@ possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
 if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
     sys.path.insert(0, possible_topdir)
 
+from cloudinit import util
+from cloudinit import version
+
+import contextlib
+
+# Mapping of expected packages to there full name...
+PKG_MP = {
+    'boto': 'python-boto',
+    'tempita': 'python-tempita',
+    'prettytable': 'python-prettytable',
+    'oauth': 'python-oauth',
+    'configobj': 'python-configobj',
+    'yaml': 'PyYAML',
+    'argparse': 'python-argparse'
+}
+
+
+@contextlib.contextmanager
+def chdir(where_to):
+    cur_cwd = os.path.abspath(os.getcwd())
+    where_to = os.path.abspath(where_to)
+    os.chdir(where_to)
+    yield where_to
+    os.chdir(cur_cwd)
+
+
 PWD = os.getcwd()
 
 def info(msg):
-    sys.stderr.write("INFO: %s\n" % (msg))
+    print("INFO: %s" % (msg))
 
 
 def warn(msg):
-    sys.stderr.write("WARNING: %s\n" % (msg))
+    print("WARNING: %s" % (msg))
+
+
+def cut_up(entry, maxline=80):
+    if len(entry) < maxline:
+        return entry
+    else:
+        c = entry[0:maxline]
+        return "%s..." % (c)
+
+
+def extract_entry(collecting):
+    a_entry = {}
+    for t in ['tags', 'revno', 'author', 'timestamp', 'committer']:
+        look_for = "%s:" % (t)
+        for v in collecting:
+            if v.startswith(look_for):
+                a_entry[t] = v[len(look_for):].strip()
+                break
+    i = -1
+    for a, v in enumerate(collecting):
+        if v.startswith("message:"):
+            i = a
+            break
+    if i != -1:
+        msg_lines = collecting[i + 1:]
+        n_lines = []
+        for m in msg_lines:
+            m = m.strip()
+            if not m:
+                continue
+            m = m.replace("\n", " ")
+            n_lines.append("" + m.lstrip())
+        message = " ".join(n_lines).lstrip()
+        a_entry['message'] = message
+    return a_entry
+
+
+def build_changelog(history=-1):
+    cmd = ['bzr', 'log', '--timezone=utc']
+    (stdout, _stderr) = util.subp(cmd)
+    # Clean the format up
+    entries = stdout.splitlines()
+    all_entries = []
+    collecting = []
+    for e in entries:
+        if e.startswith("---"):
+            if collecting:
+                a_entry = extract_entry(collecting)
+                if a_entry:
+                    all_entries.append(a_entry)
+                collecting = []
+        else:
+            collecting.append(e)
+
+    a_entry = extract_entry(collecting)
+    if a_entry:
+        all_entries.append(a_entry)
+
+    if history > 0:
+        take_entries = list(all_entries[0:history])
+    else:
+        take_entries = list(all_entries)
+
+    # Merge those with same date
+    date_entries = {}
+    for e in take_entries:
+        author = e.get('author')
+        if not author:
+            author = e.get('committer')
+        if not author:
+            continue
+        timestamp = e.get('timestamp')
+        if not timestamp:
+            continue
+        msg = e.get('message')
+        if not msg:
+            continue
+        revno = e.get('revno')
+        if not revno:
+            continue
+        # http://bugs.python.org/issue6641
+        timestamp = timestamp.replace("+0000", '').strip()
+        ds = datetime.strptime(timestamp, '%a %Y-%m-%d %H:%M:%S')
+        c_ds = ds.date()
+        if c_ds not in date_entries:
+            ap_entry = {}
+            ap_entry['messages'] = []
+            ap_entry['authors'] = []
+            ap_entry['revnos'] = []
+            date_entries[c_ds] = ap_entry
+        ap_entry = date_entries[c_ds]
+        ap_entry['messages'].append(msg)
+        ap_entry['authors'].append(author)
+        ap_entry['revnos'].append(revno)
+
+    dates = sorted(date_entries.keys())
+    chglog = []
+    for ds in reversed(dates):
+        e = date_entries[ds]
+        authors = ", ".join(set(e['authors']))
+        revnos = ", ".join(list(sorted(e['revnos'])))
+        top_line = "%s %s - %s" % (ds.strftime("%a %b %d %Y"),
+                                   authors, revnos)
+        chglog.append("* %s" % (top_line))
+        for msg in e['messages']:
+            chglog.append("- %s" % (cut_up(msg)))
+    return "\n".join(chglog)
+
+
+def generate_spec_contents(tmpl_fn):
+    # Version junk
+    cmd = [os.path.join(os.pardir, 'tools', 'read-version')]
+    (stdout, _stderr) = util.subp(cmd)
+    i_version = stdout.strip()
+
+    # Ensure ok match!
+    if ver.StrictVersion(i_version) != version.version():
+        raise RuntimeError("Version found does not match the code version")
+
+    # Tmpl params
+    subs = {}
+    subs['version'] = i_version
+    (stdout, _stderr) = util.subp(['bzr', 'revno'])
+    subs['revno'] = "%s" % (stdout.strip())
+    subs['release'] = "%s" % (subs['revno'])
+    subs['archive_name'] = '%{name}-%{version}-' + subs['revno'] + '.tar.gz'
+    subs['bd_requires'] = ['python-devel', 'python-setuptools']
+
+    requires = []
+    cmd = [os.path.join(os.pardir, 'tools', 'read-dependencies')]
+    (stdout, _stderr) = util.subp(cmd)
+    pkgs = stdout.splitlines()
+    
+    # Map to known packages
+    for e in pkgs:
+        e = e.lower().strip()
+        tgt_pkg = None
+        for n in PKG_MP.keys():
+            if e.find(n) != -1:
+                tgt_pkg = PKG_MP.get(n)
+        if not tgt_pkg:
+            raise RuntimeError(("Do not know how to translate %s to "
+                                " a known package") % (e))
+        else:
+            requires.append(tgt_pkg)
+
+    base_name = 'cloud-init-%s-%s' % (i_version, subs['revno'])
+    subs['requires'] = requires
+    subs['changelog'] = build_changelog()
+
+    # See: http://www.zarb.org/~jasonc/macros.php
+    
+    # Pickup any special files
+    docs = [
+        'TODO',
+        'LICENSE',
+        'ChangeLog',
+        'Requires',
+        '%{_defaultdocdir}/cloud-init/*',
+    ]
+    subs['docs'] = docs
+    configs = [
+        'cloud/cloud.cfg',
+        'cloud/cloud.cfg.d/*.cfg',
+        'cloud/cloud.cfg.d/README',
+        'cloud/templates/*',
+    ]
+    subs['configs'] = configs
+    other_files = [
+        '%{_bindir}/*',
+        '/usr/lib/cloud-init/*',
+    ]
+    subs['files'] = other_files
+    
+    with open(tmpl_fn, 'r') as fh:
+        tmpl = tempita.Template(fh.read())
+        contents = tmpl.substitute(**subs)
+        return (base_name, '%s.tar.gz' % (base_name), contents)
 
 
 def main():
-    if not os.path.isfile(os.path.join(PWD, 'brpm.tmpl')):
-        warn("Can not find required template file 'brpm.tmpl'")
-        return 1
-    if not os.path.isfile(os.path.join(os.pardir, 'setup.py')):
-        warn("Can not find required root 'setup.py' file")
-        return 1
-
-    cmd = [os.path.join(os.pardir, 'tools', 'read-version')]
-    version = subprocess.check_Call(cmd)
-    
-    
+    root_dir = os.path.expanduser("~/rpmbuild")
+    info("Cleaning %s" % (root_dir))
+    util.delete_dir_contents(root_dir)
+    arc_dir = os.path.join(root_dir, 'SOURCES')
+    util.ensure_dirs([root_dir, arc_dir])
+    tmpl_fn = os.path.join(os.getcwd(), 'brpm.tmpl')
+    info("Generated spec file from template %s" % (tmpl_fn))
+    (base_name, arc_name, contents) = generate_spec_contents(tmpl_fn)
+    spec_fn = os.path.join(root_dir, 'cloud-init.spec')
+    util.write_file(spec_fn, contents)
+    info("Wrote spec file to %s" % (spec_fn))
+    with util.tempdir() as td:
+        src_dir = os.path.join(td, base_name)
+        os.makedirs(src_dir)
+        for fn in os.listdir(os.pardir):
+            if fn.startswith("."):
+                continue
+            full_fn = os.path.abspath(os.path.join(os.pardir, fn))
+            if os.path.isfile(full_fn):
+                shutil.copy(full_fn, os.path.join(src_dir, fn))
+            else:
+                shutil.copytree(full_fn, os.path.join(src_dir, fn),
+                                ignore=shutil.ignore_patterns('*.pyc',
+                                                              '.bzr',
+                                                              'tmp*',
+                                                              '*bzr*'))
+            arc_fn = os.path.join(arc_dir, arc_name)
+        cmd = ['tar', '-zcvf', arc_fn, '-C', td]
+        cmd.extend(os.listdir(td))
+        util.subp(cmd)
+        info("Archived code at %s" % (arc_fn))
+    cmd = ['rpmbuild', '-ba', spec_fn]
+    info("Running rpmbuild %s" % (cmd))
+    util.subp(cmd)
+    info("Rpmbuild completed!")
+    globs = [] 
+    globs.extend(glob.glob("%s/*.rpm" %
+                           (os.path.join(root_dir, 'RPMS', 'noarch'))))
+    globs.extend(glob.glob("%s/*.rpm" %
+                           (os.path.join(root_dir, 'RPMS'))))
+    globs.extend(glob.glob("%s/*.rpm" %
+                           (os.path.join(root_dir, 'SRPMS'))))
+    for fn in globs:
+        n = os.path.basename(fn)
+        tgt_fn = os.path.join(os.getcwd(), n)
+        util.copy(fn, tgt_fn)
+        info("Copied %s to %s" % (n, tgt_fn))
     return 0
 
 
diff --git a/packages/brpm.tmpl b/packages/brpm.tmpl
index 141578a5..f0c874ee 100644
--- a/packages/brpm.tmpl
+++ b/packages/brpm.tmpl
@@ -9,28 +9,21 @@ Group:          System Environment/Base
 License:        GPLv3
 URL:            http://launchpad.net/cloud-init
 
-Source0:        %{name}-%{version}-bzr532.tar.gz
+Source0:        {{archive_name}}
 
 BuildArch:      noarch
-BuildRoot:      %{_tmppath}/%{name}-%{version}-%{release}-root-%(%{__id_u} -n)
 
-BuildRequires:  python-devel
-BuildRequires:  python-setuptools-devel
-Requires:       e2fsprogs
-Requires:       iproute
-Requires:       libselinux-python
-Requires:       net-tools
-Requires:       procps
-Requires:       python-boto
-Requires:       python-cheetah
-Requires:       python-configobj
-Requires:       PyYAML
-Requires:       rsyslog
-Requires:       shadow-utils
-Requires:       /usr/bin/run-parts
-Requires(post):   chkconfig
-Requires(preun):  chkconfig
-Requires(postun): initscripts
+BuildRoot:      %{_tmppath}
+
+
+{{for r in bd_requires}}
+BuildRequires: {{r}}
+{{endfor}}
+
+# Install requirements
+{{for r in requires}}
+Requires: {{r}}
+{{endfor}}
 
 %description
 Cloud-init is a set of init scripts for cloud instances.  Cloud instances
@@ -39,14 +32,7 @@ ssh keys and to let the user run various scripts.
 
 
 %prep
-%setup -q -n %{name}-%{version}-bzr532
-%patch0 -p0
-%patch1 -p0
-%patch2 -p1
-%patch3 -p1
-
-cp -p %{SOURCE2} README.fedora
-
+%setup -q -n %{name}-%{version}-{{revno}}
 
 %build
 %{__python} setup.py build
@@ -56,118 +42,29 @@ cp -p %{SOURCE2} README.fedora
 rm -rf $RPM_BUILD_ROOT
 %{__python} setup.py install -O1 --skip-build --root $RPM_BUILD_ROOT
 
-for x in $RPM_BUILD_ROOT/%{_bindir}/*.py; do mv "$x" "${x%.py}"; done
-chmod +x $RPM_BUILD_ROOT/%{python_sitelib}/cloudinit/SshUtil.py
-mkdir -p $RPM_BUILD_ROOT/%{_sharedstatedir}/cloud
-
-# We supply our own config file since our software differs from Ubuntu's.
-cp -p %{SOURCE1} $RPM_BUILD_ROOT/%{_sysconfdir}/cloud/cloud.cfg
-
-# Note that /etc/rsyslog.d didn't exist by default until F15.
-# el6 request: https://bugzilla.redhat.com/show_bug.cgi?id=740420
-mkdir -p $RPM_BUILD_ROOT/%{_sysconfdir}/rsyslog.d
-cp -p tools/21-cloudinit.conf $RPM_BUILD_ROOT/%{_sysconfdir}/rsyslog.d/21-cloudinit.conf
-
-# Install the init scripts
-install -p -D -m 755 %{SOURCE3} %{buildroot}%{_initrddir}/cloud-config
-install -p -D -m 755 %{SOURCE4} %{buildroot}%{_initrddir}/cloud-final
-install -p -D -m 755 %{SOURCE5} %{buildroot}%{_initrddir}/cloud-init
-install -p -D -m 755 %{SOURCE6} %{buildroot}%{_initrddir}/cloud-init-local
-
-
 %clean
 rm -rf $RPM_BUILD_ROOT
 
-
-%post
-if [ $1 -eq 1 ] ; then
-    # Initial installation
-    # Enabled by default per "runs once then goes away" exception
-    for svc in config final init init-local; do
-        chkconfig --add cloud-$svc
-        chkconfig cloud-$svc on
-    done
-fi
-
-%preun
-if [ $1 -eq 0 ] ; then
-    # Package removal, not upgrade
-    for svc in config final init init-local; do
-        chkconfig --del cloud-$svc
-        chkconfig cloud-$svc on
-    done
-    # One-shot services -> no need to stop
-fi
-
-%postun
-# One-shot services -> no need to restart
-
-
 %files
-%doc ChangeLog LICENSE TODO README.fedora
-%config(noreplace) %{_sysconfdir}/cloud/cloud.cfg
-%dir               %{_sysconfdir}/cloud/cloud.cfg.d
-%config(noreplace) %{_sysconfdir}/cloud/cloud.cfg.d/*.cfg
-%doc               %{_sysconfdir}/cloud/cloud.cfg.d/README
-%dir               %{_sysconfdir}/cloud/templates
-%config(noreplace) %{_sysconfdir}/cloud/templates/*
-%{_initrddir}/cloud-*
+
+# Docs
+{{for r in docs}}
+%doc {{r}}
+{{endfor}}
+
+# Configs
+{{for r in configs}}
+%config(noreplace) %{_sysconfdir}/{{r}}
+{{endfor}}
+
+# Other files
+{{for r in files}}
+{{r}}
+{{endfor}}
+
+# Python sitelib
 %{python_sitelib}/*
-%{_libexecdir}/%{name}
-%{_bindir}/cloud-init*
-%doc %{_datadir}/doc/%{name}
-%dir %{_sharedstatedir}/cloud
-
-%config(noreplace) %{_sysconfdir}/rsyslog.d/21-cloudinit.conf
-
 
 %changelog
-* Mon Jun 18 2012 Pádraig Brady <P@draigBrady.com> - 0.6.3-0.6.bzr532
-- Further adjustments to support EPEL 6
 
-* Fri Jun 15 2012 Tomas Karasek <tomas.karasek@cern.ch> - 0.6.3-0.5.bzr532
-- Fix cloud-init-cfg invocation in init script
-
-* Tue May 22 2012 Pádraig Brady <P@draigBrady.com> - 0.6.3-0.4.bzr532
-- Support EPEL 6
-
-* Sat Mar 31 2012 Andy Grimm <agrimm@gmail.com> - 0.6.3-0.2.bzr532
-- Fixed incorrect interpretation of relative path for
-  AuthorizedKeysFile (BZ #735521)
-
-* Mon Mar  5 2012 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.3-0.1.bzr532
-- Rebased against upstream rev 532
-- Fixed runparts() incompatibility with Fedora
-
-* Thu Jan 12 2012 Fedora Release Engineering <rel-eng@lists.fedoraproject.org> - 0.6.2-0.8.bzr457
-- Rebuilt for https://fedoraproject.org/wiki/Fedora_17_Mass_Rebuild
-
-* Wed Oct  5 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.7.bzr457
-- Disabled SSH key-deleting on startup
-
-* Wed Sep 28 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.6.bzr457
-- Consolidated selinux file context patches
-- Fixed cloud-init.service dependencies
-- Updated sshkeytypes patch
-- Dealt with differences from Ubuntu's sshd
-
-* Sat Sep 24 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.5.bzr457
-- Rebased against upstream rev 457
-- Added missing dependencies
-
-* Fri Sep 23 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.4.bzr450
-- Added more macros to the spec file
-
-* Fri Sep 23 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.3.bzr450
-- Fixed logfile permission checking
-- Fixed SSH key generation
-- Fixed a bad method call in FQDN-guessing [LP:857891]
-- Updated localefile patch
-- Disabled the grub_dpkg module
-- Fixed failures due to empty script dirs [LP:857926]
-
-* Fri Sep 23 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.2.bzr450
-- Updated tzsysconfig patch
-
-* Wed Sep 21 2011 Garrett Holmstrom <gholms@fedoraproject.org> - 0.6.2-0.1.bzr450
-- Initial packaging
+{{changelog}}

From c829485aeb1bd6f4639d78145ed537a0fb420385 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 16:59:54 -0700
Subject: [PATCH 345/434] Use the standard utils now in tools for reading
 requires/dependencies/versions.

---
 setup.py | 30 +++++++++++++++---------------
 1 file changed, 15 insertions(+), 15 deletions(-)

diff --git a/setup.py b/setup.py
index 59548a41..fd67da46 100755
--- a/setup.py
+++ b/setup.py
@@ -29,6 +29,12 @@ import setuptools
 
 import subprocess
 
+def tiny_p(cmd):
+    sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
+                    stderr=subprocess.PIPE, stdin=None)
+    (out, err) = sp.communicate()
+    return (out, err)
+
 
 def is_f(p):
     return os.path.isfile(p)
@@ -36,21 +42,14 @@ def is_f(p):
 
 def get_version():
     cmd = ['tools/read-version']
-    ver = subprocess.check_output(cmd)
+    (ver, _e) = tiny_p(cmd)
     return ver.strip()
 
 
-def requires(fn='Requires'):
-    requires = []
-    with open(fn, 'r') as fh:
-        lines = fh.read().splitlines()
-    for line in lines:
-        line = line.strip()
-        if not line or line[0] == '#':
-            continue
-        else:
-            requires.append(line)
-    return requires
+def read_requires():
+    cmd = ['tools/read-dependencies']
+    (deps, _e) = tiny_p(cmd)
+    return deps.splitlines()
 
 
 setuptools.setup(name='cloud-init',
@@ -68,14 +67,15 @@ setuptools.setup(name='cloud-init',
                   ('/etc/cloud/cloud.cfg.d', glob('config/cloud.cfg.d/*')),
                   ('/etc/cloud/templates', glob('templates/*')),
                   # Only really need for upstart based systems
-                  ('/etc/init', glob('upstart/*.conf')),
+                  #('/etc/init', glob('upstart/*.conf')),
                   ('/usr/share/cloud-init', []),
                   ('/usr/lib/cloud-init',
                     ['tools/uncloud-init', 'tools/write-ssh-key-fingerprints']),
                   ('/usr/share/doc/cloud-init', filter(is_f, glob('doc/*'))),
                   ('/usr/share/doc/cloud-init/examples', filter(is_f, glob('doc/examples/*'))),
                   ('/usr/share/doc/cloud-init/examples/seed', filter(is_f, glob('doc/examples/seed/*'))),
-                  ('/etc/profile.d', ['tools/Z99-cloud-locale-test.sh']),
+                  # ??
+                  # ('/etc/profile.d', ['tools/Z99-cloud-locale-test.sh']),
                   ],
-      install_requires=requires(),
+      install_requires=read_requires(),
       )

From d73dd489fe620396e723ba5702e6db3405d315da Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 17:01:41 -0700
Subject: [PATCH 346/434] Ensure rpmbuild is actually a directory before
 cleaning

---
 packages/brpm | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/packages/brpm b/packages/brpm
index 5feade24..c11b86ff 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -243,7 +243,8 @@ def generate_spec_contents(tmpl_fn):
 def main():
     root_dir = os.path.expanduser("~/rpmbuild")
     info("Cleaning %s" % (root_dir))
-    util.delete_dir_contents(root_dir)
+    if os.path.isdir(root_dir):
+        util.delete_dir_contents(root_dir)
     arc_dir = os.path.join(root_dir, 'SOURCES')
     util.ensure_dirs([root_dir, arc_dir])
     tmpl_fn = os.path.join(os.getcwd(), 'brpm.tmpl')

From 944073a638daa18b4d5ebebe56f86f96fec308a1 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 18:50:29 -0700
Subject: [PATCH 347/434] Add a nicer helper util for the rpm changelog

---
 packages/brpm          | 145 +++------------------------
 packages/rpm-changelog | 220 +++++++++++++++++++++++++++++++++++++++++
 2 files changed, 235 insertions(+), 130 deletions(-)
 create mode 100755 packages/rpm-changelog

diff --git a/packages/brpm b/packages/brpm
index c11b86ff..cc9325cb 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -2,21 +2,13 @@
 # vi: ts=4 expandtab
 
 import os
-import subprocess
 import sys
-import tempfile
-import re
-import textwrap
 import shutil
-import zipfile
 
 import glob
 
 import tempita
 
-from datetime import datetime
-from datetime import date
-
 from distutils import version as ver
 
 # This is more just for running from the bin folder so that
@@ -29,8 +21,6 @@ if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
 from cloudinit import util
 from cloudinit import version
 
-import contextlib
-
 # Mapping of expected packages to there full name...
 PKG_MP = {
     'boto': 'python-boto',
@@ -43,17 +33,6 @@ PKG_MP = {
 }
 
 
-@contextlib.contextmanager
-def chdir(where_to):
-    cur_cwd = os.path.abspath(os.getcwd())
-    where_to = os.path.abspath(where_to)
-    os.chdir(where_to)
-    yield where_to
-    os.chdir(cur_cwd)
-
-
-PWD = os.getcwd()
-
 def info(msg):
     print("INFO: %s" % (msg))
 
@@ -62,114 +41,8 @@ def warn(msg):
     print("WARNING: %s" % (msg))
 
 
-def cut_up(entry, maxline=80):
-    if len(entry) < maxline:
-        return entry
-    else:
-        c = entry[0:maxline]
-        return "%s..." % (c)
-
-
-def extract_entry(collecting):
-    a_entry = {}
-    for t in ['tags', 'revno', 'author', 'timestamp', 'committer']:
-        look_for = "%s:" % (t)
-        for v in collecting:
-            if v.startswith(look_for):
-                a_entry[t] = v[len(look_for):].strip()
-                break
-    i = -1
-    for a, v in enumerate(collecting):
-        if v.startswith("message:"):
-            i = a
-            break
-    if i != -1:
-        msg_lines = collecting[i + 1:]
-        n_lines = []
-        for m in msg_lines:
-            m = m.strip()
-            if not m:
-                continue
-            m = m.replace("\n", " ")
-            n_lines.append("" + m.lstrip())
-        message = " ".join(n_lines).lstrip()
-        a_entry['message'] = message
-    return a_entry
-
-
-def build_changelog(history=-1):
-    cmd = ['bzr', 'log', '--timezone=utc']
-    (stdout, _stderr) = util.subp(cmd)
-    # Clean the format up
-    entries = stdout.splitlines()
-    all_entries = []
-    collecting = []
-    for e in entries:
-        if e.startswith("---"):
-            if collecting:
-                a_entry = extract_entry(collecting)
-                if a_entry:
-                    all_entries.append(a_entry)
-                collecting = []
-        else:
-            collecting.append(e)
-
-    a_entry = extract_entry(collecting)
-    if a_entry:
-        all_entries.append(a_entry)
-
-    if history > 0:
-        take_entries = list(all_entries[0:history])
-    else:
-        take_entries = list(all_entries)
-
-    # Merge those with same date
-    date_entries = {}
-    for e in take_entries:
-        author = e.get('author')
-        if not author:
-            author = e.get('committer')
-        if not author:
-            continue
-        timestamp = e.get('timestamp')
-        if not timestamp:
-            continue
-        msg = e.get('message')
-        if not msg:
-            continue
-        revno = e.get('revno')
-        if not revno:
-            continue
-        # http://bugs.python.org/issue6641
-        timestamp = timestamp.replace("+0000", '').strip()
-        ds = datetime.strptime(timestamp, '%a %Y-%m-%d %H:%M:%S')
-        c_ds = ds.date()
-        if c_ds not in date_entries:
-            ap_entry = {}
-            ap_entry['messages'] = []
-            ap_entry['authors'] = []
-            ap_entry['revnos'] = []
-            date_entries[c_ds] = ap_entry
-        ap_entry = date_entries[c_ds]
-        ap_entry['messages'].append(msg)
-        ap_entry['authors'].append(author)
-        ap_entry['revnos'].append(revno)
-
-    dates = sorted(date_entries.keys())
-    chglog = []
-    for ds in reversed(dates):
-        e = date_entries[ds]
-        authors = ", ".join(set(e['authors']))
-        revnos = ", ".join(list(sorted(e['revnos'])))
-        top_line = "%s %s - %s" % (ds.strftime("%a %b %d %Y"),
-                                   authors, revnos)
-        chglog.append("* %s" % (top_line))
-        for msg in e['messages']:
-            chglog.append("- %s" % (cut_up(msg)))
-    return "\n".join(chglog)
-
-
 def generate_spec_contents(tmpl_fn):
+
     # Version junk
     cmd = [os.path.join(os.pardir, 'tools', 'read-version')]
     (stdout, _stderr) = util.subp(cmd)
@@ -208,10 +81,11 @@ def generate_spec_contents(tmpl_fn):
 
     base_name = 'cloud-init-%s-%s' % (i_version, subs['revno'])
     subs['requires'] = requires
-    subs['changelog'] = build_changelog()
+
+    (stdout, _stderr) = util.subp(['rpm-changelog'])
+    subs['changelog'] = stdout
 
     # See: http://www.zarb.org/~jasonc/macros.php
-    
     # Pickup any special files
     docs = [
         'TODO',
@@ -241,18 +115,24 @@ def generate_spec_contents(tmpl_fn):
 
 
 def main():
+
+    # Clean out the root dir and make sure the dirs we want are in place
     root_dir = os.path.expanduser("~/rpmbuild")
     info("Cleaning %s" % (root_dir))
     if os.path.isdir(root_dir):
         util.delete_dir_contents(root_dir)
     arc_dir = os.path.join(root_dir, 'SOURCES')
     util.ensure_dirs([root_dir, arc_dir])
+
+    # Form the spec file to be used
     tmpl_fn = os.path.join(os.getcwd(), 'brpm.tmpl')
     info("Generated spec file from template %s" % (tmpl_fn))
     (base_name, arc_name, contents) = generate_spec_contents(tmpl_fn)
     spec_fn = os.path.join(root_dir, 'cloud-init.spec')
     util.write_file(spec_fn, contents)
     info("Wrote spec file to %s" % (spec_fn))
+
+    # Archive the code and files that we want to
     with util.tempdir() as td:
         src_dir = os.path.join(td, base_name)
         os.makedirs(src_dir)
@@ -273,10 +153,14 @@ def main():
         cmd.extend(os.listdir(td))
         util.subp(cmd)
         info("Archived code at %s" % (arc_fn))
+
+    # Now build it!
     cmd = ['rpmbuild', '-ba', spec_fn]
     info("Running rpmbuild %s" % (cmd))
     util.subp(cmd)
     info("Rpmbuild completed!")
+
+    # Copy the items built to our local dir
     globs = [] 
     globs.extend(glob.glob("%s/*.rpm" %
                            (os.path.join(root_dir, 'RPMS', 'noarch'))))
@@ -289,6 +173,7 @@ def main():
         tgt_fn = os.path.join(os.getcwd(), n)
         util.copy(fn, tgt_fn)
         info("Copied %s to %s" % (n, tgt_fn))
+
     return 0
 
 
diff --git a/packages/rpm-changelog b/packages/rpm-changelog
new file mode 100755
index 00000000..80db94c5
--- /dev/null
+++ b/packages/rpm-changelog
@@ -0,0 +1,220 @@
+#!/usr/bin/python
+# vi: ts=4 expandtab
+
+import sys
+import os
+import re
+
+import textwrap
+
+from datetime import datetime
+from datetime import date
+
+import subprocess
+
+def tiny_p(cmd):
+    sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
+                    stderr=subprocess.PIPE, stdin=None)
+    (out, err) = sp.communicate()
+    return (out, err)
+
+# This util converts a bzr log into a useful rpm changelog
+
+def cut_up(entry, maxline=80):
+    if len(entry) < maxline:
+        return entry
+    else:
+        c = entry[0:maxline]
+        return "%s..." % (c)
+
+
+def adj_iter(elems):
+    if not elems:
+        raise StopIteration()
+    curr = elems[0]
+    yield curr
+    for i in range(1, len(elems)):
+        e = elems[i]
+        if e != curr:
+            yield e
+            curr = e
+
+def extract_entry(collecting):
+    a_entry = {}
+    for t in ['tags', 'revno', 'author', 'timestamp', 'committer']:
+        look_for = "%s:" % (t)
+        for v in collecting:
+            if v.startswith(look_for):
+                a_entry[t] = v[len(look_for):].strip()
+                break
+    i = -1
+    for a, v in enumerate(collecting):
+        if v.startswith("message:"):
+            i = a
+            break
+    if i != -1:
+        msg_lines = collecting[i + 1:]
+        a_entry['message'] = "\n".join(msg_lines)
+    return a_entry
+
+
+def clean_authors(authors):
+    if not authors:
+        return ''
+    auth_cleaned = set()
+    for a in authors:
+        a = a.strip()
+        if a:
+            auth_cleaned.add(a)
+    if not auth_cleaned:
+        return ''
+    uniq_authors = list(auth_cleaned)
+    if len(uniq_authors) == 1:
+        return authors[0]
+    auths = "(%s)" % ", ".join(uniq_authors)
+    return auths
+
+
+def clean_revnos(revnos):
+    novs = list()
+    for r in revnos:
+        r = r.strip()
+        r = r.replace("[merge]", "")
+        if r:
+            novs.append(int(r))
+    entries = list(novs)
+    if not entries:
+        return ''
+    entries.sort()
+    if len(entries) == 1:
+        return "%s" % (entries[0])
+
+    # Check if consecutive
+    start = entries[0]
+    consec = True
+    for (i, v) in enumerate(entries):
+        if v != start + i:
+            consec = False
+            break
+    if consec:
+        end = entries[-1]
+        return "%s => %s" % (start, end)
+    v = [str(b) for b in entries]
+    return ", ".join(v)
+
+
+def spacey(am):
+    return " " * am
+
+
+def justify(text, space_wanted):
+    c_bef = len(text)
+    t_c = len(text.lstrip())
+    space_am = (c_bef - t_c)
+    needed = (space_wanted - space_am)
+    if needed < 0:
+        return text
+    return (" " * (needed) + text)
+
+
+def clean_messages(messages):
+    contents = []
+    for msg in messages:
+        # Split into sub-messages...
+        # if we can
+        lines = []
+        pieces = msg.splitlines()
+        if len(pieces) == 1:
+            lines.append("%s- %s " %
+                         (spacey(4), msg.strip()))
+        else:
+            n_lines = []
+            n_lines.append(pieces[0].strip())
+            for line in pieces[1:]:
+                line = line.lstrip()
+                if not line:
+                    continue
+                n_lines.append(justify(line, 6))
+            lines.append("%s- %s" % (spacey(4), "\n".join(n_lines)))
+        contents.extend(lines)
+    return "\n".join(contents)
+
+
+def build_changelog(history=-1):
+    cmd = ['bzr', 'log', '--timezone=utc']
+    (stdout, _stderr) = tiny_p(cmd)
+    # Clean the format up
+    entries = stdout.splitlines()
+    all_entries = []
+    collecting = []
+    for e in entries:
+        if e.startswith("---"):
+            if collecting:
+                a_entry = extract_entry(collecting)
+                if a_entry:
+                    all_entries.append(a_entry)
+                collecting = []
+        else:
+            collecting.append(e)
+
+    a_entry = extract_entry(collecting)
+    if a_entry:
+        all_entries.append(a_entry)
+
+    if history > 0:
+        take_entries = list(all_entries[0:history])
+    else:
+        take_entries = list(all_entries)
+
+    # Merge those with same date
+    date_entries = {}
+    for e in take_entries:
+        author = e.get('author')
+        if not author:
+            author = e.get('committer')
+        if not author:
+            continue
+        timestamp = e.get('timestamp')
+        if not timestamp:
+            continue
+        msg = e.get('message')
+        if not msg:
+            continue
+        revno = e.get('revno')
+        if not revno:
+            continue
+        # http://bugs.python.org/issue6641
+        timestamp = timestamp.replace("+0000", '').strip()
+        ds = datetime.strptime(timestamp, '%a %Y-%m-%d %H:%M:%S')
+        c_ds = ds.date()
+        if c_ds not in date_entries:
+            ap_entry = {}
+            ap_entry['messages'] = []
+            ap_entry['authors'] = []
+            ap_entry['revnos'] = []
+            date_entries[c_ds] = ap_entry
+        ap_entry = date_entries[c_ds]
+        ap_entry['messages'].append(msg)
+        ap_entry['authors'].append(author)
+        ap_entry['revnos'].append(revno)
+
+    dates = sorted(date_entries.keys())
+    chglog = []
+    for ds in reversed(dates):
+        e = date_entries[ds]
+        authors = clean_authors(e['authors'])
+        revnos = clean_revnos(e['revnos'])
+        top_line = "%s %s - %s" % (ds.strftime("%a %b %d %Y"),
+                                   authors, revnos)
+        chglog.append("* %s" % (top_line))
+        chglog.append(clean_messages(e['messages']))
+    return "\n".join(chglog)
+
+
+if __name__ == '__main__':
+    args = sys.argv[1:]
+    history_am = -1
+    if args:
+        history_am = int(args[0])
+    chglog = build_changelog(history_am)
+    print chglog

From dd747b010406dec05ad33ae9b98dc77776c3ce7b Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 18:53:51 -0700
Subject: [PATCH 348/434] Fix call to rpm-changelog

---
 packages/brpm | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/packages/brpm b/packages/brpm
index cc9325cb..50ac4467 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -82,7 +82,7 @@ def generate_spec_contents(tmpl_fn):
     base_name = 'cloud-init-%s-%s' % (i_version, subs['revno'])
     subs['requires'] = requires
 
-    (stdout, _stderr) = util.subp(['rpm-changelog'])
+    (stdout, _stderr) = util.subp([os.path.join(os.getcwd(), 'rpm-changelog')])
     subs['changelog'] = stdout
 
     # See: http://www.zarb.org/~jasonc/macros.php

From b646fa667c55301ebc65efec881f064c12095027 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 20:29:32 -0700
Subject: [PATCH 349/434] Remove need to depend on cloudinit for the util
 functions used

---
 packages/brpm | 80 ++++++++++++++++++++++++++++++---------------------
 1 file changed, 47 insertions(+), 33 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index 50ac4467..c989892e 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -1,25 +1,15 @@
 #!/usr/bin/python
-# vi: ts=4 expandtab
-
-import os
-import sys
-import shutil
 
+import contextlib
 import glob
+import os
+import shutil
+import subprocess
+import sys
+import tempfile
 
 import tempita
 
-from distutils import version as ver
-
-# This is more just for running from the bin folder so that
-# cloud-init binary can find the cloudinit module
-possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
-        sys.argv[0]), os.pardir, os.pardir))
-if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
-    sys.path.insert(0, possible_topdir)
-
-from cloudinit import util
-from cloudinit import version
 
 # Mapping of expected packages to there full name...
 PKG_MP = {
@@ -33,6 +23,31 @@ PKG_MP = {
 }
 
 
+@contextlib.contextmanager
+def tmpdir():
+    t = tempfile.mkdtemp()
+    try:
+        yield t
+    finally:
+        shutil.rmtree(t)
+
+
+def join(*paths):
+    p = os.path.join(*paths)
+    return os.path.abspath(p)
+
+
+def tiny_p(cmd):
+    # Darn python 2.6 doesn't have check_output (argggg)
+    info("Running %s" % (cmd))
+    sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
+                    stderr=subprocess.PIPE, stdin=None)
+    (out, err) = sp.communicate()
+    if sp.returncode not in [0]:
+        raise RuntimeError("Failed running %s [rc=%s]" % (cmd, sp.returncode))
+    return (out, err)
+
+
 def info(msg):
     print("INFO: %s" % (msg))
 
@@ -44,26 +59,22 @@ def warn(msg):
 def generate_spec_contents(tmpl_fn):
 
     # Version junk
-    cmd = [os.path.join(os.pardir, 'tools', 'read-version')]
-    (stdout, _stderr) = util.subp(cmd)
+    cmd = [sys.executable, join(os.pardir, 'tools', 'read-version')]
+    (stdout, _stderr) = tiny_p(cmd)
     i_version = stdout.strip()
 
-    # Ensure ok match!
-    if ver.StrictVersion(i_version) != version.version():
-        raise RuntimeError("Version found does not match the code version")
-
     # Tmpl params
     subs = {}
     subs['version'] = i_version
-    (stdout, _stderr) = util.subp(['bzr', 'revno'])
+    (stdout, _stderr) = tiny_p(['bzr', 'revno'])
     subs['revno'] = "%s" % (stdout.strip())
     subs['release'] = "%s" % (subs['revno'])
     subs['archive_name'] = '%{name}-%{version}-' + subs['revno'] + '.tar.gz'
     subs['bd_requires'] = ['python-devel', 'python-setuptools']
 
     requires = []
-    cmd = [os.path.join(os.pardir, 'tools', 'read-dependencies')]
-    (stdout, _stderr) = util.subp(cmd)
+    cmd = [sys.executable, join(os.pardir, 'tools', 'read-dependencies')]
+    (stdout, _stderr) = tiny_p(cmd)
     pkgs = stdout.splitlines()
     
     # Map to known packages
@@ -82,7 +93,8 @@ def generate_spec_contents(tmpl_fn):
     base_name = 'cloud-init-%s-%s' % (i_version, subs['revno'])
     subs['requires'] = requires
 
-    (stdout, _stderr) = util.subp([os.path.join(os.getcwd(), 'rpm-changelog')])
+    (stdout, _stderr) = tiny_p([sys.executable, 
+                               join(os.getcwd(), 'rpm-changelog')])
     subs['changelog'] = stdout
 
     # See: http://www.zarb.org/~jasonc/macros.php
@@ -120,20 +132,22 @@ def main():
     root_dir = os.path.expanduser("~/rpmbuild")
     info("Cleaning %s" % (root_dir))
     if os.path.isdir(root_dir):
-        util.delete_dir_contents(root_dir)
+        shutil.rmtree(root_dir)
     arc_dir = os.path.join(root_dir, 'SOURCES')
-    util.ensure_dirs([root_dir, arc_dir])
+    for d in [root_dir, arc_dir]:
+        os.makedirs(d)
 
     # Form the spec file to be used
     tmpl_fn = os.path.join(os.getcwd(), 'brpm.tmpl')
     info("Generated spec file from template %s" % (tmpl_fn))
     (base_name, arc_name, contents) = generate_spec_contents(tmpl_fn)
     spec_fn = os.path.join(root_dir, 'cloud-init.spec')
-    util.write_file(spec_fn, contents)
-    info("Wrote spec file to %s" % (spec_fn))
+    with open(spec_fn, 'w') as fh:
+        fh.write(contents)
+        info("Wrote spec file to %s" % (spec_fn))
 
     # Archive the code and files that we want to
-    with util.tempdir() as td:
+    with tmpdir() as td:
         src_dir = os.path.join(td, base_name)
         os.makedirs(src_dir)
         for fn in os.listdir(os.pardir):
@@ -151,13 +165,13 @@ def main():
             arc_fn = os.path.join(arc_dir, arc_name)
         cmd = ['tar', '-zcvf', arc_fn, '-C', td]
         cmd.extend(os.listdir(td))
-        util.subp(cmd)
+        tiny_p(cmd)
         info("Archived code at %s" % (arc_fn))
 
     # Now build it!
     cmd = ['rpmbuild', '-ba', spec_fn]
     info("Running rpmbuild %s" % (cmd))
-    util.subp(cmd)
+    tiny_p(cmd)
     info("Rpmbuild completed!")
 
     # Copy the items built to our local dir

From 575bb1c72de1209023444bd26b691faf13670b62 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 20:29:58 -0700
Subject: [PATCH 350/434] Some cleanups around util functions and formatting

---
 packages/rpm-changelog | 77 +++++++++++++++++++-----------------------
 1 file changed, 34 insertions(+), 43 deletions(-)

diff --git a/packages/rpm-changelog b/packages/rpm-changelog
index 80db94c5..8acaa5b9 100755
--- a/packages/rpm-changelog
+++ b/packages/rpm-changelog
@@ -1,61 +1,49 @@
 #!/usr/bin/python
 # vi: ts=4 expandtab
 
-import sys
+# A crappy little script
+# that changes bzr 'log' 
+# into someting that rpm spec files can use (best effort)
+
 import os
 import re
-
-import textwrap
+import sys
 
 from datetime import datetime
 from datetime import date
 
 import subprocess
 
+E_TYPES = ['tags', 'revno', 'author', 'timestamp', 'committer']
+
+
 def tiny_p(cmd):
+    # Darn python 2.6 doesn't have check_output (argggg)
     sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
                     stderr=subprocess.PIPE, stdin=None)
     (out, err) = sp.communicate()
     return (out, err)
 
-# This util converts a bzr log into a useful rpm changelog
-
-def cut_up(entry, maxline=80):
-    if len(entry) < maxline:
-        return entry
-    else:
-        c = entry[0:maxline]
-        return "%s..." % (c)
-
-
-def adj_iter(elems):
-    if not elems:
-        raise StopIteration()
-    curr = elems[0]
-    yield curr
-    for i in range(1, len(elems)):
-        e = elems[i]
-        if e != curr:
-            yield e
-            curr = e
 
 def extract_entry(collecting):
-    a_entry = {}
-    for t in ['tags', 'revno', 'author', 'timestamp', 'committer']:
+    entry = {}
+    for t in E_TYPES:
         look_for = "%s:" % (t)
         for v in collecting:
             if v.startswith(look_for):
-                a_entry[t] = v[len(look_for):].strip()
+                entry[t] = v[len(look_for):].strip()
                 break
     i = -1
+    # Messages seem to be the last element so suck 
+    # those all up
     for a, v in enumerate(collecting):
         if v.startswith("message:"):
             i = a
             break
     if i != -1:
         msg_lines = collecting[i + 1:]
-        a_entry['message'] = "\n".join(msg_lines)
-    return a_entry
+        entry['message'] = "\n".join(msg_lines)
+    return entry
 
 
 def clean_authors(authors):
@@ -143,6 +131,7 @@ def clean_messages(messages):
 def build_changelog(history=-1):
     cmd = ['bzr', 'log', '--timezone=utc']
     (stdout, _stderr) = tiny_p(cmd)
+
     # Clean the format up
     entries = stdout.splitlines()
     all_entries = []
@@ -157,9 +146,10 @@ def build_changelog(history=-1):
         else:
             collecting.append(e)
 
-    a_entry = extract_entry(collecting)
-    if a_entry:
-        all_entries.append(a_entry)
+    # Anything that we left behind??
+    entry = extract_entry(collecting)
+    if entry:
+        all_entries.append(entry)
 
     if history > 0:
         take_entries = list(all_entries[0:history])
@@ -186,25 +176,26 @@ def build_changelog(history=-1):
         # http://bugs.python.org/issue6641
         timestamp = timestamp.replace("+0000", '').strip()
         ds = datetime.strptime(timestamp, '%a %Y-%m-%d %H:%M:%S')
-        c_ds = ds.date()
-        if c_ds not in date_entries:
-            ap_entry = {}
-            ap_entry['messages'] = []
-            ap_entry['authors'] = []
-            ap_entry['revnos'] = []
-            date_entries[c_ds] = ap_entry
-        ap_entry = date_entries[c_ds]
-        ap_entry['messages'].append(msg)
-        ap_entry['authors'].append(author)
-        ap_entry['revnos'].append(revno)
+        ds = ds.date()
+        if ds not in date_entries:
+            entry = {}
+            entry['messages'] = []
+            entry['authors'] = []
+            entry['revnos'] = []
+            date_entries[ds] = entry
+        entry = date_entries[ds]
+        entry['messages'].append(msg)
+        entry['authors'].append(author)
+        entry['revnos'].append(revno)
 
+    # It wants them in chronological order...
     dates = sorted(date_entries.keys())
     chglog = []
     for ds in reversed(dates):
         e = date_entries[ds]
         authors = clean_authors(e['authors'])
         revnos = clean_revnos(e['revnos'])
-        top_line = "%s %s - %s" % (ds.strftime("%a %b %d %Y"),
+        top_line = "%s %s - [revison %s]" % (ds.strftime("%a %b %d %Y"),
                                    authors, revnos)
         chglog.append("* %s" % (top_line))
         chglog.append(clean_messages(e['messages']))

From c676d0c4e218f9ec43b7aade137bbab324905d2a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 21:04:38 -0700
Subject: [PATCH 351/434] Continue working on cleaning this up

---
 packages/brpm      | 60 +++++++++++++++++++---------------------------
 packages/brpm.tmpl |  2 +-
 2 files changed, 26 insertions(+), 36 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index c989892e..241f08fd 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -44,7 +44,8 @@ def tiny_p(cmd):
                     stderr=subprocess.PIPE, stdin=None)
     (out, err) = sp.communicate()
     if sp.returncode not in [0]:
-        raise RuntimeError("Failed running %s [rc=%s]" % (cmd, sp.returncode))
+        raise RuntimeError("Failed running %s [rc=%s] (%s, %s)" 
+                            % (cmd, sp.returncode, out, err))
     return (out, err)
 
 
@@ -56,19 +57,13 @@ def warn(msg):
     print("WARNING: %s" % (msg))
 
 
-def generate_spec_contents(tmpl_fn):
-
-    # Version junk
-    cmd = [sys.executable, join(os.pardir, 'tools', 'read-version')]
-    (stdout, _stderr) = tiny_p(cmd)
-    i_version = stdout.strip()
+def generate_spec_contents(tmpl_fn, revno, version):
 
     # Tmpl params
     subs = {}
-    subs['version'] = i_version
-    (stdout, _stderr) = tiny_p(['bzr', 'revno'])
-    subs['revno'] = "%s" % (stdout.strip())
-    subs['release'] = "%s" % (subs['revno'])
+    subs['version'] = version
+    subs['revno'] = revno
+    subs['release'] = revno
     subs['archive_name'] = '%{name}-%{version}-' + subs['revno'] + '.tar.gz'
     subs['bd_requires'] = ['python-devel', 'python-setuptools']
 
@@ -90,7 +85,7 @@ def generate_spec_contents(tmpl_fn):
         else:
             requires.append(tgt_pkg)
 
-    base_name = 'cloud-init-%s-%s' % (i_version, subs['revno'])
+    base_name = 'cloud-init-%s-%s' % (version, subs['revno'])
     subs['requires'] = requires
 
     (stdout, _stderr) = tiny_p([sys.executable, 
@@ -126,6 +121,16 @@ def generate_spec_contents(tmpl_fn):
         return (base_name, '%s.tar.gz' % (base_name), contents)
 
 
+def archive_code():
+    (stdout, _stderr) = tiny_p([sys.executable, 
+                               join(os.getcwd(), 'tar-me')])
+    lines = stdout.splitlines()
+    revno = lines[0]
+    version = lines[1]
+    arc_fn = lines[2]
+    return (revno, version, arc_fn)
+
+
 def main():
 
     # Clean out the root dir and make sure the dirs we want are in place
@@ -136,38 +141,23 @@ def main():
     arc_dir = os.path.join(root_dir, 'SOURCES')
     for d in [root_dir, arc_dir]:
         os.makedirs(d)
+        
+    # Archive the code
+    (revno, version, archive_fn) = archive_code()
+    real_archive_fn = os.path.join(arc_dir, os.path.basename(archive_fn))
+    shutil.copy(archive_fn, real_archive_fn)
+    info("Archived code to %s" % (real_archive_fn))
 
     # Form the spec file to be used
     tmpl_fn = os.path.join(os.getcwd(), 'brpm.tmpl')
     info("Generated spec file from template %s" % (tmpl_fn))
-    (base_name, arc_name, contents) = generate_spec_contents(tmpl_fn)
+    (base_name, arc_name, contents) = generate_spec_contents(tmpl_fn,
+                                                             revno, version)
     spec_fn = os.path.join(root_dir, 'cloud-init.spec')
     with open(spec_fn, 'w') as fh:
         fh.write(contents)
         info("Wrote spec file to %s" % (spec_fn))
 
-    # Archive the code and files that we want to
-    with tmpdir() as td:
-        src_dir = os.path.join(td, base_name)
-        os.makedirs(src_dir)
-        for fn in os.listdir(os.pardir):
-            if fn.startswith("."):
-                continue
-            full_fn = os.path.abspath(os.path.join(os.pardir, fn))
-            if os.path.isfile(full_fn):
-                shutil.copy(full_fn, os.path.join(src_dir, fn))
-            else:
-                shutil.copytree(full_fn, os.path.join(src_dir, fn),
-                                ignore=shutil.ignore_patterns('*.pyc',
-                                                              '.bzr',
-                                                              'tmp*',
-                                                              '*bzr*'))
-            arc_fn = os.path.join(arc_dir, arc_name)
-        cmd = ['tar', '-zcvf', arc_fn, '-C', td]
-        cmd.extend(os.listdir(td))
-        tiny_p(cmd)
-        info("Archived code at %s" % (arc_fn))
-
     # Now build it!
     cmd = ['rpmbuild', '-ba', spec_fn]
     info("Running rpmbuild %s" % (cmd))
diff --git a/packages/brpm.tmpl b/packages/brpm.tmpl
index f0c874ee..0128bb69 100644
--- a/packages/brpm.tmpl
+++ b/packages/brpm.tmpl
@@ -32,7 +32,7 @@ ssh keys and to let the user run various scripts.
 
 
 %prep
-%setup -q -n %{name}-%{version}-{{revno}}
+%setup -q -n
 
 %build
 %{__python} setup.py build

From ec56f22b4789641694448aaa548ca5bdac00a7c1 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 21:04:51 -0700
Subject: [PATCH 352/434] Add a small script to tar the whole code

---
 packages/tar-me | 84 +++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 84 insertions(+)
 create mode 100755 packages/tar-me

diff --git a/packages/tar-me b/packages/tar-me
new file mode 100755
index 00000000..b15399a1
--- /dev/null
+++ b/packages/tar-me
@@ -0,0 +1,84 @@
+#!/usr/bin/python
+
+import contextlib
+import os
+import shutil
+import subprocess
+import sys
+import tempfile
+
+
+def join(*paths):
+    p = os.path.join(*paths)
+    return os.path.abspath(p)
+
+
+def tiny_p(cmd):
+    # Darn python 2.6 doesn't have check_output (argggg)
+    sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
+                    stderr=subprocess.PIPE, stdin=None)
+    (out, err) = sp.communicate()
+    if sp.returncode not in [0]:
+        raise RuntimeError("Failed running %s [rc=%s] (%s, %s)" 
+                            % (cmd, sp.returncode, out, err))
+    return (out, err)
+
+
+@contextlib.contextmanager
+def tmpdir():
+    t = tempfile.mkdtemp()
+    try:
+        yield t
+    finally:
+        shutil.rmtree(t)
+
+
+
+def main(args):
+    
+    tag = None
+    if args:
+        tag = args[0]
+
+    with tmpdir() as td:
+        (stdout, _stderr) = tiny_p(['bzr', 'revno'])
+        revno = stdout.strip()
+
+        cmd = [sys.executable, join(os.pardir, 'tools', 'read-version')]
+        (stdout, _stderr) = tiny_p(cmd)
+        version = stdout.strip()
+
+        owcd = os.getcwd()
+        os.chdir(os.path.abspath(os.pardir))
+        if not os.path.exists('setup.py'):
+            raise RuntimeError("No setup.py found in %s" % (os.getcwd()))
+
+        cmd = ['bzr', 'ls', '--versioned']
+        (stdout, _stderr) = tiny_p(cmd)
+        fns = []
+        for fn in stdout.splitlines():
+            fn = fn.strip()
+            if not fn or fn.startswith("."):
+                continue
+            fns.append(fn)
+
+        bfn = 'cloud-init-%s-%s' % (version, revno)
+        fn = '%s.tar.gz' % (bfn)
+        o_fn = join(td, fn)
+        cmd = ['tar', '-czf', o_fn]
+        cmd.extend(fns)
+        tiny_p(cmd)
+
+        os.chdir(owcd)
+        shutil.copy(o_fn, fn)
+
+        print revno
+        print version
+        print(os.path.abspath(fn))
+
+    return 0
+
+
+if __name__ == '__main__':
+    sys.exit(main(sys.argv[1:]))
+

From c5a0fa1ec010cd72ecc0b279807ca2fb8246e276 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 21:06:07 -0700
Subject: [PATCH 353/434] Continue working on cleaning this up

---
 packages/brpm.tmpl | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/packages/brpm.tmpl b/packages/brpm.tmpl
index 0128bb69..f0c874ee 100644
--- a/packages/brpm.tmpl
+++ b/packages/brpm.tmpl
@@ -32,7 +32,7 @@ ssh keys and to let the user run various scripts.
 
 
 %prep
-%setup -q -n
+%setup -q -n %{name}-%{version}-{{revno}}
 
 %build
 %{__python} setup.py build

From 9d845219c9f0fe8bceebbb84acdba2c75b516277 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 21:11:57 -0700
Subject: [PATCH 354/434] Use a directory prefix

---
 packages/tar-me | 12 +++++++++---
 1 file changed, 9 insertions(+), 3 deletions(-)

diff --git a/packages/tar-me b/packages/tar-me
index b15399a1..4a4a0253 100755
--- a/packages/tar-me
+++ b/packages/tar-me
@@ -61,12 +61,18 @@ def main(args):
             if not fn or fn.startswith("."):
                 continue
             fns.append(fn)
-
         bfn = 'cloud-init-%s-%s' % (version, revno)
+        os.makedirs(join(td, bfn))
+        
+        for fn in fns:
+            if os.path.isfile(fn):
+                shutil.copy(fn, join(td, bfn, fn))
+            else:
+                shutil.copytree(fn, join(td, bfn, fn))
+
         fn = '%s.tar.gz' % (bfn)
         o_fn = join(td, fn)
-        cmd = ['tar', '-czf', o_fn]
-        cmd.extend(fns)
+        cmd = ['tar', '-czf', o_fn, '-C', join(td), bfn]
         tiny_p(cmd)
 
         os.chdir(owcd)

From 8fe2f786b21b88cca10abc940f8138e6502d8367 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 21:13:29 -0700
Subject: [PATCH 355/434] Use move instead of copy

---
 packages/tar-me | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/packages/tar-me b/packages/tar-me
index 4a4a0253..261b77bb 100755
--- a/packages/tar-me
+++ b/packages/tar-me
@@ -76,7 +76,7 @@ def main(args):
         tiny_p(cmd)
 
         os.chdir(owcd)
-        shutil.copy(o_fn, fn)
+        shutil.move(o_fn, fn)
 
         print revno
         print version

From 3a13fbc66c3f2f19048ed8b0ddd1049d92df263d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 21:13:37 -0700
Subject: [PATCH 356/434] Use move and not util copy

---
 packages/bddeb | 93 +++++++++++++++++++++++++++++++-------------------
 packages/brpm  |  4 +--
 2 files changed, 59 insertions(+), 38 deletions(-)

diff --git a/packages/bddeb b/packages/bddeb
index 2a089295..465bd986 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -1,45 +1,66 @@
-#!/bin/sh 
+#!/usr/bin/python
 
-# Ensure we can find the setup.py file which
-# should be at the root of the cloud-init tree
-PKG_DIR=`pwd`
-ROOT="$PKG_DIR/../"
-if [ ! -e "$ROOT/setup.py" ]; then
-    echo "No setup.py found at $ROOT"
-    exit 1
-fi
-echo "Using root directory $ROOT for building your debian package"
+import contextlib
+import glob
+import os
+import shutil
+import subprocess
+import sys
+import tempfile
 
-# Ensure tempdir is cleaned and ready to go
-TEMP_D=$(mktemp -d "${TMPDIR:-/tmp}/${0##*/}.XXXXXXX")
-echo "With $TEMP_D as a temporary workspace"
-rm -Rf "${TEMP_D}"; mkdir "${TEMP_D}"
-set -e
 
-# Ensure tempdir removed if breaks...
-trap "rm -Rf '${TEMP_D}'" EXIT SIGINT SIGTERM
+@contextlib.contextmanager
+def tmpdir():
+    t = tempfile.mkdtemp()
+    try:
+        yield t
+    finally:
+        shutil.rmtree(t)
 
-# Go to the root and start making a package!
-cd $ROOT
-files=$(bzr ls --versioned)
-revno=$(bzr revno)
-version=$(tools/read-version)
 
-mkdir "${TEMP_D}/cloud-init"
-otar="$TEMP_D/cloud-init_$version~bzr${revno}.orig.tar.gz"
-tar -czf - ${files} > "$otar"
-tar -C "${TEMP_D}/cloud-init" -xzf - < "$otar"
+def join(*paths):
+    p = os.path.join(*paths)
+    return os.path.abspath(p)
 
-if [ ! -d "${TEMP_D}/cloud-init/debian" ]; then
-   rsync -a $PKG_DIR/debian.trunk/ "${TEMP_D}/cloud-init/debian"
-fi
 
-sed -i -e "s,VERSION,$version," -e "s,REVNO,bzr$revno," \
-          "$TEMP_D/cloud-init/debian/changelog"
+def tiny_p(cmd):
+    # Darn python 2.6 doesn't have check_output (argggg)
+    info("Running %s" % (cmd))
+    sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
+                    stderr=subprocess.PIPE, stdin=None)
+    (out, err) = sp.communicate()
+    if sp.returncode not in [0]:
+        raise RuntimeError("Failed running %s [rc=%s] (%s, %s)" 
+                            % (cmd, sp.returncode, out, err))
+    return (out, err)
 
-cd "${TEMP_D}/cloud-init"
-debuild "$@"
-debname="cloud-init_${version}~bzr${revno}-1_all.deb"
-mv "../$debname" "$PKG_DIR"
-echo "Wrote $debname to $PKG_DIR"
 
+def info(msg):
+    print("INFO: %s" % (msg))
+
+
+def warn(msg):
+    print("WARNING: %s" % (msg))
+
+ 
+
+def main():
+
+    with tmpdir() as td:
+        info("Using %s as a temporary workspace" % (td))
+        (stdout, _stderr) = tiny_p(['bzr', 'revno'])
+        revno = stdout.strip()
+        
+        
+        
+        cmd = [sys.executable, join(os.pardir, 'tools', 'read-version')]
+        (stdout, _stderr) = tiny_p(cmd)
+        version = stdout.strip()
+        
+        
+
+    return 0
+
+
+if __name__ == '__main__':
+    sys.exit(main())
diff --git a/packages/brpm b/packages/brpm
index 241f08fd..febbfb5e 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -145,7 +145,7 @@ def main():
     # Archive the code
     (revno, version, archive_fn) = archive_code()
     real_archive_fn = os.path.join(arc_dir, os.path.basename(archive_fn))
-    shutil.copy(archive_fn, real_archive_fn)
+    shutil.move(archive_fn, real_archive_fn)
     info("Archived code to %s" % (real_archive_fn))
 
     # Form the spec file to be used
@@ -175,7 +175,7 @@ def main():
     for fn in globs:
         n = os.path.basename(fn)
         tgt_fn = os.path.join(os.getcwd(), n)
-        util.copy(fn, tgt_fn)
+        shutil.move(fn, tgt_fn)
         info("Copied %s to %s" % (n, tgt_fn))
 
     return 0

From bf5a58d8f010207997e378824391bdd79c434d31 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 21:33:25 -0700
Subject: [PATCH 357/434] Converting this to use the python utils

---
 packages/bddeb | 46 +++++++++++++++++++++++++++++++++++-----------
 1 file changed, 35 insertions(+), 11 deletions(-)

diff --git a/packages/bddeb b/packages/bddeb
index 465bd986..f2158d5b 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -42,22 +42,46 @@ def info(msg):
 def warn(msg):
     print("WARNING: %s" % (msg))
 
- 
+
+def archive_code():
+    (stdout, _stderr) = tiny_p([sys.executable, 
+                               join(os.getcwd(), 'tar-me')])
+    lines = stdout.splitlines()
+    revno = lines[0]
+    version = lines[1]
+    bname = lines[2]
+    arc_fn = lines[3]
+    return (revno, version, bname, arc_fn)
+
 
 def main():
 
     with tmpdir() as td:
-        info("Using %s as a temporary workspace" % (td))
-        (stdout, _stderr) = tiny_p(['bzr', 'revno'])
-        revno = stdout.strip()
-        
-        
-        
-        cmd = [sys.executable, join(os.pardir, 'tools', 'read-version')]
-        (stdout, _stderr) = tiny_p(cmd)
-        version = stdout.strip()
-        
+        (revno, version, bname, archive_fn) = archive_code()
+        real_archive_fn = os.path.join(td, os.path.basename(archive_fn))
+        shutil.move(archive_fn, real_archive_fn)
+        info("Archived code to %s" % (real_archive_fn))
+
+        cmd = ['tar', '-xvzf', real_archive_fn, '-C', td]
+        stdout, stderr = tiny_p(cmd)
+
+        edir = join(td, bname)
+        shutil.move(edir, join(td, 'cloud-init'))
+        shutil.copytree('debian.trunk', join(td, 'cloud-init', 'debian'))
+
+        cmd = ['sed', '-i', '-e',"s,VERSION,%s," %(version),
+               '-e', "s,REVNO,bzr%s," % (revno),
+               join(td, 'cloud-init', 'debian', 'changelog')]
+        tiny_p(cmd)
         
+        ocwd = os.getcwd()
+        os.chdir(join(td, 'cloud-init'))
+        cmd = ['debuild']
+        tiny_p(cmd)
+
+        debname = "cloud-init_%s~bzr%s-1_all.deb" % (version, revno)
+        shutil.move(debname, join(owcwd, debname))
+        info("Wrote out debian package %s" % (join(owcwd, debname)))
 
     return 0
 

From bcc896deae308f449760ec43f6b4a05388299408 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 21:33:36 -0700
Subject: [PATCH 358/434] Output the base tar name

---
 packages/brpm   | 5 +++--
 packages/tar-me | 1 +
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index febbfb5e..c3be5997 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -90,7 +90,7 @@ def generate_spec_contents(tmpl_fn, revno, version):
 
     (stdout, _stderr) = tiny_p([sys.executable, 
                                join(os.getcwd(), 'rpm-changelog')])
-    subs['changelog'] = stdout
+    subs['changelog'] = stdout.strip()
 
     # See: http://www.zarb.org/~jasonc/macros.php
     # Pickup any special files
@@ -127,7 +127,8 @@ def archive_code():
     lines = stdout.splitlines()
     revno = lines[0]
     version = lines[1]
-    arc_fn = lines[2]
+    bname = lines[2]
+    arc_fn = lines[3]
     return (revno, version, arc_fn)
 
 
diff --git a/packages/tar-me b/packages/tar-me
index 261b77bb..14b59960 100755
--- a/packages/tar-me
+++ b/packages/tar-me
@@ -80,6 +80,7 @@ def main(args):
 
         print revno
         print version
+        print bfn
         print(os.path.abspath(fn))
 
     return 0

From 832c511e0f6087bcf63ab1eededf7ca3edf1effa Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 21:51:36 -0700
Subject: [PATCH 359/434] Get the new builddeb working and fix the rules file

---
 packages/bddeb              | 15 +++++++++++++--
 packages/debian.trunk/rules |  1 -
 2 files changed, 13 insertions(+), 3 deletions(-)

diff --git a/packages/bddeb b/packages/bddeb
index f2158d5b..1a9f13f3 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -15,7 +15,8 @@ def tmpdir():
     try:
         yield t
     finally:
-        shutil.rmtree(t)
+        pass
+        #shutil.rmtree(t)
 
 
 def join(*paths):
@@ -56,6 +57,10 @@ def archive_code():
 
 def main():
 
+    # cmd = ['apt-get', 'install', 'python-nose',
+    #'pyflakes', 'python-mocker', 'cdbs', 'debhelper']
+    # tiny_p(cmd)
+
     with tmpdir() as td:
         (revno, version, bname, archive_fn) = archive_code()
         real_archive_fn = os.path.join(td, os.path.basename(archive_fn))
@@ -68,12 +73,18 @@ def main():
         edir = join(td, bname)
         shutil.move(edir, join(td, 'cloud-init'))
         shutil.copytree('debian.trunk', join(td, 'cloud-init', 'debian'))
-
+        
         cmd = ['sed', '-i', '-e',"s,VERSION,%s," %(version),
                '-e', "s,REVNO,bzr%s," % (revno),
                join(td, 'cloud-init', 'debian', 'changelog')]
         tiny_p(cmd)
         
+        # Seems to want an original tar ball
+        o_tar = "cloud-init_%s~bzr%s.orig.tar.gz" % (version, revno)
+        cmd = ['tar', '-czf', join(td, o_tar), '-C', join(td, 'cloud-init')]
+        cmd.extend(os.listdir(join(td, 'cloud-init')))
+        tiny_p(cmd)
+        
         ocwd = os.getcwd()
         os.chdir(join(td, 'cloud-init'))
         cmd = ['debuild']
diff --git a/packages/debian.trunk/rules b/packages/debian.trunk/rules
index 0f79136c..a907b594 100755
--- a/packages/debian.trunk/rules
+++ b/packages/debian.trunk/rules
@@ -10,7 +10,6 @@ include /usr/share/cdbs/1/class/python-distutils.mk
 DEB_DH_INSTALL_SOURCEDIR := debian/tmp
 
 cloud-init-fixups:
-	for x in $(DEB_DESTDIR)/usr/bin/*.py; do mv "$$x" "$${x%.py}"; done
 	install -d $(DEB_DESTDIR)/etc/rsyslog.d
 	cp tools/21-cloudinit.conf $(DEB_DESTDIR)/etc/rsyslog.d/21-cloudinit.conf
 

From 2fc1bc4957f11c9ad57b8f0f0811085621e6cc66 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 23:55:40 -0700
Subject: [PATCH 360/434] Move redhat spec file templates to this directory

---
 packages/{brpm.tmpl => redhat/cloud-init.spec} | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 rename packages/{brpm.tmpl => redhat/cloud-init.spec} (100%)

diff --git a/packages/brpm.tmpl b/packages/redhat/cloud-init.spec
similarity index 100%
rename from packages/brpm.tmpl
rename to packages/redhat/cloud-init.spec

From 07e6ade94066848ebe91fb0f5cde8bdd6c314abf Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 23:55:48 -0700
Subject: [PATCH 361/434] Rename this to be 'make-tarball' to match the other
 tar tools name, also change output to be tab separated.

---
 packages/{tar-me => make-tarball} | 8 +++-----
 1 file changed, 3 insertions(+), 5 deletions(-)
 rename packages/{tar-me => make-tarball} (95%)

diff --git a/packages/tar-me b/packages/make-tarball
similarity index 95%
rename from packages/tar-me
rename to packages/make-tarball
index 14b59960..98f669a9 100755
--- a/packages/tar-me
+++ b/packages/make-tarball
@@ -78,11 +78,9 @@ def main(args):
         os.chdir(owcd)
         shutil.move(o_fn, fn)
 
-        print revno
-        print version
-        print bfn
-        print(os.path.abspath(fn))
-
+        out = [revno, version, bfn, os.path.abspath(fn)]
+        print('\t'.join(out))
+        
     return 0
 
 

From 41d79ff623e9e2920783887f3ac09e28c800c84e Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 23:56:15 -0700
Subject: [PATCH 362/434] 1. Change these to be templates where possible. 2.
 Rename to be a debian subdir, matching the redhat subdir.

---
 packages/{debian.trunk => debian}/changelog | 2 +-
 packages/{debian.trunk => debian}/compat    | 0
 packages/{debian.trunk => debian}/control   | 8 +++-----
 packages/{debian.trunk => debian}/copyright | 0
 packages/{debian.trunk => debian}/dirs      | 0
 packages/{debian.trunk => debian}/pycompat  | 0
 packages/{debian.trunk => debian}/rules     | 0
 7 files changed, 4 insertions(+), 6 deletions(-)
 rename packages/{debian.trunk => debian}/changelog (55%)
 rename packages/{debian.trunk => debian}/compat (100%)
 rename packages/{debian.trunk => debian}/control (85%)
 rename packages/{debian.trunk => debian}/copyright (100%)
 rename packages/{debian.trunk => debian}/dirs (100%)
 rename packages/{debian.trunk => debian}/pycompat (100%)
 rename packages/{debian.trunk => debian}/rules (100%)

diff --git a/packages/debian.trunk/changelog b/packages/debian/changelog
similarity index 55%
rename from packages/debian.trunk/changelog
rename to packages/debian/changelog
index a36d00d6..ac5bcf98 100644
--- a/packages/debian.trunk/changelog
+++ b/packages/debian/changelog
@@ -1,4 +1,4 @@
-cloud-init (VERSION~REVNO-1) UNRELEASED; urgency=low
+cloud-init ({{version}}~{{revision}}-1) UNRELEASED; urgency=low
 
   * build
 
diff --git a/packages/debian.trunk/compat b/packages/debian/compat
similarity index 100%
rename from packages/debian.trunk/compat
rename to packages/debian/compat
diff --git a/packages/debian.trunk/control b/packages/debian/control
similarity index 85%
rename from packages/debian.trunk/control
rename to packages/debian/control
index f0dcef6a..e00901af 100644
--- a/packages/debian.trunk/control
+++ b/packages/debian/control
@@ -17,12 +17,10 @@ Architecture: all
 Depends: cloud-utils,
          procps,
          python,
-         python-boto (>=2.0),
-         python-cheetah,
-         python-configobj,
-         python-oauth,
+{{for r in requires}}
+         {{r}},
+{{endfor}}
          python-software-properties,
-         python-yaml,
          ${misc:Depends},
          ${python:Depends}
 XB-Python-Version: ${python:Versions}
diff --git a/packages/debian.trunk/copyright b/packages/debian/copyright
similarity index 100%
rename from packages/debian.trunk/copyright
rename to packages/debian/copyright
diff --git a/packages/debian.trunk/dirs b/packages/debian/dirs
similarity index 100%
rename from packages/debian.trunk/dirs
rename to packages/debian/dirs
diff --git a/packages/debian.trunk/pycompat b/packages/debian/pycompat
similarity index 100%
rename from packages/debian.trunk/pycompat
rename to packages/debian/pycompat
diff --git a/packages/debian.trunk/rules b/packages/debian/rules
similarity index 100%
rename from packages/debian.trunk/rules
rename to packages/debian/rules

From b9029e9c55ab9cfba1a9768b0a52e542700f2e7c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 25 Jun 2012 23:57:01 -0700
Subject: [PATCH 363/434] Get these working again after the subdirectory and
 output format changes.

---
 packages/bddeb | 99 +++++++++++++++++++++++++++++++++++++-------------
 packages/brpm  | 32 ++++++++--------
 2 files changed, 89 insertions(+), 42 deletions(-)

diff --git a/packages/bddeb b/packages/bddeb
index 1a9f13f3..c39965da 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -8,6 +8,17 @@ import subprocess
 import sys
 import tempfile
 
+import tempita
+
+PKG_MP = {
+    'tempita': 'python-tempita',
+    'boto': 'python-boto',
+    'configobj': 'python-configobj',
+    'oauth': 'python-oauth',
+    'yaml': 'python-yaml',
+    'prettytable': 'python-prettytable',
+    'argparse': 'python-argparse',
+}
 
 @contextlib.contextmanager
 def tmpdir():
@@ -24,11 +35,16 @@ def join(*paths):
     return os.path.abspath(p)
 
 
-def tiny_p(cmd):
+def tiny_p(cmd, capture=True):
     # Darn python 2.6 doesn't have check_output (argggg)
     info("Running %s" % (cmd))
-    sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
-                    stderr=subprocess.PIPE, stdin=None)
+    stdout = subprocess.PIPE
+    stderr = subprocess.PIPE
+    if not capture:
+        stdout = None
+        stderr = None
+    sp = subprocess.Popen(cmd, stdout=stdout,
+                    stderr=stderr, stdin=None)
     (out, err) = sp.communicate()
     if sp.returncode not in [0]:
         raise RuntimeError("Failed running %s [rc=%s] (%s, %s)" 
@@ -36,6 +52,53 @@ def tiny_p(cmd):
     return (out, err)
 
 
+def tmpl_file(name, params):
+    with open(join('debian', name), 'r') as fh:
+        contents = fh.read()
+    tpl = tempita.Template(contents)
+    return tpl.substitute(**params)
+    
+
+def write_debian(version, revno, root):
+    db_dir = join(root, 'debian')
+    os.makedirs(db_dir)
+    
+    # Fill in the change log template
+    with open(join(db_dir, 'changelog'), 'w') as fh:
+        params = {
+            'version': version,
+            'revision': revno,
+        }
+        contents = tmpl_file('changelog', params) 
+        fh.write(contents)
+
+    # Write out the control file template
+    cmd = [sys.executable, join(os.pardir, 'tools', 'read-dependencies')]
+    (stdout, _stderr) = tiny_p(cmd)
+    pkgs = stdout.splitlines()
+    requires = []
+    
+    # Map to known packages
+    for e in pkgs:
+        e = e.lower().strip()
+        tgt_pkg = None
+        for n in PKG_MP.keys():
+            if e.find(n) != -1:
+                tgt_pkg = PKG_MP.get(n)
+        if not tgt_pkg:
+            raise RuntimeError(("Do not know how to translate %s to "
+                                " a known package") % (e))
+        else:
+            requires.append(tgt_pkg)
+    contents = tmpl_file('control', {'requires': requires})
+    with open(join(db_dir, 'control'), 'w') as fh:
+        fh.write(contents)
+    
+    # Just copy the following directly
+    for fn in ['dirs', 'copyright', 'compat', 'pycompat', 'rules']:
+        shutil.copy(join('debian', fn), 
+                    join(db_dir, fn))
+
 def info(msg):
     print("INFO: %s" % (msg))
 
@@ -46,49 +109,33 @@ def warn(msg):
 
 def archive_code():
     (stdout, _stderr) = tiny_p([sys.executable, 
-                               join(os.getcwd(), 'tar-me')])
-    lines = stdout.splitlines()
-    revno = lines[0]
-    version = lines[1]
-    bname = lines[2]
-    arc_fn = lines[3]
-    return (revno, version, bname, arc_fn)
+                               join(os.getcwd(), 'make-tarball')])
+    return stdout.split(None)
 
 
 def main():
 
-    # cmd = ['apt-get', 'install', 'python-nose',
-    #'pyflakes', 'python-mocker', 'cdbs', 'debhelper']
-    # tiny_p(cmd)
-
     with tmpdir() as td:
         (revno, version, bname, archive_fn) = archive_code()
         real_archive_fn = os.path.join(td, os.path.basename(archive_fn))
         shutil.move(archive_fn, real_archive_fn)
-        info("Archived code to %s" % (real_archive_fn))
-
         cmd = ['tar', '-xvzf', real_archive_fn, '-C', td]
         stdout, stderr = tiny_p(cmd)
 
         edir = join(td, bname)
         shutil.move(edir, join(td, 'cloud-init'))
-        shutil.copytree('debian.trunk', join(td, 'cloud-init', 'debian'))
-        
-        cmd = ['sed', '-i', '-e',"s,VERSION,%s," %(version),
-               '-e', "s,REVNO,bzr%s," % (revno),
-               join(td, 'cloud-init', 'debian', 'changelog')]
-        tiny_p(cmd)
-        
+        write_debian(version, revno, join(td, 'cloud-init'))
+
         # Seems to want an original tar ball
-        o_tar = "cloud-init_%s~bzr%s.orig.tar.gz" % (version, revno)
-        cmd = ['tar', '-czf', join(td, o_tar), '-C', join(td, 'cloud-init')]
+        o_tar = "cloud-init_%s~%s.orig.tar.gz" % (version, revno)
+        cmd = ['tar', '-czvf', join(td, o_tar), '-C', join(td, 'cloud-init')]
         cmd.extend(os.listdir(join(td, 'cloud-init')))
         tiny_p(cmd)
         
         ocwd = os.getcwd()
         os.chdir(join(td, 'cloud-init'))
         cmd = ['debuild']
-        tiny_p(cmd)
+        tiny_p(cmd, capture=False)
 
         debname = "cloud-init_%s~bzr%s-1_all.deb" % (version, revno)
         shutil.move(debname, join(owcwd, debname))
diff --git a/packages/brpm b/packages/brpm
index c3be5997..bbe637e8 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -37,11 +37,16 @@ def join(*paths):
     return os.path.abspath(p)
 
 
-def tiny_p(cmd):
+def tiny_p(cmd, capture=True):
     # Darn python 2.6 doesn't have check_output (argggg)
     info("Running %s" % (cmd))
-    sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
-                    stderr=subprocess.PIPE, stdin=None)
+    stdout = subprocess.PIPE
+    stderr = subprocess.PIPE
+    if not capture:
+        stdout = None
+        stderr = None
+    sp = subprocess.Popen(cmd, stdout=stdout,
+                    stderr=stderr, stdin=None)
     (out, err) = sp.communicate()
     if sp.returncode not in [0]:
         raise RuntimeError("Failed running %s [rc=%s] (%s, %s)" 
@@ -123,12 +128,8 @@ def generate_spec_contents(tmpl_fn, revno, version):
 
 def archive_code():
     (stdout, _stderr) = tiny_p([sys.executable, 
-                               join(os.getcwd(), 'tar-me')])
-    lines = stdout.splitlines()
-    revno = lines[0]
-    version = lines[1]
-    bname = lines[2]
-    arc_fn = lines[3]
+                               join(os.getcwd(), 'make-tarball')])
+    (revno, version, bname, arc_fn) = stdout.split(None)
     return (revno, version, arc_fn)
 
 
@@ -136,7 +137,7 @@ def main():
 
     # Clean out the root dir and make sure the dirs we want are in place
     root_dir = os.path.expanduser("~/rpmbuild")
-    info("Cleaning %s" % (root_dir))
+    info("Cleaning %r" % (root_dir))
     if os.path.isdir(root_dir):
         shutil.rmtree(root_dir)
     arc_dir = os.path.join(root_dir, 'SOURCES')
@@ -147,22 +148,21 @@ def main():
     (revno, version, archive_fn) = archive_code()
     real_archive_fn = os.path.join(arc_dir, os.path.basename(archive_fn))
     shutil.move(archive_fn, real_archive_fn)
-    info("Archived code to %s" % (real_archive_fn))
+    info("Archived code to %r" % (real_archive_fn))
 
     # Form the spec file to be used
-    tmpl_fn = os.path.join(os.getcwd(), 'brpm.tmpl')
-    info("Generated spec file from template %s" % (tmpl_fn))
+    tmpl_fn = os.path.join(os.getcwd(), 'redhat', 'cloud-init.spec')
+    info("Generated spec file from template %r" % (tmpl_fn))
     (base_name, arc_name, contents) = generate_spec_contents(tmpl_fn,
                                                              revno, version)
     spec_fn = os.path.join(root_dir, 'cloud-init.spec')
     with open(spec_fn, 'w') as fh:
         fh.write(contents)
-        info("Wrote spec file to %s" % (spec_fn))
+        info("Wrote spec file to %r" % (spec_fn))
 
     # Now build it!
     cmd = ['rpmbuild', '-ba', spec_fn]
-    info("Running rpmbuild %s" % (cmd))
-    tiny_p(cmd)
+    tiny_p(cmd, capture=False)
     info("Rpmbuild completed!")
 
     # Copy the items built to our local dir

From 32cc25b3f3c86f8d2745824372c9fbb18b657a26 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 26 Jun 2012 00:10:30 -0700
Subject: [PATCH 364/434] Add a section for building an rpm and a section for
 building a deb

---
 Makefile | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/Makefile b/Makefile
index c20dfbd3..a96d6b5b 100644
--- a/Makefile
+++ b/Makefile
@@ -23,5 +23,11 @@ clean:
 	rm -rf /var/log/cloud-init.log \
 		   /var/lib/cloud/
 
-.PHONY: test pylint pyflakes 2to3 clean pep8
+rpm:
+	cd packages && ./brpm
+
+deb:
+	cd packages && ./bddeb
+
+.PHONY: test pylint pyflakes 2to3 clean pep8 rpm deb
 

From c69355cbcd317295978f8cbe18c0cc3391bb10e4 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 26 Jun 2012 00:48:38 -0700
Subject: [PATCH 365/434] Removed, just going to use the base 'ChangeLog' file.

---
 packages/rpm-changelog | 211 -----------------------------------------
 1 file changed, 211 deletions(-)
 delete mode 100755 packages/rpm-changelog

diff --git a/packages/rpm-changelog b/packages/rpm-changelog
deleted file mode 100755
index 8acaa5b9..00000000
--- a/packages/rpm-changelog
+++ /dev/null
@@ -1,211 +0,0 @@
-#!/usr/bin/python
-# vi: ts=4 expandtab
-
-# A crappy little script
-# that changes bzr 'log' 
-# into someting that rpm spec files can use (best effort)
-
-import os
-import re
-import sys
-
-from datetime import datetime
-from datetime import date
-
-import subprocess
-
-E_TYPES = ['tags', 'revno', 'author', 'timestamp', 'committer']
-
-
-def tiny_p(cmd):
-    # Darn python 2.6 doesn't have check_output (argggg)
-    sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
-                    stderr=subprocess.PIPE, stdin=None)
-    (out, err) = sp.communicate()
-    return (out, err)
-
-
-def extract_entry(collecting):
-    entry = {}
-    for t in E_TYPES:
-        look_for = "%s:" % (t)
-        for v in collecting:
-            if v.startswith(look_for):
-                entry[t] = v[len(look_for):].strip()
-                break
-    i = -1
-    # Messages seem to be the last element so suck 
-    # those all up
-    for a, v in enumerate(collecting):
-        if v.startswith("message:"):
-            i = a
-            break
-    if i != -1:
-        msg_lines = collecting[i + 1:]
-        entry['message'] = "\n".join(msg_lines)
-    return entry
-
-
-def clean_authors(authors):
-    if not authors:
-        return ''
-    auth_cleaned = set()
-    for a in authors:
-        a = a.strip()
-        if a:
-            auth_cleaned.add(a)
-    if not auth_cleaned:
-        return ''
-    uniq_authors = list(auth_cleaned)
-    if len(uniq_authors) == 1:
-        return authors[0]
-    auths = "(%s)" % ", ".join(uniq_authors)
-    return auths
-
-
-def clean_revnos(revnos):
-    novs = list()
-    for r in revnos:
-        r = r.strip()
-        r = r.replace("[merge]", "")
-        if r:
-            novs.append(int(r))
-    entries = list(novs)
-    if not entries:
-        return ''
-    entries.sort()
-    if len(entries) == 1:
-        return "%s" % (entries[0])
-
-    # Check if consecutive
-    start = entries[0]
-    consec = True
-    for (i, v) in enumerate(entries):
-        if v != start + i:
-            consec = False
-            break
-    if consec:
-        end = entries[-1]
-        return "%s => %s" % (start, end)
-    v = [str(b) for b in entries]
-    return ", ".join(v)
-
-
-def spacey(am):
-    return " " * am
-
-
-def justify(text, space_wanted):
-    c_bef = len(text)
-    t_c = len(text.lstrip())
-    space_am = (c_bef - t_c)
-    needed = (space_wanted - space_am)
-    if needed < 0:
-        return text
-    return (" " * (needed) + text)
-
-
-def clean_messages(messages):
-    contents = []
-    for msg in messages:
-        # Split into sub-messages...
-        # if we can
-        lines = []
-        pieces = msg.splitlines()
-        if len(pieces) == 1:
-            lines.append("%s- %s " %
-                         (spacey(4), msg.strip()))
-        else:
-            n_lines = []
-            n_lines.append(pieces[0].strip())
-            for line in pieces[1:]:
-                line = line.lstrip()
-                if not line:
-                    continue
-                n_lines.append(justify(line, 6))
-            lines.append("%s- %s" % (spacey(4), "\n".join(n_lines)))
-        contents.extend(lines)
-    return "\n".join(contents)
-
-
-def build_changelog(history=-1):
-    cmd = ['bzr', 'log', '--timezone=utc']
-    (stdout, _stderr) = tiny_p(cmd)
-
-    # Clean the format up
-    entries = stdout.splitlines()
-    all_entries = []
-    collecting = []
-    for e in entries:
-        if e.startswith("---"):
-            if collecting:
-                a_entry = extract_entry(collecting)
-                if a_entry:
-                    all_entries.append(a_entry)
-                collecting = []
-        else:
-            collecting.append(e)
-
-    # Anything that we left behind??
-    entry = extract_entry(collecting)
-    if entry:
-        all_entries.append(entry)
-
-    if history > 0:
-        take_entries = list(all_entries[0:history])
-    else:
-        take_entries = list(all_entries)
-
-    # Merge those with same date
-    date_entries = {}
-    for e in take_entries:
-        author = e.get('author')
-        if not author:
-            author = e.get('committer')
-        if not author:
-            continue
-        timestamp = e.get('timestamp')
-        if not timestamp:
-            continue
-        msg = e.get('message')
-        if not msg:
-            continue
-        revno = e.get('revno')
-        if not revno:
-            continue
-        # http://bugs.python.org/issue6641
-        timestamp = timestamp.replace("+0000", '').strip()
-        ds = datetime.strptime(timestamp, '%a %Y-%m-%d %H:%M:%S')
-        ds = ds.date()
-        if ds not in date_entries:
-            entry = {}
-            entry['messages'] = []
-            entry['authors'] = []
-            entry['revnos'] = []
-            date_entries[ds] = entry
-        entry = date_entries[ds]
-        entry['messages'].append(msg)
-        entry['authors'].append(author)
-        entry['revnos'].append(revno)
-
-    # It wants them in chronological order...
-    dates = sorted(date_entries.keys())
-    chglog = []
-    for ds in reversed(dates):
-        e = date_entries[ds]
-        authors = clean_authors(e['authors'])
-        revnos = clean_revnos(e['revnos'])
-        top_line = "%s %s - [revison %s]" % (ds.strftime("%a %b %d %Y"),
-                                   authors, revnos)
-        chglog.append("* %s" % (top_line))
-        chglog.append(clean_messages(e['messages']))
-    return "\n".join(chglog)
-
-
-if __name__ == '__main__':
-    args = sys.argv[1:]
-    history_am = -1
-    if args:
-        history_am = int(args[0])
-    chglog = build_changelog(history_am)
-    print chglog

From 6a257b89fd70a65d21a1db53f267d4452c30858d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 26 Jun 2012 00:48:55 -0700
Subject: [PATCH 366/434] Just use the base changelog.

---
 packages/brpm | 60 ++++++++++++++++++++++++++++++++++++++++++++++++---
 1 file changed, 57 insertions(+), 3 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index bbe637e8..081d092b 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -7,9 +7,11 @@ import shutil
 import subprocess
 import sys
 import tempfile
+import re
 
 import tempita
 
+from datetime import datetime
 
 # Mapping of expected packages to there full name...
 PKG_MP = {
@@ -53,6 +55,46 @@ def tiny_p(cmd, capture=True):
                             % (cmd, sp.returncode, out, err))
     return (out, err)
 
+def get_log_header(version):
+    cmd = ['bzr', 'tags']
+    (stdout, _stderr) = tiny_p(cmd)
+    a_rev = None
+    for t in stdout.splitlines():
+        ver, rev = t.split(None)
+        if ver == version:
+            a_rev = rev
+            break
+    if not a_rev:
+        return format_change_line(datetime.now(),
+                                  '??', version)
+    cmd = ['bzr', 'log', '-r%s' % (a_rev), '--timezone=utc']
+    (stdout, _stderr) = tiny_p(cmd)
+    kvs = {
+        'comment': version,
+    }
+    for line in stdout.splitlines():
+        if line.startswith('committer:'):
+            kvs['who'] = line[len('committer:'):].strip()
+        if line.startswith('timestamp:'):
+            ts = line[len('timestamp:'):]
+            ts = ts.strip()
+            # http://bugs.python.org/issue6641
+            ts = ts.replace("+0000", '').strip()
+            ds = datetime.strptime(ts, '%a %Y-%m-%d %H:%M:%S')
+            kvs['ds'] = ds
+    return format_change_line(**kvs)
+
+def format_change_line(ds, who, comment=None):
+    d = format_rpm_date(ds)
+    d += " - %s" % (who)
+    if comment:
+        d += " - %s" % (comment)
+    return "* %s" % (d)
+
+
+def format_rpm_date(ds):
+    return ds.strftime("%a %b %d %Y")
+
 
 def info(msg):
     print("INFO: %s" % (msg))
@@ -93,9 +135,21 @@ def generate_spec_contents(tmpl_fn, revno, version):
     base_name = 'cloud-init-%s-%s' % (version, subs['revno'])
     subs['requires'] = requires
 
-    (stdout, _stderr) = tiny_p([sys.executable, 
-                               join(os.getcwd(), 'rpm-changelog')])
-    subs['changelog'] = stdout.strip()
+    # Format a nice changelog (as best as we can)
+    changelog = ''
+    with open(join(os.pardir, 'ChangeLog')) as fh:
+        changelog = fh.read()
+    ch_lines = []
+    for line in changelog.splitlines():
+        if not line.strip():
+            continue
+        if re.match(r"^\s*[\d][.][\d][.][\d]:\s*", line):
+            line = line.strip(":")
+            header = get_log_header(line)
+            ch_lines.append(header)
+        else:
+            ch_lines.append(line)
+    subs['changelog'] = "\n".join(ch_lines)
 
     # See: http://www.zarb.org/~jasonc/macros.php
     # Pickup any special files

From 7f99a3b3006210b99d16e5eb28c892fe90017eb0 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Tue, 26 Jun 2012 07:16:05 -0700
Subject: [PATCH 367/434] Remove the '.sh' extension

---
 initd/{cloud-config.sh => cloud-config}         | 0
 initd/{cloud-final.sh => cloud-final}           | 0
 initd/{cloud-init.sh => cloud-init}             | 0
 initd/{cloud-init-local.sh => cloud-init-local} | 0
 4 files changed, 0 insertions(+), 0 deletions(-)
 rename initd/{cloud-config.sh => cloud-config} (100%)
 rename initd/{cloud-final.sh => cloud-final} (100%)
 rename initd/{cloud-init.sh => cloud-init} (100%)
 rename initd/{cloud-init-local.sh => cloud-init-local} (100%)

diff --git a/initd/cloud-config.sh b/initd/cloud-config
similarity index 100%
rename from initd/cloud-config.sh
rename to initd/cloud-config
diff --git a/initd/cloud-final.sh b/initd/cloud-final
similarity index 100%
rename from initd/cloud-final.sh
rename to initd/cloud-final
diff --git a/initd/cloud-init.sh b/initd/cloud-init
similarity index 100%
rename from initd/cloud-init.sh
rename to initd/cloud-init
diff --git a/initd/cloud-init-local.sh b/initd/cloud-init-local
similarity index 100%
rename from initd/cloud-init-local.sh
rename to initd/cloud-init-local

From aa530fa2bd443e630552f0bd7589d28554615bdc Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Tue, 26 Jun 2012 07:47:29 -0700
Subject: [PATCH 368/434] Add all the upstart/systemd/init.d files.

Let the package building solutions figure out exactly which
of these they wish to delete or wish to take, since setup.py
cannot know; it just has to install them all.
---
 setup.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/setup.py b/setup.py
index fd67da46..402443ea 100755
--- a/setup.py
+++ b/setup.py
@@ -67,7 +67,11 @@ setuptools.setup(name='cloud-init',
                   ('/etc/cloud/cloud.cfg.d', glob('config/cloud.cfg.d/*')),
                   ('/etc/cloud/templates', glob('templates/*')),
                   # Only really need for upstart based systems
-                  #('/etc/init', glob('upstart/*.conf')),
+                  ('/etc/init', glob('upstart/*.conf')),
+                  # Only really need for systemd based systems
+                  ('/etc/systemd/system', glob('systemd/*.service')),
+                  # Only really need for init.d based system
+                  ('/etc/init.d', glob('initd/*')),
                   ('/usr/share/cloud-init', []),
                   ('/usr/lib/cloud-init',
                     ['tools/uncloud-init', 'tools/write-ssh-key-fingerprints']),

From ead28165e458cd7b823eaeb94bfdf3ab1a146130 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Tue, 26 Jun 2012 07:48:12 -0700
Subject: [PATCH 369/434] Add in the ability to choose which type of boot type
 the rpm should have and adjust the specfile that is generated to remove the
 unwanted config files for the types which were not selected.

---
 packages/brpm                   | 30 ++++++++++++++++++++++++++++--
 packages/redhat/cloud-init.spec |  6 +++++-
 2 files changed, 33 insertions(+), 3 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index 081d092b..b505e6b4 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -9,6 +9,8 @@ import sys
 import tempfile
 import re
 
+import argparse
+
 import tempita
 
 from datetime import datetime
@@ -104,7 +106,7 @@ def warn(msg):
     print("WARNING: %s" % (msg))
 
 
-def generate_spec_contents(tmpl_fn, revno, version):
+def generate_spec_contents(args, tmpl_fn, revno, version):
 
     # Tmpl params
     subs = {}
@@ -172,6 +174,22 @@ def generate_spec_contents(tmpl_fn, revno, version):
         '%{_bindir}/*',
         '/usr/lib/cloud-init/*',
     ]
+    # Since setup.py installs them
+    # all, we need to selectively 
+    # knock off the wrong ones and
+    # ensure the right one is kept
+    post_remove_keep = {
+        'initd': '/etc/init.d/',
+        'systemd': '/etc/systemd/',
+        'upstart': '/etc/init/',
+    }
+    post_remove = []
+    for (k, v) in post_remove_keep.iteritems():
+        if k != args.boot:
+            post_remove.append(v)
+        else:
+            other_files.append(v)
+    subs['post_remove'] = post_remove
     subs['files'] = other_files
     
     with open(tmpl_fn, 'r') as fh:
@@ -188,6 +206,13 @@ def archive_code():
 
 
 def main():
+    
+    parser = argparse.ArgumentParser()
+    parser.add_argument("-b", "--boot", dest="boot",
+                        help="select boot type (default: %(default)s)", 
+                        metavar="TYPE", default='initd',
+                        choices=['upstart', 'initd', 'systemd'])
+    args = parser.parse_args()
 
     # Clean out the root dir and make sure the dirs we want are in place
     root_dir = os.path.expanduser("~/rpmbuild")
@@ -207,7 +232,8 @@ def main():
     # Form the spec file to be used
     tmpl_fn = os.path.join(os.getcwd(), 'redhat', 'cloud-init.spec')
     info("Generated spec file from template %r" % (tmpl_fn))
-    (base_name, arc_name, contents) = generate_spec_contents(tmpl_fn,
+    (base_name, arc_name, contents) = generate_spec_contents(args,
+                                                             tmpl_fn,
                                                              revno, version)
     spec_fn = os.path.join(root_dir, 'cloud-init.spec')
     with open(spec_fn, 'w') as fh:
diff --git a/packages/redhat/cloud-init.spec b/packages/redhat/cloud-init.spec
index f0c874ee..ddb6617d 100644
--- a/packages/redhat/cloud-init.spec
+++ b/packages/redhat/cloud-init.spec
@@ -37,11 +37,15 @@ ssh keys and to let the user run various scripts.
 %build
 %{__python} setup.py build
 
-
 %install
 rm -rf $RPM_BUILD_ROOT
 %{__python} setup.py install -O1 --skip-build --root $RPM_BUILD_ROOT
 
+# Remove anything after it was installed??
+{{for r in post_remove}}
+rm -rfv $RPM_BUILD_ROOT/{{r}}
+{{endfor}}
+
 %clean
 rm -rf $RPM_BUILD_ROOT
 

From 1f08c95198d16098ce9f03581e5ad1c011f04e3e Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Tue, 26 Jun 2012 07:55:21 -0700
Subject: [PATCH 370/434] Add check that the changelog version is the same as
 the code version

---
 tools/read-version | 21 ++++++++++++++++++++-
 1 file changed, 20 insertions(+), 1 deletion(-)

diff --git a/tools/read-version b/tools/read-version
index 4458c712..e6167a2c 100755
--- a/tools/read-version
+++ b/tools/read-version
@@ -5,6 +5,15 @@ import os
 import sys
 import re
 
+from distutils import version as ver
+
+possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
+        sys.argv[0]), os.pardir, os.pardir))
+if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
+    sys.path.insert(0, possible_topdir)
+
+from cloudinit import version as cver
+
 def parse_versions(fn):
     with open(fn, 'r') as fh:
         lines = fh.read().splitlines()
@@ -47,5 +56,15 @@ if __name__ == '__main__':
             sys.stderr.write("No versions found in %s!\n" % (fn))
             sys.exit(1)
         else:
-            sys.stdout.write(versions[0].strip())
+            # Check that the code version is the same 
+            # as the version we found!
+            ch_ver = versions[0].strip()
+            code_ver = cver.version()
+            ch_ver_obj = ver.StrictVersion(ch_ver)
+            if ch_ver_obj != code_ver:
+                sys.stderr.write(("Code version %s does not match"
+                                  " changelog version %s\n") % 
+                                  (code_ver, ch_ver_obj))
+                sys.exit(1)
+            sys.stdout.write(ch_ver)
             sys.exit(0)

From fc6ebd5aecf34b8e30697884f5bb4fbd6ca99105 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Tue, 26 Jun 2012 07:56:54 -0700
Subject: [PATCH 371/434] Copy the tiny_p from the packager code

---
 setup.py | 16 +++++++++++++---
 1 file changed, 13 insertions(+), 3 deletions(-)

diff --git a/setup.py b/setup.py
index 402443ea..810ebb48 100755
--- a/setup.py
+++ b/setup.py
@@ -29,10 +29,20 @@ import setuptools
 
 import subprocess
 
-def tiny_p(cmd):
-    sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
-                    stderr=subprocess.PIPE, stdin=None)
+
+def tiny_p(cmd, capture=True):
+    # Darn python 2.6 doesn't have check_output (argggg)
+    stdout = subprocess.PIPE
+    stderr = subprocess.PIPE
+    if not capture:
+        stdout = None
+        stderr = None
+    sp = subprocess.Popen(cmd, stdout=stdout,
+                    stderr=stderr, stdin=None)
     (out, err) = sp.communicate()
+    if sp.returncode not in [0]:
+        raise RuntimeError("Failed running %s [rc=%s] (%s, %s)" 
+                            % (cmd, sp.returncode, out, err))
     return (out, err)
 
 

From 9189b96786789eb3164c7e65df829a1ae9e77fca Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Tue, 26 Jun 2012 07:59:34 -0700
Subject: [PATCH 372/434] Relax the version numbers for now.

---
 Requires | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/Requires b/Requires
index bbe7baec..10be0155 100644
--- a/Requires
+++ b/Requires
@@ -3,28 +3,28 @@
 # Used for templating any files or strings that are considered 
 # to be templates, not cheetah since it pulls in alot of extra libs.
 # This one is pretty dinky and does want we want (var substituion)
-Tempita>=0.4
+Tempita
 
 # This is used for any pretty printing of tabular data.
-PrettyTable>=0.4
+PrettyTable
 
 # This one is currently only used by the MAAS datasource. If that
 # datasource is removed, this is no longer needed
-oauth>=1.0
+oauth
 
 # This is used to fetch the ec2 metadata into a easily
 # parseable format, instead of having to have cloud-init perform
 # those same fetchs and decodes and signing (...) that ec2 requires.
-boto>=2.4
+boto
 
 # This is only needed for places where we need to support configs in a manner
 # that the built-in config parser is not sufficent (ie
 # when we need to preserve comments, or do not have a top-level
 # section)...
-configobj>=4.6
+configobj
 
 # All new style configurations are in the yaml format
-pyyaml>=3.0
+pyyaml
 
 # The new main entrypoint uses argparse instead of optparse
-argparse>=1.1
+argparse

From 49966a47c274e6913a327dae1500afccd7d60bd8 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Tue, 26 Jun 2012 08:04:28 -0700
Subject: [PATCH 373/434] 1. Remove unused return arguments 2. Adjust info
 statement to reflect better what it is doing.

---
 packages/brpm | 8 +++-----
 1 file changed, 3 insertions(+), 5 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index b505e6b4..db60bf81 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -195,7 +195,7 @@ def generate_spec_contents(args, tmpl_fn, revno, version):
     with open(tmpl_fn, 'r') as fh:
         tmpl = tempita.Template(fh.read())
         contents = tmpl.substitute(**subs)
-        return (base_name, '%s.tar.gz' % (base_name), contents)
+        return contents
 
 
 def archive_code():
@@ -231,10 +231,8 @@ def main():
 
     # Form the spec file to be used
     tmpl_fn = os.path.join(os.getcwd(), 'redhat', 'cloud-init.spec')
-    info("Generated spec file from template %r" % (tmpl_fn))
-    (base_name, arc_name, contents) = generate_spec_contents(args,
-                                                             tmpl_fn,
-                                                             revno, version)
+    info("Generating spec file from template %r" % (tmpl_fn))
+    contents = generate_spec_contents(args, tmpl_fn, revno, version)
     spec_fn = os.path.join(root_dir, 'cloud-init.spec')
     with open(spec_fn, 'w') as fh:
         fh.write(contents)

From 5d74b8005c2ff37c8ee830bee4784fdcced15f76 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 26 Jun 2012 12:16:39 -0700
Subject: [PATCH 374/434] 1. Add a chdir context manager 2. Add an abs path
 joining function that will return the absolute path of    a combined path
 (where applicable)

---
 cloudinit/util.py | 14 ++++++++++++++
 1 file changed, 14 insertions(+)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 2f5ed275..f95a5d07 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -486,6 +486,16 @@ def mergedict(src, cand):
     return src
 
 
+@contextlib.contextmanager
+def chdir(ndir):
+    curr = os.getcwd()
+    try:
+        os.chdir(ndir)
+        yield ndir
+    finally:
+        os.chdir(curr)
+
+
 @contextlib.contextmanager
 def umask(n_msk):
     old = os.umask(n_msk)
@@ -1285,6 +1295,10 @@ def subp(args, data=None, rcs=None, env=None, capture=True, shell=False):
     return (out, err)
 
 
+def abs_join(*paths):
+    return os.path.abspath(os.path.join(*paths))
+
+
 # shellify, takes a list of commands
 #  for each entry in the list
 #    if it is an array, shell protect it (with single ticks)

From db281f731210918b1800866ef93967f82082ddea Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 26 Jun 2012 12:17:11 -0700
Subject: [PATCH 375/434] Shrink these down by using the cloudinit utils.

---
 packages/bddeb        | 179 ++++++++++++++++++------------------------
 packages/brpm         | 155 +++++++++++++++---------------------
 packages/make-tarball | 100 +++++++++--------------
 3 files changed, 180 insertions(+), 254 deletions(-)

diff --git a/packages/bddeb b/packages/bddeb
index c39965da..5f250738 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -1,15 +1,20 @@
 #!/usr/bin/python
 
-import contextlib
-import glob
 import os
 import shutil
-import subprocess
 import sys
-import tempfile
 
-import tempita
+# Use the util functions from cloudinit
+possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
+        sys.argv[0]), os.pardir, os.pardir))
+if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
+    sys.path.insert(0, possible_topdir)
 
+from cloudinit import templater
+from cloudinit import util
+
+# Package names that will showup in requires to what we can actually
+# use in our debian 'control' file
 PKG_MP = {
     'tempita': 'python-tempita',
     'boto': 'python-boto',
@@ -20,126 +25,94 @@ PKG_MP = {
     'argparse': 'python-argparse',
 }
 
-@contextlib.contextmanager
-def tmpdir():
-    t = tempfile.mkdtemp()
-    try:
-        yield t
-    finally:
-        pass
-        #shutil.rmtree(t)
 
-
-def join(*paths):
-    p = os.path.join(*paths)
-    return os.path.abspath(p)
-
-
-def tiny_p(cmd, capture=True):
-    # Darn python 2.6 doesn't have check_output (argggg)
-    info("Running %s" % (cmd))
-    stdout = subprocess.PIPE
-    stderr = subprocess.PIPE
-    if not capture:
-        stdout = None
-        stderr = None
-    sp = subprocess.Popen(cmd, stdout=stdout,
-                    stderr=stderr, stdin=None)
-    (out, err) = sp.communicate()
-    if sp.returncode not in [0]:
-        raise RuntimeError("Failed running %s [rc=%s] (%s, %s)" 
-                            % (cmd, sp.returncode, out, err))
-    return (out, err)
-
-
-def tmpl_file(name, params):
-    with open(join('debian', name), 'r') as fh:
-        contents = fh.read()
-    tpl = tempita.Template(contents)
-    return tpl.substitute(**params)
-    
-
-def write_debian(version, revno, root):
-    db_dir = join(root, 'debian')
-    os.makedirs(db_dir)
+def write_debian_folder(root, version, revno):
+    deb_dir = util.abs_join(root, 'debian')
+    os.makedirs(deb_dir)
     
     # Fill in the change log template
-    with open(join(db_dir, 'changelog'), 'w') as fh:
-        params = {
-            'version': version,
-            'revision': revno,
-        }
-        contents = tmpl_file('changelog', params) 
-        fh.write(contents)
+    templater.render_to_file(util.abs_join('debian', 'changelog'),
+                             util.abs_join(deb_dir, 'changelog'),
+                             params={
+                                 'version': version,
+                                 'revision': revno,
+                             })
 
     # Write out the control file template
-    cmd = [sys.executable, join(os.pardir, 'tools', 'read-dependencies')]
-    (stdout, _stderr) = tiny_p(cmd)
-    pkgs = stdout.splitlines()
-    requires = []
+    cmd = [sys.executable,
+            util.abs_join(os.pardir, 'tools', 'read-dependencies')]
+    (stdout, _stderr) = util.subp(cmd)
     
     # Map to known packages
-    for e in pkgs:
-        e = e.lower().strip()
+    pkgs = [p.lower().strip() for p in stdout.splitlines()]
+    requires = []
+    for p in pkgs:
         tgt_pkg = None
-        for n in PKG_MP.keys():
-            if e.find(n) != -1:
-                tgt_pkg = PKG_MP.get(n)
+        for name in PKG_MP.keys():
+            if p.find(name) != -1:
+                tgt_pkg = PKG_MP.get(name)
+                break
         if not tgt_pkg:
             raise RuntimeError(("Do not know how to translate %s to "
-                                " a known package") % (e))
+                                " a known package") % (p))
         else:
             requires.append(tgt_pkg)
-    contents = tmpl_file('control', {'requires': requires})
-    with open(join(db_dir, 'control'), 'w') as fh:
-        fh.write(contents)
+
+    templater.render_to_file(util.abs_join('debian', 'control'),
+                             util.abs_join(deb_dir, 'control'),
+                             params={'requires': requires})
     
     # Just copy the following directly
-    for fn in ['dirs', 'copyright', 'compat', 'pycompat', 'rules']:
-        shutil.copy(join('debian', fn), 
-                    join(db_dir, fn))
-
-def info(msg):
-    print("INFO: %s" % (msg))
-
-
-def warn(msg):
-    print("WARNING: %s" % (msg))
-
-
-def archive_code():
-    (stdout, _stderr) = tiny_p([sys.executable, 
-                               join(os.getcwd(), 'make-tarball')])
-    return stdout.split(None)
+    for base_fn in ['dirs', 'copyright', 'compat', 'pycompat', 'rules']:
+        shutil.copy(util.abs_join('debian', base_fn),
+                    util.abs_join(deb_dir, base_fn))
 
 
 def main():
 
-    with tmpdir() as td:
-        (revno, version, bname, archive_fn) = archive_code()
-        real_archive_fn = os.path.join(td, os.path.basename(archive_fn))
-        shutil.move(archive_fn, real_archive_fn)
-        cmd = ['tar', '-xvzf', real_archive_fn, '-C', td]
-        stdout, stderr = tiny_p(cmd)
+    with util.tempdir() as tdir:
 
-        edir = join(td, bname)
-        shutil.move(edir, join(td, 'cloud-init'))
-        write_debian(version, revno, join(td, 'cloud-init'))
+        cmd = [sys.executable,
+                 util.abs_join(os.pardir, 'tools', 'read-version')]
+        (sysout, _stderr) = util.subp(cmd)
+        version = sysout.strip()
 
-        # Seems to want an original tar ball
-        o_tar = "cloud-init_%s~%s.orig.tar.gz" % (version, revno)
-        cmd = ['tar', '-czvf', join(td, o_tar), '-C', join(td, 'cloud-init')]
-        cmd.extend(os.listdir(join(td, 'cloud-init')))
-        tiny_p(cmd)
+        cmd = ['bzr', 'revno']
+        (sysout, _stderr) = util.subp(cmd)
+        revno = sysout.strip()
+        
+        cmd = [sys.executable,
+                util.abs_join(os.getcwd(), 'make-tarball')]
+        (sysout, _stderr) = util.subp(cmd)
+        arch_fn = sysout.strip()
+
+        tmp_arch_fn = util.abs_join(tdir, os.path.basename(arch_fn))
+        shutil.move(arch_fn, tmp_arch_fn)
+
+        cmd = ['tar', '-xvzf', tmp_arch_fn, '-C', tdir]
+        util.subp(cmd)
+        
+        base_name = os.path.basename(arch_fn)[:-len(".tar.gz")]
+        shutil.move(util.abs_join(tdir, base_name), 
+                    util.abs_join(tdir, 'cloud-init'))
+        
+        write_debian_folder(util.abs_join(tdir, 'cloud-init'),
+                            version, revno)
+        
+        tar_fn = "cloud-init_%s~%s.orig.tar.gz" % (version, revno)
+        cmd = ['tar', '-czvf', 
+               util.abs_join(tdir, tar_fn), 
+               '-C', util.abs_join(tdir, 'cloud-init')]
+        cmd.extend(os.listdir(util.abs_join(tdir, 'cloud-init')))
+        util.subp(cmd)
         
         ocwd = os.getcwd()
-        os.chdir(join(td, 'cloud-init'))
-        cmd = ['debuild']
-        tiny_p(cmd, capture=False)
-
-        debname = "cloud-init_%s~bzr%s-1_all.deb" % (version, revno)
-        shutil.move(debname, join(owcwd, debname))
-        info("Wrote out debian package %s" % (join(owcwd, debname)))
+        with util.chdir(util.abs_join(tdir, 'cloud-init')):
+            util.subp(['debuild'], capture=False)
+            debname = "cloud-init_%s~bzr%s-1_all.deb" % (version, revno)
+            shutil.move(debname, util.abs_join(ocwd, debname))
+        
+        print("Wrote out debian package %s" % (util.abs_join(ocwd, debname)))
 
     return 0
 
diff --git a/packages/brpm b/packages/brpm
index db60bf81..f3ff2f58 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -11,10 +11,18 @@ import re
 
 import argparse
 
-import tempita
+# Use the util functions from cloudinit
+possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
+        sys.argv[0]), os.pardir, os.pardir))
+if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
+    sys.path.insert(0, possible_topdir)
+
+from cloudinit import templater
+from cloudinit import util
 
 from datetime import datetime
 
+
 # Mapping of expected packages to there full name...
 PKG_MP = {
     'boto': 'python-boto',
@@ -27,39 +35,10 @@ PKG_MP = {
 }
 
 
-@contextlib.contextmanager
-def tmpdir():
-    t = tempfile.mkdtemp()
-    try:
-        yield t
-    finally:
-        shutil.rmtree(t)
-
-
-def join(*paths):
-    p = os.path.join(*paths)
-    return os.path.abspath(p)
-
-
-def tiny_p(cmd, capture=True):
-    # Darn python 2.6 doesn't have check_output (argggg)
-    info("Running %s" % (cmd))
-    stdout = subprocess.PIPE
-    stderr = subprocess.PIPE
-    if not capture:
-        stdout = None
-        stderr = None
-    sp = subprocess.Popen(cmd, stdout=stdout,
-                    stderr=stderr, stdin=None)
-    (out, err) = sp.communicate()
-    if sp.returncode not in [0]:
-        raise RuntimeError("Failed running %s [rc=%s] (%s, %s)" 
-                            % (cmd, sp.returncode, out, err))
-    return (out, err)
-
 def get_log_header(version):
+    # Try to find the version in the tags output
     cmd = ['bzr', 'tags']
-    (stdout, _stderr) = tiny_p(cmd)
+    (stdout, _stderr) = util.subp(cmd)
     a_rev = None
     for t in stdout.splitlines():
         ver, rev = t.split(None)
@@ -69,11 +48,14 @@ def get_log_header(version):
     if not a_rev:
         return format_change_line(datetime.now(),
                                   '??', version)
+    
+    # Extract who made that tag as the header
     cmd = ['bzr', 'log', '-r%s' % (a_rev), '--timezone=utc']
-    (stdout, _stderr) = tiny_p(cmd)
+    (stdout, _stderr) = util.subp(cmd)
     kvs = {
         'comment': version,
     }
+
     for line in stdout.splitlines():
         if line.startswith('committer:'):
             kvs['who'] = line[len('committer:'):].strip()
@@ -84,74 +66,73 @@ def get_log_header(version):
             ts = ts.replace("+0000", '').strip()
             ds = datetime.strptime(ts, '%a %Y-%m-%d %H:%M:%S')
             kvs['ds'] = ds
+
     return format_change_line(**kvs)
 
+
 def format_change_line(ds, who, comment=None):
-    d = format_rpm_date(ds)
+    d = ds.strftime("%a %b %d %Y")
     d += " - %s" % (who)
     if comment:
         d += " - %s" % (comment)
     return "* %s" % (d)
 
 
-def format_rpm_date(ds):
-    return ds.strftime("%a %b %d %Y")
+def generate_spec_contents(args, tmpl_fn):
 
-
-def info(msg):
-    print("INFO: %s" % (msg))
-
-
-def warn(msg):
-    print("WARNING: %s" % (msg))
-
-
-def generate_spec_contents(args, tmpl_fn, revno, version):
+    # Figure out the version and revno
+    cmd = [sys.executable,
+            util.abs_join(os.pardir, 'tools', 'read-version')]
+    (stdout, _stderr) = util.subp(cmd)
+    version = stdout.strip()
+    
+    cmd = ['bzr', 'revno']
+    (stdout, _stderr) = util.subp(cmd)
+    revno = stdout.strip()
 
     # Tmpl params
     subs = {}
     subs['version'] = version
     subs['revno'] = revno
     subs['release'] = revno
-    subs['archive_name'] = '%{name}-%{version}-' + subs['revno'] + '.tar.gz'
+    subs['archive_name'] = '%{name}-%{version}-' + revno + '.tar.gz'
     subs['bd_requires'] = ['python-devel', 'python-setuptools']
 
-    requires = []
-    cmd = [sys.executable, join(os.pardir, 'tools', 'read-dependencies')]
-    (stdout, _stderr) = tiny_p(cmd)
-    pkgs = stdout.splitlines()
-    
+    cmd = [sys.executable, 
+            util.abs_join(os.pardir, 'tools', 'read-dependencies')]
+    (stdout, _stderr) = util.subp(cmd)
+
     # Map to known packages
-    for e in pkgs:
-        e = e.lower().strip()
+    pkgs = [p.lower().strip() for p in stdout.splitlines()]
+
+    # Map to known packages
+    requires = []
+    for p in pkgs:
         tgt_pkg = None
-        for n in PKG_MP.keys():
-            if e.find(n) != -1:
-                tgt_pkg = PKG_MP.get(n)
+        for name in PKG_MP.keys():
+            if p.find(name) != -1:
+                tgt_pkg = PKG_MP.get(name)
+                break
         if not tgt_pkg:
             raise RuntimeError(("Do not know how to translate %s to "
-                                " a known package") % (e))
+                                " a known package") % (p))
         else:
             requires.append(tgt_pkg)
-
-    base_name = 'cloud-init-%s-%s' % (version, subs['revno'])
     subs['requires'] = requires
 
     # Format a nice changelog (as best as we can)
-    changelog = ''
-    with open(join(os.pardir, 'ChangeLog')) as fh:
-        changelog = fh.read()
-    ch_lines = []
+    changelog = util.load_file(util.abs_join(os.pardir, 'ChangeLog'))
+    changelog_lines = []
     for line in changelog.splitlines():
         if not line.strip():
             continue
         if re.match(r"^\s*[\d][.][\d][.][\d]:\s*", line):
             line = line.strip(":")
             header = get_log_header(line)
-            ch_lines.append(header)
+            changelog_lines.append(header)
         else:
-            ch_lines.append(line)
-    subs['changelog'] = "\n".join(ch_lines)
+            changelog_lines.append(line)
+    subs['changelog'] = "\n".join(changelog_lines)
 
     # See: http://www.zarb.org/~jasonc/macros.php
     # Pickup any special files
@@ -174,6 +155,7 @@ def generate_spec_contents(args, tmpl_fn, revno, version):
         '%{_bindir}/*',
         '/usr/lib/cloud-init/*',
     ]
+
     # Since setup.py installs them
     # all, we need to selectively 
     # knock off the wrong ones and
@@ -192,10 +174,7 @@ def generate_spec_contents(args, tmpl_fn, revno, version):
     subs['post_remove'] = post_remove
     subs['files'] = other_files
     
-    with open(tmpl_fn, 'r') as fh:
-        tmpl = tempita.Template(fh.read())
-        contents = tmpl.substitute(**subs)
-        return contents
+    return templater.render_from_file(tmpl_fn, params=subs)
 
 
 def archive_code():
@@ -216,31 +195,28 @@ def main():
 
     # Clean out the root dir and make sure the dirs we want are in place
     root_dir = os.path.expanduser("~/rpmbuild")
-    info("Cleaning %r" % (root_dir))
     if os.path.isdir(root_dir):
         shutil.rmtree(root_dir)
-    arc_dir = os.path.join(root_dir, 'SOURCES')
-    for d in [root_dir, arc_dir]:
-        os.makedirs(d)
-        
+    arc_dir = util.abs_join(root_dir, 'SOURCES')
+    util.ensure_dirs([root_dir, arc_dir])
+
     # Archive the code
-    (revno, version, archive_fn) = archive_code()
+    cmd = [sys.executable,
+            util.abs_join(os.getcwd(), 'make-tarball')]
+    (stdout, _stderr) = util.subp(cmd)
+    archive_fn = stdout.strip()
     real_archive_fn = os.path.join(arc_dir, os.path.basename(archive_fn))
     shutil.move(archive_fn, real_archive_fn)
-    info("Archived code to %r" % (real_archive_fn))
 
     # Form the spec file to be used
-    tmpl_fn = os.path.join(os.getcwd(), 'redhat', 'cloud-init.spec')
-    info("Generating spec file from template %r" % (tmpl_fn))
-    contents = generate_spec_contents(args, tmpl_fn, revno, version)
+    tmpl_fn = util.abs_join(os.getcwd(), 'redhat', 'cloud-init.spec')
+    contents = generate_spec_contents(args, tmpl_fn)
     spec_fn = os.path.join(root_dir, 'cloud-init.spec')
-    with open(spec_fn, 'w') as fh:
-        fh.write(contents)
-        info("Wrote spec file to %r" % (spec_fn))
+    util.write_file(spec_fn, contents)
 
     # Now build it!
     cmd = ['rpmbuild', '-ba', spec_fn]
-    tiny_p(cmd, capture=False)
+    util.subp(cmd, capture=False)
     info("Rpmbuild completed!")
 
     # Copy the items built to our local dir
@@ -251,11 +227,10 @@ def main():
                            (os.path.join(root_dir, 'RPMS'))))
     globs.extend(glob.glob("%s/*.rpm" %
                            (os.path.join(root_dir, 'SRPMS'))))
-    for fn in globs:
-        n = os.path.basename(fn)
-        tgt_fn = os.path.join(os.getcwd(), n)
-        shutil.move(fn, tgt_fn)
-        info("Copied %s to %s" % (n, tgt_fn))
+    for rpm_fn in globs:
+        tgt_fn = util.abs_join(os.getcwd(), os.path.basename(rpm_fn))
+        shutil.move(rpm_fn, tgt_fn)
+        print(tgt_fn)
 
     return 0
 
diff --git a/packages/make-tarball b/packages/make-tarball
index 98f669a9..479e11af 100755
--- a/packages/make-tarball
+++ b/packages/make-tarball
@@ -8,78 +8,56 @@ import sys
 import tempfile
 
 
-def join(*paths):
-    p = os.path.join(*paths)
-    return os.path.abspath(p)
-
-
-def tiny_p(cmd):
-    # Darn python 2.6 doesn't have check_output (argggg)
-    sp = subprocess.Popen(cmd, stdout=subprocess.PIPE,
-                    stderr=subprocess.PIPE, stdin=None)
-    (out, err) = sp.communicate()
-    if sp.returncode not in [0]:
-        raise RuntimeError("Failed running %s [rc=%s] (%s, %s)" 
-                            % (cmd, sp.returncode, out, err))
-    return (out, err)
-
-
-@contextlib.contextmanager
-def tmpdir():
-    t = tempfile.mkdtemp()
-    try:
-        yield t
-    finally:
-        shutil.rmtree(t)
+# Use the util functions from cloudinit
+possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
+        sys.argv[0]), os.pardir, os.pardir))
+if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
+    sys.path.insert(0, possible_topdir)
 
+from cloudinit import util
 
 
 def main(args):
-    
-    tag = None
+
+    base_fn = None
     if args:
-        tag = args[0]
+        base_fn = args[0]
 
-    with tmpdir() as td:
-        (stdout, _stderr) = tiny_p(['bzr', 'revno'])
-        revno = stdout.strip()
+    with util.tempdir() as tdir:
 
-        cmd = [sys.executable, join(os.pardir, 'tools', 'read-version')]
-        (stdout, _stderr) = tiny_p(cmd)
-        version = stdout.strip()
+        if not base_fn:
+            (stdout, _stderr) = util.subp(['bzr', 'revno'])
+            revno = stdout.strip()
+    
+            cmd = [sys.executable,
+                   util.abs_join(os.pardir, 'tools', 'read-version')]
+            (stdout, _stderr) = util.subp(cmd)
+            version = stdout.strip()
+            base_fn = 'cloud-init-%s-%s' % (version, revno)
 
-        owcd = os.getcwd()
-        os.chdir(os.path.abspath(os.pardir))
-        if not os.path.exists('setup.py'):
-            raise RuntimeError("No setup.py found in %s" % (os.getcwd()))
+        util.ensure_dir(util.abs_join(tdir, base_fn))
+        arch_fn = '%s.tar.gz' % (base_fn)
 
-        cmd = ['bzr', 'ls', '--versioned']
-        (stdout, _stderr) = tiny_p(cmd)
-        fns = []
-        for fn in stdout.splitlines():
-            fn = fn.strip()
-            if not fn or fn.startswith("."):
-                continue
-            fns.append(fn)
-        bfn = 'cloud-init-%s-%s' % (version, revno)
-        os.makedirs(join(td, bfn))
-        
-        for fn in fns:
-            if os.path.isfile(fn):
-                shutil.copy(fn, join(td, bfn, fn))
-            else:
-                shutil.copytree(fn, join(td, bfn, fn))
+        with util.chdir(os.pardir):
+            (stdout, _stderr) = util.subp(['bzr', 'ls', '--versioned'])
+            fns = [fn for fn in stdout.splitlines() 
+                          if fn and not fn.startswith('.')]
+            # TODO - only copy the right files
+            # ie do a recursive versioned...
+            for fn in fns:
+                if os.path.isfile(fn):
+                    shutil.copy(fn, util.abs_join(tdir, base_fn, fn))
+                else:
+                    shutil.copytree(fn, util.abs_join(tdir, base_fn, fn))
 
-        fn = '%s.tar.gz' % (bfn)
-        o_fn = join(td, fn)
-        cmd = ['tar', '-czf', o_fn, '-C', join(td), bfn]
-        tiny_p(cmd)
+        cmd = ['tar', '-czf',
+                util.abs_join(tdir, arch_fn), 
+                '-C', tdir, base_fn]
+        util.subp(cmd)
 
-        os.chdir(owcd)
-        shutil.move(o_fn, fn)
-
-        out = [revno, version, bfn, os.path.abspath(fn)]
-        print('\t'.join(out))
+        shutil.move(util.abs_join(tdir, arch_fn),
+                    util.abs_join(os.getcwd(), arch_fn))
+        print(os.path.abspath(arch_fn))
         
     return 0
 

From df891da83183da0ee675e531a4f29f991e994eab Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 26 Jun 2012 13:08:31 -0700
Subject: [PATCH 376/434] 1. Fix old info call.

---
 packages/brpm | 1 -
 1 file changed, 1 deletion(-)

diff --git a/packages/brpm b/packages/brpm
index f3ff2f58..6870e172 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -217,7 +217,6 @@ def main():
     # Now build it!
     cmd = ['rpmbuild', '-ba', spec_fn]
     util.subp(cmd, capture=False)
-    info("Rpmbuild completed!")
 
     # Copy the items built to our local dir
     globs = [] 

From 6355fa52776c33150c50e421272b139f207d5fae Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 26 Jun 2012 15:20:07 -0700
Subject: [PATCH 377/434] 1. Add 'verbose' options to both. 2. Fixup the debian
 building after util changes

---
 packages/bddeb | 39 +++++++++++++++++++++++++++++++--------
 packages/brpm  | 10 +++++++++-
 2 files changed, 40 insertions(+), 9 deletions(-)

diff --git a/packages/bddeb b/packages/bddeb
index 5f250738..9015585b 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -13,6 +13,8 @@ if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
 from cloudinit import templater
 from cloudinit import util
 
+import argparse
+
 # Package names that will showup in requires to what we can actually
 # use in our debian 'control' file
 PKG_MP = {
@@ -70,6 +72,23 @@ def write_debian_folder(root, version, revno):
 
 def main():
 
+    parser = argparse.ArgumentParser()
+    parser.add_argument("-n", "--no-sign", dest="sign",
+                        help=("attempt to sign "
+                              "the package (default: %(default)s)"),
+                        default=True,
+                        action='store_false')
+    parser.add_argument("-v", "--verbose", dest="verbose",
+                        help=("run verbosely"
+                              " (default: %(default)s)"),
+                        default=False,
+                        action='store_true')
+    args = parser.parse_args()
+
+    capture = True
+    if args.verbose:
+        capture = False
+
     with util.tempdir() as tdir:
 
         cmd = [sys.executable,
@@ -95,24 +114,28 @@ def main():
         base_name = os.path.basename(arch_fn)[:-len(".tar.gz")]
         shutil.move(util.abs_join(tdir, base_name), 
                     util.abs_join(tdir, 'cloud-init'))
-        
+
         write_debian_folder(util.abs_join(tdir, 'cloud-init'),
                             version, revno)
-        
+
         tar_fn = "cloud-init_%s~%s.orig.tar.gz" % (version, revno)
         cmd = ['tar', '-czvf', 
                util.abs_join(tdir, tar_fn), 
                '-C', util.abs_join(tdir, 'cloud-init')]
         cmd.extend(os.listdir(util.abs_join(tdir, 'cloud-init')))
         util.subp(cmd)
+        shutil.copy(util.abs_join(tdir, tar_fn), tar_fn)
+        print("Wrote out archive %r" % (util.abs_join(tar_fn)))
         
-        ocwd = os.getcwd()
         with util.chdir(util.abs_join(tdir, 'cloud-init')):
-            util.subp(['debuild'], capture=False)
-            debname = "cloud-init_%s~bzr%s-1_all.deb" % (version, revno)
-            shutil.move(debname, util.abs_join(ocwd, debname))
-        
-        print("Wrote out debian package %s" % (util.abs_join(ocwd, debname)))
+            cmd = ['debuild']
+            if not args.sign:
+                cmd.extend(['-us', '-uc'])
+            util.subp(cmd, capture=capture)
+
+        debname = "cloud-init_%s~%s-1_all.deb" % (version, revno)
+        shutil.move(util.abs_join(tdir, debname), debname)
+        print("Wrote out debian package %r" % (util.abs_join(debname)))
 
     return 0
 
diff --git a/packages/brpm b/packages/brpm
index 6870e172..b7246d8d 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -191,7 +191,15 @@ def main():
                         help="select boot type (default: %(default)s)", 
                         metavar="TYPE", default='initd',
                         choices=['upstart', 'initd', 'systemd'])
+    parser.add_argument("-v", "--verbose", dest="verbose",
+                        help=("run verbosely"
+                              " (default: %(default)s)"),
+                        default=False,
+                        action='store_true')
     args = parser.parse_args()
+    capture = True
+    if args.verbose:
+        capture = False
 
     # Clean out the root dir and make sure the dirs we want are in place
     root_dir = os.path.expanduser("~/rpmbuild")
@@ -216,7 +224,7 @@ def main():
 
     # Now build it!
     cmd = ['rpmbuild', '-ba', spec_fn]
-    util.subp(cmd, capture=False)
+    util.subp(cmd, capture=capture)
 
     # Copy the items built to our local dir
     globs = [] 

From abe83d376da3f76a6461113068ea8045e6cfb7df Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 27 Jun 2012 16:32:41 -0700
Subject: [PATCH 378/434] Take only the files in the directory, not the
 directory itself (this causes issues when installing)

---
 packages/brpm | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/packages/brpm b/packages/brpm
index b7246d8d..2adbfc95 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -170,7 +170,8 @@ def generate_spec_contents(args, tmpl_fn):
         if k != args.boot:
             post_remove.append(v)
         else:
-            other_files.append(v)
+            take = v + "*"
+            other_files.append(take)
     subs['post_remove'] = post_remove
     subs['files'] = other_files
     

From ba9a454c03cfdf3f53db87f67dd30e59198f33ba Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 27 Jun 2012 17:07:42 -0700
Subject: [PATCH 379/434] No longer need to do this special config appending,
 the config merger class handles this.

---
 bin/cloud-init | 8 +-------
 1 file changed, 1 insertion(+), 7 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index 68c7ba76..0b879876 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -253,13 +253,7 @@ def main_modules(action_name, args):
         util.logexc(LOG, 'Can not apply stage %s, no datasource found!', name)
         return 1
     # Stage 3
-    mod_cfgs = extract_fns(args)
-    cc_cfg = init.paths.get_ipath_cur('cloud_config')
-    if settings.CFG_ENV_NAME in os.environ:
-        cc_cfg = os.environ[settings.CFG_ENV_NAME]
-    if cc_cfg and os.path.exists(cc_cfg):
-        mod_cfgs.append(cc_cfg)
-    mods = stages.Modules(init, mod_cfgs)
+    mods = stages.Modules(init, extract_fns(args))
     # Stage 4
     try:
         LOG.debug("Closing stdin")

From 1c8027e0e21eed17039a7d28ac5b7ddd4645076a Mon Sep 17 00:00:00 2001
From: Scott Moser <smoser@ubuntu.com>
Date: Thu, 28 Jun 2012 16:46:11 -0400
Subject: [PATCH 380/434] change upstart jobs to use single 'cloud-init' binary

This just updates upstart jobs to the new single binary approach.
---
 upstart/cloud-config.conf     | 2 +-
 upstart/cloud-final.conf      | 2 +-
 upstart/cloud-init-local.conf | 2 +-
 upstart/cloud-init.conf       | 2 +-
 4 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/upstart/cloud-config.conf b/upstart/cloud-config.conf
index 5edc58b9..3ac113f3 100644
--- a/upstart/cloud-config.conf
+++ b/upstart/cloud-config.conf
@@ -5,4 +5,4 @@ start on (filesystem and started rsyslog)
 console output
 task
 
-exec cloud-init-cfg all config
+exec cloud-init modules --mode=config
diff --git a/upstart/cloud-final.conf b/upstart/cloud-final.conf
index a04105a1..72ae5052 100644
--- a/upstart/cloud-final.conf
+++ b/upstart/cloud-final.conf
@@ -7,4 +7,4 @@ start on (stopped rc RUNLEVEL=[2345] and stopped cloud-config)
 console output
 task
 
-exec cloud-init-cfg all final
+exec cloud-init modules --mode=final
diff --git a/upstart/cloud-init-local.conf b/upstart/cloud-init-local.conf
index b6eb21b4..061fe406 100644
--- a/upstart/cloud-init-local.conf
+++ b/upstart/cloud-init-local.conf
@@ -6,4 +6,4 @@ task
 
 console output
 
-exec /usr/bin/cloud-init start-local
+exec /usr/bin/cloud-init init --local  
diff --git a/upstart/cloud-init.conf b/upstart/cloud-init.conf
index b9be5981..41ddd284 100644
--- a/upstart/cloud-init.conf
+++ b/upstart/cloud-init.conf
@@ -6,4 +6,4 @@ task
 
 console output
 
-exec /usr/bin/cloud-init start
+exec /usr/bin/cloud-init init

From 29cad69e2e0e8c98c1b990e6d6b70e5d8c507beb Mon Sep 17 00:00:00 2001
From: Scott Moser <smoser@ubuntu.com>
Date: Thu, 28 Jun 2012 16:48:18 -0400
Subject: [PATCH 381/434] packages/debian/rules: remove unused quilt section

---
 packages/debian/rules | 13 -------------
 1 file changed, 13 deletions(-)

diff --git a/packages/debian/rules b/packages/debian/rules
index a907b594..1739f4cf 100755
--- a/packages/debian/rules
+++ b/packages/debian/rules
@@ -12,16 +12,3 @@ DEB_DH_INSTALL_SOURCEDIR := debian/tmp
 cloud-init-fixups:
 	install -d $(DEB_DESTDIR)/etc/rsyslog.d
 	cp tools/21-cloudinit.conf $(DEB_DESTDIR)/etc/rsyslog.d/21-cloudinit.conf
-
-# You only need to run this immediately after checking out the package from
-# revision control.
-# http://bugs.debian.org/cgi-bin/bugreport.cgi?bug=572204
-quilt-setup:
-	@[ ! -d .pc ] || { echo ".pc exists. remove it and re-run to start fresh"; exit 1; }
-	set -e; for patch in $$(quilt series | tac); do \
-		patch -p1 -R --no-backup-if-mismatch <"debian/patches/$$patch"; \
-	done
-	quilt push -a
-
-.PHONY: quilt-setup
-

From a47bfae2ee7b148c641f5bc5917678dd14ba1ba4 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 28 Jun 2012 15:13:19 -0700
Subject: [PATCH 382/434] 1. Update with smoser's code review and comments (and
 put some of those comments into the files) 2. Rename consume() to
 consume_userdata() as it helps in figuring out what this does. 3. Fixup the
 tests due to #2

---
 bin/cloud-init                   | 49 +++++++++++++++++++++++---------
 cloudinit/stages.py              | 19 ++++++-------
 tests/unittests/test_userdata.py | 10 +++----
 3 files changed, 49 insertions(+), 29 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index 0b879876..d3ef092f 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -34,13 +34,15 @@ if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
 
 from cloudinit import log as logging
 from cloudinit import netinfo
-from cloudinit import settings
 from cloudinit import sources
 from cloudinit import stages
 from cloudinit import templater
 from cloudinit import util
 from cloudinit import version
 
+from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS, PER_ONCE,
+                                CLOUD_CONFIG)
+
 
 # Module section template
 MOD_SECTION_TPL = "cloud_%s_modules"
@@ -54,9 +56,9 @@ QUERY_DATA_TYPES = [
 
 # Frequency shortname to full name
 FREQ_SHORT_NAMES = {
-    'instance': settings.PER_INSTANCE,
-    'always': settings.PER_ALWAYS,
-    'once': settings.PER_ONCE,
+    'instance': PER_INSTANCE,
+    'always': PER_ALWAYS,
+    'once': PER_ONCE,
 }
 
 LOG = logging.getLogger()
@@ -111,8 +113,15 @@ def main_init(name, args):
         deps = [sources.DEP_FILESYSTEM]
 
     if not args.local:
-        # TODO: What is this for??
-        root_name = "%s.d" % (settings.CLOUD_CONFIG)
+        # See doc/kernel-cmdline.txt
+        #
+        # This is used in maas datasource, in "ephemeral" (read-only root)
+        # environment where the instance netboots to iscsi ro root.
+        # and the entity that controls the pxe config has to configure
+        # the maas datasource.
+        #
+        # Could be used elsewhere, only works on network based (not local).
+        root_name = "%s.d" % (CLOUD_CONFIG)
         target_fn = os.path.join(root_name, "91_kernel_cmdline_url.cfg")
         util.read_write_cmdline_url(target_fn)
 
@@ -194,22 +203,34 @@ def main_init(name, args):
         init.fetch()
     except sources.DataSourceNotFoundException:
         util.logexc(LOG, "No instance datasource found!")
-        # TODO: Return 0 or 1??
-        return 1
+        # In the case of cloud-init (net mode) it is a bit
+        # more likely that the user would consider it
+        # failure if nothing was found. When using
+        # upstart it will also mentions job failure
+        # in console log if exit code is != 0.
+        if args.local:
+            return 0
+        else:
+            return 1
     # Stage 6
     iid = init.instancify()
     LOG.debug("%s will now be targeting instance id: %s", name, iid)
     init.update()
     # Stage 7
     try:
+        # Attempt to consume the data per instance.
+        # This may run user-data handlers and/or perform
+        # url downloads and such as needed.
         (ran, _results) = init.cloudify().run('consume_userdata',
-                                             init.consume,
-                                             args=[settings.PER_INSTANCE],
-                                             freq=settings.PER_INSTANCE)
+                                             init.consume_userdata,
+                                             args=[PER_INSTANCE],
+                                             freq=PER_INSTANCE)
         if not ran:
-            # Just consume anything that is set to run per
-            # always if nothing ran in the per instance section
-            init.consume(settings.PER_ALWAYS)
+            # Just consume anything that is set to run per-always
+            # if nothing ran in the per-instance code
+            #
+            # TODO: should this always happen?? (even if the above runs?)
+            init.consume_userdata(PER_ALWAYS)
     except Exception:
         util.logexc(LOG, "Consuming user data failed!")
         return 1
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 47f6e188..6689e4c9 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -192,13 +192,13 @@ class Init(object):
         cfg_list = self.cfg.get('datasource_list') or []
         return (cfg_list, pkg_list)
 
-    def _get_data_source(self, local_only=False):
+    def _get_data_source(self):
         if self.datasource:
             return self.datasource
         ds = self._restore_from_cache()
         if ds:
             LOG.debug("Restored from cache, datasource: %s", ds)
-        if not ds and not local_only:
+        if not ds:
             (cfg_list, pkg_list) = self._get_datasources()
             # Deep copy so that user-data handlers can not modify
             # (which will affect user-data handlers down the line...)
@@ -209,11 +209,10 @@ class Init(object):
                                                cfg_list,
                                                pkg_list)
             LOG.debug("Loaded datasource %s - %s", dsname, ds)
-        if ds:
-            self.datasource = ds
-            # Ensure we adjust our path members datasource
-            # now that we have one (thus allowing ipath to be used)
-            self.paths.datasource = ds
+        self.datasource = ds
+        # Ensure we adjust our path members datasource
+        # now that we have one (thus allowing ipath to be used)
+        self.paths.datasource = ds
         return ds
 
     def _get_instance_subdirs(self):
@@ -275,8 +274,8 @@ class Init(object):
                         "%s\n" % (previous_iid))
         return iid
 
-    def fetch(self, local_only=False):
-        return self._get_data_source(local_only)
+    def fetch(self):
+        return self._get_data_source()
 
     def instancify(self):
         return self._reflect_cur_instance()
@@ -312,7 +311,7 @@ class Init(object):
         ]
         return def_handlers
 
-    def consume(self, frequency=PER_INSTANCE):
+    def consume_userdata(self, frequency=PER_INSTANCE):
         cdir = self.paths.get_cpath("handlers")
         idir = self._get_ipath("handlers")
 
diff --git a/tests/unittests/test_userdata.py b/tests/unittests/test_userdata.py
index eeddde7d..861642b6 100644
--- a/tests/unittests/test_userdata.py
+++ b/tests/unittests/test_userdata.py
@@ -68,7 +68,7 @@ class TestConsumeUserData(MockerTestCase):
 
         log_file = self.capture_log(logging.WARNING)
         ci.fetch()
-        ci.consume()
+        ci.consume_userdata()
         self.assertIn(
             "Unhandled non-multipart (text/x-not-multipart) userdata:",
             log_file.getvalue())
@@ -85,7 +85,7 @@ class TestConsumeUserData(MockerTestCase):
 
         log_file = self.capture_log(logging.WARNING)
         ci.fetch()
-        ci.consume()
+        ci.consume_userdata()
         self.assertIn(
             "Unhandled unknown content-type (text/plain)",
             log_file.getvalue())
@@ -104,7 +104,7 @@ class TestConsumeUserData(MockerTestCase):
 
         log_file = self.capture_log(logging.WARNING)
         ci.fetch()
-        ci.consume()
+        ci.consume_userdata()
         self.assertEqual("", log_file.getvalue())
 
     def test_mime_text_x_shellscript(self):
@@ -122,7 +122,7 @@ class TestConsumeUserData(MockerTestCase):
 
         log_file = self.capture_log(logging.WARNING)
         ci.fetch()
-        ci.consume()
+        ci.consume_userdata()
         self.assertEqual("", log_file.getvalue())
 
     def test_mime_text_plain_shell(self):
@@ -140,5 +140,5 @@ class TestConsumeUserData(MockerTestCase):
 
         log_file = self.capture_log(logging.WARNING)
         ci.fetch()
-        ci.consume()
+        ci.consume_userdata()
         self.assertEqual("", log_file.getvalue())

From d4e29b84c6e07499afbbcf6a2d1bdd3adaa97907 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 28 Jun 2012 15:35:33 -0700
Subject: [PATCH 383/434] Continue working on removing and allowing the correct
 files in the generated spec file

---
 packages/brpm | 51 +++++++++++++++++++++++++++++++++------------------
 1 file changed, 33 insertions(+), 18 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index 2adbfc95..51242e54 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -154,27 +154,41 @@ def generate_spec_contents(args, tmpl_fn):
     other_files = [
         '%{_bindir}/*',
         '/usr/lib/cloud-init/*',
+        '/etc/init/*',
+        '/etc/systemd/*',
+        '/etc/init.d/*',
     ]
 
-    # Since setup.py installs them
-    # all, we need to selectively 
-    # knock off the wrong ones and
-    # ensure the right one is kept
-    post_remove_keep = {
-        'initd': '/etc/init.d/',
-        'systemd': '/etc/systemd/',
-        'upstart': '/etc/init/',
+    # Since setup.py installs them all, we need to selectively
+    # remove the wrong ones and ensure the right one/s are kept
+    # for the boot mode that is desired...
+    post_remove = { 
+        'initd': [
+            '/etc/init.d/cloud-init-local',
+            '/etc/systemd/',
+            '/etc/init/',
+        ],
+        'initd-local': [
+            '/etc/init.d/cloud-init',
+            '/etc/systemd/',
+            '/etc/init/',
+        ],
+        # It seems like systemd can work with
+        # all of its files being 'active' (and not have naming
+        # or event name conflicts??)
+        'systemd': [
+            '/etc/init.d/',
+            '/etc/init/',
+        ],
+        'upstart': [
+            '/etc/init/cloud-init-nonet.conf',
+            '/etc/init/cloud-init-local.conf',
+            '/etc/init/',
+            '/etc/systemd/',
+        ],
     }
-    post_remove = []
-    for (k, v) in post_remove_keep.iteritems():
-        if k != args.boot:
-            post_remove.append(v)
-        else:
-            take = v + "*"
-            other_files.append(take)
-    subs['post_remove'] = post_remove
+    subs['post_remove'] = post_remove[args.boot]
     subs['files'] = other_files
-    
     return templater.render_from_file(tmpl_fn, params=subs)
 
 
@@ -191,7 +205,8 @@ def main():
     parser.add_argument("-b", "--boot", dest="boot",
                         help="select boot type (default: %(default)s)", 
                         metavar="TYPE", default='initd',
-                        choices=['upstart', 'initd', 'systemd'])
+                        choices=('upstart', 'initd', 'systemd',
+                                 'upstart-local', 'initd-local'))
     parser.add_argument("-v", "--verbose", dest="verbose",
                         help=("run verbosely"
                               " (default: %(default)s)"),

From d86f4a39f23373ff497a3eb7796f319d6c841a7d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 28 Jun 2012 15:41:54 -0700
Subject: [PATCH 384/434] 1. Match the variable names with what they are used
 for 2. Create a set of directories that need to be kept for the different
 boot modes.

---
 packages/brpm | 27 +++++++++++++++++++++++++--
 1 file changed, 25 insertions(+), 2 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index 51242e54..d2ff06f0 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -162,7 +162,7 @@ def generate_spec_contents(args, tmpl_fn):
     # Since setup.py installs them all, we need to selectively
     # remove the wrong ones and ensure the right one/s are kept
     # for the boot mode that is desired...
-    post_remove = { 
+    boot_remove = { 
         'initd': [
             '/etc/init.d/cloud-init-local',
             '/etc/systemd/',
@@ -186,8 +186,31 @@ def generate_spec_contents(args, tmpl_fn):
             '/etc/init/',
             '/etc/systemd/',
         ],
+        'upstart-local': [
+            '/etc/init/cloud-init.conf',
+            '/etc/init/',
+            '/etc/systemd/',
+        ]
     }
-    subs['post_remove'] = post_remove[args.boot]
+    boot_keep = [
+        'systemd': [
+            '/etc/systemd/*',
+        ],
+        'upstart': [
+            '/etc/init/*',
+        ],
+        'upstart-local': [
+            '/etc/init/*',
+        ],
+        'initd-local': [
+            '/etc/init.d/*',
+        ],
+        'initd': [
+            '/etc/init.d/*',
+        ],
+    ]
+    subs['post_remove'] = boot_remove[args.boot]
+    other_files.extend(boot_keep[args.boot]
     subs['files'] = other_files
     return templater.render_from_file(tmpl_fn, params=subs)
 

From 9ff64388d23a89e146895b27c46edaa619a07f55 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 28 Jun 2012 15:42:37 -0700
Subject: [PATCH 385/434] Remove the 'keep all the init directories' entries,
 which didn't work

---
 packages/brpm | 3 ---
 1 file changed, 3 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index d2ff06f0..0826364f 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -154,9 +154,6 @@ def generate_spec_contents(args, tmpl_fn):
     other_files = [
         '%{_bindir}/*',
         '/usr/lib/cloud-init/*',
-        '/etc/init/*',
-        '/etc/systemd/*',
-        '/etc/init.d/*',
     ]
 
     # Since setup.py installs them all, we need to selectively

From 539f2f5a1b6a92c6679178164c60c4ff58ccdb32 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 28 Jun 2012 16:13:23 -0700
Subject: [PATCH 386/434] Syntax error fixup

---
 packages/brpm | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index 0826364f..44fd24b3 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -189,7 +189,7 @@ def generate_spec_contents(args, tmpl_fn):
             '/etc/systemd/',
         ]
     }
-    boot_keep = [
+    boot_keep = {
         'systemd': [
             '/etc/systemd/*',
         ],
@@ -205,9 +205,9 @@ def generate_spec_contents(args, tmpl_fn):
         'initd': [
             '/etc/init.d/*',
         ],
-    ]
+    }
     subs['post_remove'] = boot_remove[args.boot]
-    other_files.extend(boot_keep[args.boot]
+    other_files.extend(boot_keep[args.boot])
     subs['files'] = other_files
     return templater.render_from_file(tmpl_fn, params=subs)
 

From 6cffaf4caa5085524c8ec2c43f3bbeeab5b33e26 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Thu, 28 Jun 2012 16:32:47 -0700
Subject: [PATCH 387/434] Fix chopping off the wrong folders, oops

---
 packages/brpm | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index 44fd24b3..bbf30565 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -162,11 +162,13 @@ def generate_spec_contents(args, tmpl_fn):
     boot_remove = { 
         'initd': [
             '/etc/init.d/cloud-init-local',
+            # Remove the other auto-start folders
             '/etc/systemd/',
             '/etc/init/',
         ],
         'initd-local': [
             '/etc/init.d/cloud-init',
+            # Remove the other auto-start folders
             '/etc/systemd/',
             '/etc/init/',
         ],
@@ -174,18 +176,21 @@ def generate_spec_contents(args, tmpl_fn):
         # all of its files being 'active' (and not have naming
         # or event name conflicts??)
         'systemd': [
+            # Remove the other auto-start folders
             '/etc/init.d/',
             '/etc/init/',
         ],
         'upstart': [
             '/etc/init/cloud-init-nonet.conf',
             '/etc/init/cloud-init-local.conf',
-            '/etc/init/',
+            # Remove the other auto-start folders
+            '/etc/init.d/',
             '/etc/systemd/',
         ],
         'upstart-local': [
             '/etc/init/cloud-init.conf',
-            '/etc/init/',
+            # Remove the other auto-start folders
+            '/etc/init.d/',
             '/etc/systemd/',
         ]
     }

From 67cfabecbfbbb1386ead703332833f17a2a220c3 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 11:41:15 -0700
Subject: [PATCH 388/434] Add a message about why the second consume_userdata
 occurs since it's not very obvious.

---
 bin/cloud-init | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index d3ef092f..025195d4 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -229,7 +229,8 @@ def main_init(name, args):
             # Just consume anything that is set to run per-always
             # if nothing ran in the per-instance code
             #
-            # TODO: should this always happen?? (even if the above runs?)
+            # See: https://bugs.launchpad.net/bugs/819507 for a little
+            # reason behind this...
             init.consume_userdata(PER_ALWAYS)
     except Exception:
         util.logexc(LOG, "Consuming user data failed!")

From 79844379fba5f7807448f09bf624d57f51eb9ac2 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 11:41:43 -0700
Subject: [PATCH 389/434] Ensure that this runs only when the incoming
 frequency is per-instance.

---
 cloudinit/handlers/upstart_job.py | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/cloudinit/handlers/upstart_job.py b/cloudinit/handlers/upstart_job.py
index 411a5d68..99e0afde 100644
--- a/cloudinit/handlers/upstart_job.py
+++ b/cloudinit/handlers/upstart_job.py
@@ -46,6 +46,10 @@ class UpstartJobPartHandler(handlers.Handler):
         if ctype in handlers.CONTENT_SIGNALS:
             return
 
+        # See: https://bugs.launchpad.net/bugs/819507
+        if frequency != PER_INSTANCE:
+            return
+
         if not self.upstart_dir:
             return
 

From d179f59c0957d8e0a5effeb26eecd9c448c60ee6 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 11:42:03 -0700
Subject: [PATCH 390/434] Add a test that ensures the upstart handler does not
 output files when in non-per-instance mode.

---
 tests/unittests/test_builtin_handlers.py | 54 ++++++++++++++++++++++++
 1 file changed, 54 insertions(+)
 create mode 100644 tests/unittests/test_builtin_handlers.py

diff --git a/tests/unittests/test_builtin_handlers.py b/tests/unittests/test_builtin_handlers.py
new file mode 100644
index 00000000..84d85d4d
--- /dev/null
+++ b/tests/unittests/test_builtin_handlers.py
@@ -0,0 +1,54 @@
+"""Tests of the built-in user data handlers"""
+
+import os
+
+from mocker import MockerTestCase
+
+from cloudinit import handlers
+from cloudinit import helpers
+from cloudinit import util
+
+from cloudinit.handlers import upstart_job
+
+from cloudinit.settings import (PER_ALWAYS, PER_INSTANCE)
+
+
+class TestBuiltins(MockerTestCase):
+
+    def test_upstart_frequency_no_out(self):
+        c_root = self.makeDir()
+        up_root = self.makeDir()
+        paths = helpers.Paths({
+            'cloud_dir': c_root,
+            'upstart_dir': up_root,
+        })
+        freq = PER_ALWAYS
+        h = upstart_job.UpstartJobPartHandler(paths)
+        # No files should be written out when
+        # the frequency is ! per-instance
+        h.handle_part('', handlers.CONTENT_START,
+                      None, None, None)
+        h.handle_part('blah', 'text/upstart-job',
+                      'test.conf', 'blah', freq)
+        h.handle_part('', handlers.CONTENT_END,
+                      None, None, None)
+        self.assertEquals(0, len(os.listdir(up_root)))
+
+    def test_upstart_frequency_single(self): 
+        c_root = self.makeDir()
+        up_root = self.makeDir()
+        paths = helpers.Paths({
+            'cloud_dir': c_root,
+            'upstart_dir': up_root,
+        })
+        freq = PER_INSTANCE
+        h = upstart_job.UpstartJobPartHandler(paths)
+        # No files should be written out when
+        # the frequency is ! per-instance
+        h.handle_part('', handlers.CONTENT_START,
+                      None, None, None)
+        h.handle_part('blah', 'text/upstart-job',
+                      'test.conf', 'blah', freq)
+        h.handle_part('', handlers.CONTENT_END,
+                      None, None, None)
+        self.assertEquals(1, len(os.listdir(up_root)))

From 349eb7b160b65e5618fe740ae4a2613960fc9f40 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 12:00:01 -0700
Subject: [PATCH 391/434] Add in the linking of the _all.deb with a symlink
 'cloud-init_all.deb'

---
 packages/bddeb | 14 +++++++++++---
 1 file changed, 11 insertions(+), 3 deletions(-)

diff --git a/packages/bddeb b/packages/bddeb
index 9015585b..b10f5a8e 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -133,9 +133,17 @@ def main():
                 cmd.extend(['-us', '-uc'])
             util.subp(cmd, capture=capture)
 
-        debname = "cloud-init_%s~%s-1_all.deb" % (version, revno)
-        shutil.move(util.abs_join(tdir, debname), debname)
-        print("Wrote out debian package %r" % (util.abs_join(debname)))
+        globs = [] 
+        globs.extend(glob.glob("%s/*.deb" %
+                     (os.path.join(tdir))))
+        for fn in globs:
+            base_fn = os.path.basename(fn)
+            shutil.move(fn, base_fn)
+            print("Wrote out debian package %r" % (base_fn))
+            if fn.endswith('_all.deb'):
+                # Add in the local link
+                util.del_file('cloud-init_all.deb')
+                util.symlink(base_fn, 'cloud-init_all.deb')
 
     return 0
 

From 2f9ec214ba622060f5054febde9a7a5c4672e1cc Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 12:03:05 -0700
Subject: [PATCH 392/434] Fix the variable name, should have been
 'additional_fns'

---
 cloudinit/stages.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 6689e4c9..4fcc66e4 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -399,7 +399,7 @@ class Modules(object):
         if self._cached_cfg is None:
             merger = helpers.ConfigMerger(paths=self.init.paths,
                                           datasource=self.init.datasource,
-                                          fns=self.cfg_files,
+                                          additional_fns=self.cfg_files,
                                           base_cfg=self.init.cfg)
             self._cached_cfg = merger.cfg
             LOG.debug("Loading 'module' config %s", self._cached_cfg)

From a0d6c556229b94c6c629fda379c218a491d8fda4 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 12:05:06 -0700
Subject: [PATCH 393/434] Add the rc code for blkid '2' being valid with a
 note as to why.

---
 cloudinit/util.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index f95a5d07..def4fefd 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -866,7 +866,8 @@ def find_devs_with(criteria=None, oformat='device',
     if path:
         options.append(path)
     cmd = blk_id_cmd + options
-    (out, _err) = subp(cmd)
+    # See man blkid for why 2 is added
+    (out, _err) = subp(cmd, rcs=[0, 2])
     entries = []
     for line in out.splitlines():
         line = line.strip()

From 1f007b82d7a2098a344ee00dd70e4347ec34291f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 12:12:34 -0700
Subject: [PATCH 394/434] Reduce the log levels by removing a few statements
 that happen too often (and aren't very meaningful)

---
 cloudinit/util.py | 6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index def4fefd..40f31570 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -1068,7 +1068,6 @@ def yaml_dumps(obj):
 def ensure_dir(path, mode=None):
     if not os.path.isdir(path):
         # Make the dir and adjust the mode
-        LOG.debug("Ensuring directory exists at path %s", path)
         with SeLinuxGuard(os.path.dirname(path), recursive=True):
             os.makedirs(path)
         chmod(path, mode)
@@ -1221,8 +1220,6 @@ def chmod(path, mode):
     except (ValueError, TypeError):
         pass
     if path and real_mode:
-        LOG.debug("Adjusting the permissions of %s (perms=%o)",
-                 path, real_mode)
         with SeLinuxGuard(path):
             os.chmod(path, real_mode)
 
@@ -1238,7 +1235,8 @@ def write_file(filename, content, mode=0644, omode="wb"):
     @param omode: The open mode used when opening the file (r, rb, a, etc.)
     """
     ensure_dir(os.path.dirname(filename))
-    LOG.debug("Writing to %s - %s, %s bytes", filename, omode, len(content))
+    LOG.debug("Writing to %s - %s: [%s] %s bytes",
+               filename, omode, mode, len(content))
     with SeLinuxGuard(path=filename):
         with open(filename, omode) as fh:
             fh.write(content)

From 4d6bcf81d46daa302b510e0c012202345d6b369c Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 12:18:54 -0700
Subject: [PATCH 395/434] Cleanup the pickling.

1. When loading the pickled file, don't log if it isn't there
  a. Do log though if it is there and unpickling fails
2. On writing log if pickling fails and log if pickle writing fails.
---
 cloudinit/stages.py | 30 +++++++++++++++++++++---------
 1 file changed, 21 insertions(+), 9 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 4fcc66e4..ef89e77c 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -159,15 +159,23 @@ class Init(object):
         return merger.cfg
 
     def _restore_from_cache(self):
+        # We try to restore from a current link and static path
+        # by using the instance link, if purge_cache was called
+        # the file wont exist.
         pickled_fn = self.paths.get_ipath_cur('obj_pkl')
+        pickle_contents = None
         try:
-            # we try to restore from a current link and static path
-            # by using the instance link, if purge_cache was called
-            # the file wont exist
-            return pickle.loads(util.load_file(pickled_fn))
+            pickle_contents = util.load_file(pickled_fn)
         except Exception:
-            util.logexc(LOG, "Failed loading pickled datasource from %s",
-                        pickled_fn)
+            pass
+        # This is expected so just return nothing
+        # successfully loaded...
+        if not pickle_contents:
+            return None
+        try:
+            return pickle.loads(pickle_contents)
+        except Exception:
+            util.logexc(LOG, "Failed loading pickled blob from %s", pickled_fn)
             return None
 
     def _write_to_cache(self):
@@ -175,12 +183,16 @@ class Init(object):
             return False
         pickled_fn = self.paths.get_ipath_cur("obj_pkl")
         try:
-            contents = pickle.dumps(self.datasource)
-            util.write_file(pickled_fn, contents, mode=0400)
-            return True
+            pk_contents = pickle.dumps(self.datasource)
+        except Exception:
+            util.logexc(LOG, "Failed pickling datasource %s", self.datasource)
+            return False
+        try:
+            util.write_file(pickled_fn, pk_contents, mode=0400)
         except Exception:
             util.logexc(LOG, "Failed pickling datasource to %s", pickled_fn)
             return False
+        return True
 
     def _get_datasources(self):
         # Any config provided???

From afc62cf910bb05578e224611f481e8b1df4ba521 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 12:28:44 -0700
Subject: [PATCH 396/434] Readd the original prefix to the netinfo (if
 provided).

---
 cloudinit/netinfo.py | 16 +++++++++++++---
 1 file changed, 13 insertions(+), 3 deletions(-)

diff --git a/cloudinit/netinfo.py b/cloudinit/netinfo.py
index a6b9116d..feba5a62 100644
--- a/cloudinit/netinfo.py
+++ b/cloudinit/netinfo.py
@@ -150,8 +150,18 @@ def route_pformat():
     return "\n".join(lines)
 
 
-def debug_info():
+def debug_info(prefix='ci-info: '):
     lines = []
-    lines.append(netdev_pformat())
-    lines.append(route_pformat())
+    netdev_lines = netdev_pformat().splitlines()
+    if prefix:
+        for line in netdev_lines:
+            lines.append("%s%s" % (prefix, line))
+    else:
+        lines.extend(netdev_lines)
+    route_lines = route_pformat().splitlines()
+    if prefix:
+        for line in route_lines:
+            lines.append("%s%s" % (prefix, line))
+    else:
+        lines.extend(route_lines)
     return "\n".join(lines)

From d8cffa173fe1b75ee88c3ea6519ef58a7bd90049 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 13:08:52 -0700
Subject: [PATCH 397/434] Don't always log stdout and stderr (exceptions will
 capture them if it fails)

---
 cloudinit/util.py | 4 ----
 1 file changed, 4 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 40f31570..3cf51e65 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -1287,10 +1287,6 @@ def subp(args, data=None, rcs=None, env=None, capture=True, shell=False):
         out = ''
     if not err and capture:
         err = ''
-    # Useful to note what happened...
-    if capture:
-        LOG.debug("Stdout: %s", out)
-        LOG.debug("Stderr: %s", err)
     return (out, err)
 
 

From fc46a91dfa56f1506f69980ddc7792fd2799fba9 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 13:20:09 -0700
Subject: [PATCH 398/434] Don't show the args but show the name and lock that
 is being used.

---
 cloudinit/helpers.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/cloudinit/helpers.py b/cloudinit/helpers.py
index 0f86285f..15036a50 100644
--- a/cloudinit/helpers.py
+++ b/cloudinit/helpers.py
@@ -168,8 +168,7 @@ class Runners(object):
             if not lk:
                 raise LockFailure("Failed to acquire lock for %s" % name)
             else:
-                LOG.debug("Running %s with args %s using lock (%s)",
-                          functor, args, lk)
+                LOG.debug("Running %s using lock (%s)", name, lk)
                 if isinstance(args, (dict)):
                     results = functor(**args)
                 else:

From 2a69655938d7eacaf7d9d4bbc3774079e0893068 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 13:27:11 -0700
Subject: [PATCH 399/434] Fix the datasource not being fetched in single
 running mode.

---
 bin/cloud-init | 23 +++++++++++++++++------
 1 file changed, 17 insertions(+), 6 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index 025195d4..e00913e3 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -301,16 +301,27 @@ def main_query(name, _args):
 def main_single(name, args):
     # Cloud-init single stage is broken up into the following sub-stages
     # 1. Ensure that the init object fetches its config without errors
-    # 2. Construct the modules object
-    # 3. Adjust any subsequent logging/output redirections using
+    # 2. Attempt to fetch the datasource (warn if it doesn't work)
+    # 3. Construct the modules object
+    # 4. Adjust any subsequent logging/output redirections using
     #    the modules objects configuration
-    # 4. Run the single module
-    # 5. Done!
+    # 5. Run the single module
+    # 6. Done!
     mod_name = args.name
     welcome("%s:%s" % (name, mod_name))
     init = stages.Init(ds_deps=[])
     # Stage 1
     init.read_cfg(extract_fns(args))
+    # Stage 2
+    try:
+        init.fetch()
+    except sources.DataSourceNotFoundException:
+        # There was no datasource found,
+        # that might be bad (or ok) depending on
+        # the module being ran (so continue on)
+        util.logexc(LOG, ("Failed to fetch your datasource,"
+                          " likely bad things to come!"))
+    # Stage 3
     mods = stages.Modules(init, extract_fns(args))
     mod_args = args.module_args
     if mod_args:
@@ -319,7 +330,7 @@ def main_single(name, args):
     if mod_freq:
         LOG.debug("Using passed in frequency %s", mod_freq)
         mod_freq = FREQ_SHORT_NAMES.get(mod_freq)
-    # Stage 3
+    # Stage 4
     try:
         LOG.debug("Closing stdin")
         util.close_stdin()
@@ -332,7 +343,7 @@ def main_single(name, args):
                    " longer be active shortly"))
         logging.resetLogging()
     logging.setupLogging(mods.cfg)
-    # Stage 4
+    # Stage 5
     (which_ran, failures) = mods.run_single(mod_name,
                                             mod_args,
                                             mod_freq)

From 5fd9633ed57abbc7b4c98f0880292d3fd5211bd3 Mon Sep 17 00:00:00 2001
From: Scott Moser <smoser@ubuntu.com>
Date: Fri, 29 Jun 2012 16:37:05 -0400
Subject: [PATCH 400/434] packages/bddeb: fix broken bddeb

needed to import glob, and use os.symlink, not util.symlink.

Also, make the 'tar' verbose if the '-v' option is given.
---
 packages/bddeb | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/packages/bddeb b/packages/bddeb
index b10f5a8e..eeb64434 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -3,6 +3,7 @@
 import os
 import shutil
 import sys
+import glob
 
 # Use the util functions from cloudinit
 possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
@@ -123,7 +124,7 @@ def main():
                util.abs_join(tdir, tar_fn), 
                '-C', util.abs_join(tdir, 'cloud-init')]
         cmd.extend(os.listdir(util.abs_join(tdir, 'cloud-init')))
-        util.subp(cmd)
+        util.subp(cmd, capture=capture)
         shutil.copy(util.abs_join(tdir, tar_fn), tar_fn)
         print("Wrote out archive %r" % (util.abs_join(tar_fn)))
         
@@ -143,7 +144,7 @@ def main():
             if fn.endswith('_all.deb'):
                 # Add in the local link
                 util.del_file('cloud-init_all.deb')
-                util.symlink(base_fn, 'cloud-init_all.deb')
+                os.symlink(base_fn, 'cloud-init_all.deb')
 
     return 0
 

From d1c711d825df47fc7240cbca38c74f80b0cb1b41 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 13:44:31 -0700
Subject: [PATCH 401/434] Add a force option which will allow users to continue
 running when no datasource is found.

---
 bin/cloud-init | 26 +++++++++++++++++++-------
 1 file changed, 19 insertions(+), 7 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index e00913e3..0330cb2b 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -202,16 +202,18 @@ def main_init(name, args):
     try:
         init.fetch()
     except sources.DataSourceNotFoundException:
-        util.logexc(LOG, "No instance datasource found!")
+        util.logexc(LOG, ("No instance datasource found!"
+                          " Likely bad things to come!"))
         # In the case of cloud-init (net mode) it is a bit
         # more likely that the user would consider it
         # failure if nothing was found. When using
         # upstart it will also mentions job failure
         # in console log if exit code is != 0.
-        if args.local:
-            return 0
-        else:
-            return 1
+        if not args.force:
+            if args.local:
+                return 0
+            else:
+                return 1
     # Stage 6
     iid = init.instancify()
     LOG.debug("%s will now be targeting instance id: %s", name, iid)
@@ -272,8 +274,11 @@ def main_modules(action_name, args):
         init.fetch()
     except sources.DataSourceNotFoundException:
         # There was no datasource found, theres nothing to do
-        util.logexc(LOG, 'Can not apply stage %s, no datasource found!', name)
-        return 1
+        util.logexc(LOG, ('Can not apply stage %s, '
+                          'no datasource found!'
+                          " Likely bad things to come!"), name)
+        if not args.force:
+            return 1
     # Stage 3
     mods = stages.Modules(init, extract_fns(args))
     # Stage 4
@@ -321,6 +326,8 @@ def main_single(name, args):
         # the module being ran (so continue on)
         util.logexc(LOG, ("Failed to fetch your datasource,"
                           " likely bad things to come!"))
+        if not args.force:
+            return 1
     # Stage 3
     mods = stages.Modules(init, extract_fns(args))
     mod_args = args.module_args
@@ -373,6 +380,11 @@ def main():
                         help=('show additional pre-action'
                               ' logging (default: %(default)s)'),
                         default=False)
+    parser.add_argument('--force', action='store_true',
+                        help=('force running even if no datasource is'
+                              ' found (use at your own risk)'),
+                        dest='force',
+                        default=False)
     subparsers = parser.add_subparsers()
 
     # Each action and its sub-options (if any)

From 2282aeb6b82bee38951581a7a271f3f1e72f5617 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 13:46:19 -0700
Subject: [PATCH 402/434] Don't remove the key if it's not there (or was already
 removed)

---
 cloudinit/ssh_util.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/cloudinit/ssh_util.py b/cloudinit/ssh_util.py
index fc8b9b3d..e0a2f0ca 100644
--- a/cloudinit/ssh_util.py
+++ b/cloudinit/ssh_util.py
@@ -197,7 +197,8 @@ def update_authorized_keys(fname, keys):
                 # Replace it with our better one
                 ent = k
                 # Don't add it later
-                to_add.remove(k)
+                if k in to_add:
+                    to_add.remove(k)
         entries[i] = ent
 
     # Now append any entries we did not match above

From 53a38344305ffcf3b40f19f0cb845a3b13370eba Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 13:49:55 -0700
Subject: [PATCH 403/434] Just log the number of commands 'shellified'

---
 cloudinit/util.py | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 3cf51e65..3ff3835a 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -1303,21 +1303,24 @@ def shellify(cmdlist, add_header=True):
     if add_header:
         content += "#!/bin/sh\n"
     escaped = "%s%s%s%s" % ("'", '\\', "'", "'")
+    cmds_made = 0
     for args in cmdlist:
-        # if the item is a list, wrap all items in single tick
-        # if its not, then just write it directly
+        # If the item is a list, wrap all items in single tick.
+        # If its not, then just write it directly.
         if isinstance(args, list):
             fixed = []
             for f in args:
                 fixed.append("'%s'" % (str(f).replace("'", escaped)))
             content = "%s%s\n" % (content, ' '.join(fixed))
+            cmds_made += 1
         elif isinstance(args, (str, basestring)):
             content = "%s%s\n" % (content, args)
+            cmds_made += 1
         else:
             raise RuntimeError(("Unable to shellify type %s"
                                 " which is not a list or string")
                                % (obj_name(args)))
-    LOG.debug("Shellified %s to %s", cmdlist, content)
+    LOG.debug("Shellified %s commands.", cmds_made)
     return content
 
 

From 80c59cb63547e0a6d512c75f93a9c4ad268dee0d Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 14:01:26 -0700
Subject: [PATCH 404/434] Remove logging of module/init configs

---
 cloudinit/stages.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index ef89e77c..2f175934 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -144,7 +144,7 @@ class Init(object):
         # None check so that we don't keep on re-loading if empty
         if self._cfg is None:
             self._cfg = self._read_cfg(extra_fns)
-            LOG.debug("Loaded 'init' config %s", self._cfg)
+            # LOG.debug("Loaded 'init' config %s", self._cfg)
 
     def _read_cfg(self, extra_fns):
         try:
@@ -414,7 +414,7 @@ class Modules(object):
                                           additional_fns=self.cfg_files,
                                           base_cfg=self.init.cfg)
             self._cached_cfg = merger.cfg
-            LOG.debug("Loading 'module' config %s", self._cached_cfg)
+            # LOG.debug("Loading 'module' config %s", self._cached_cfg)
         # Only give out a copy so that others can't modify this...
         return copy.deepcopy(self._cached_cfg)
 

From c3dffc2d0d9ee7da4e43800600ec87118babd3e7 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 14:42:06 -0700
Subject: [PATCH 405/434] If logging hasn't been enabled via '--debug' at least
 log the exceptions that occur to stderr.

---
 bin/cloud-init | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)

diff --git a/bin/cloud-init b/bin/cloud-init
index 0330cb2b..22901e15 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -24,6 +24,7 @@
 import argparse
 import os
 import sys
+import traceback
 
 # This is more just for running from the bin folder so that
 # cloud-init binary can find the cloudinit module
@@ -64,6 +65,18 @@ FREQ_SHORT_NAMES = {
 LOG = logging.getLogger()
 
 
+# Used for when a logger may not be active
+# and we still want to print exceptions...
+def print_exc(msg=''):
+    if msg:
+        sys.stderr.write("%s\n" % (msg))
+    sys.stderr.write('-' * 60)
+    sys.stderr.write("\n")
+    traceback.print_exc(file=sys.stderr)
+    sys.stderr.write('-' * 60)
+    sys.stderr.write("\n")
+
+
 def welcome(action):
     msg = ("Cloud-init v. {{version}} running '{{action}}' at "
            "{{timestamp}}. Up {{uptime}} seconds.")
@@ -151,6 +164,7 @@ def main_init(name, args):
         (outfmt, errfmt) = util.fixup_output(init.cfg, name)
     except:
         util.logexc(LOG, "Failed to setup output redirection!")
+        print_exc("Failed to setup output redirection!")
     if args.debug:
         # Reset so that all the debug handlers are closed out
         LOG.debug(("Logging being reset, this logger may no"
@@ -277,6 +291,9 @@ def main_modules(action_name, args):
         util.logexc(LOG, ('Can not apply stage %s, '
                           'no datasource found!'
                           " Likely bad things to come!"), name)
+        print_exc(('Can not apply stage %s, '
+                   'no datasource found!'
+                   " Likely bad things to come!") % (name))
         if not args.force:
             return 1
     # Stage 3
@@ -326,6 +343,8 @@ def main_single(name, args):
         # the module being ran (so continue on)
         util.logexc(LOG, ("Failed to fetch your datasource,"
                           " likely bad things to come!"))
+        print_exc(("Failed to fetch your datasource,"
+                   " likely bad things to come!"))
         if not args.force:
             return 1
     # Stage 3

From 2a3d52a1b285a33b99fb2d9e67fe8e030da11813 Mon Sep 17 00:00:00 2001
From: Scott Moser <smoser@ubuntu.com>
Date: Fri, 29 Jun 2012 20:06:32 -0400
Subject: [PATCH 406/434] add update_package_sources to distro class

Previously update_package_sources was a private method
(_update_package_sources).  The apt_update_upgrade class called it.

It does make sense that things would want to call this independently
of installing packages.  Therefore, expose it as a non hidden method.
---
 cloudinit/distros/__init__.py |  4 ++++
 cloudinit/distros/debian.py   |  4 ++--
 cloudinit/distros/rhel.py     | 10 ++++++++++
 3 files changed, 16 insertions(+), 2 deletions(-)

diff --git a/cloudinit/distros/__init__.py b/cloudinit/distros/__init__.py
index c324ddf6..da4d0180 100644
--- a/cloudinit/distros/__init__.py
+++ b/cloudinit/distros/__init__.py
@@ -71,6 +71,10 @@ class Distro(object):
     def package_command(self, cmd, args=None):
         raise NotImplementedError()
 
+    @abc.abstractmethod
+    def update_package_sources(self):
+        raise NotImplementedError()
+
     def get_package_mirror(self):
         return self.get_option('package_mirror')
 
diff --git a/cloudinit/distros/debian.py b/cloudinit/distros/debian.py
index 3a0cae19..3247d7ce 100644
--- a/cloudinit/distros/debian.py
+++ b/cloudinit/distros/debian.py
@@ -53,7 +53,7 @@ class Distro(distros.Distro):
         util.write_file(out_fn, "\n".join(contents))
 
     def install_packages(self, pkglist):
-        self._update_package_sources()
+        self.update_package_sources()
         self.package_command('install', pkglist)
 
     def _write_network(self, settings):
@@ -144,6 +144,6 @@ class Distro(distros.Distro):
         # Allow the output of this to flow outwards (ie not be captured)
         util.subp(cmd, env=e, capture=False)
 
-    def _update_package_sources(self):
+    def update_package_sources(self):
         self._runner.run("update-sources", self.package_command,
                          ["update"], freq=PER_INSTANCE)
diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index 87d5b7a8..342d4c79 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -26,6 +26,8 @@ from cloudinit import distros
 from cloudinit import log as logging
 from cloudinit import util
 
+from cloudinit.settings import PER_INSTANCE
+
 LOG = logging.getLogger(__name__)
 
 NETWORK_FN_TPL = '/etc/sysconfig/network-scripts/ifcfg-%s'
@@ -57,6 +59,10 @@ class Distro(distros.Distro):
 
     def __init__(self, name, cfg, paths):
         distros.Distro.__init__(self, name, cfg, paths)
+        # This will be used to restrict certain
+        # calls from repeatly happening (when they
+        # should only happen say once per instance...)
+        self._runner = helpers.Runners(paths)
 
     def install_packages(self, pkglist):
         self.package_command('install', pkglist)
@@ -199,6 +205,10 @@ class Distro(distros.Distro):
         # Allow the output of this to flow outwards (ie not be captured)
         util.subp(cmd, capture=False)
 
+    def update_package_sources(self):
+        self._runner.run("update-sources", self.package_command,
+                         ["update"], freq=PER_INSTANCE)
+
 
 # This class helps adjust the configobj
 # writing to ensure that when writing a k/v

From b427ac1d19027022a7f63c29a43205e6f0d6f463 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 18:20:12 -0700
Subject: [PATCH 407/434] Start filling out the 0.7 changelog section.

---
 ChangeLog | 181 +++++++++++++++++++++++++++++++++++++++++++++++++++++-
 1 file changed, 180 insertions(+), 1 deletion(-)

diff --git a/ChangeLog b/ChangeLog
index 4e75199b..3d7dba0e 100644
--- a/ChangeLog
+++ b/ChangeLog
@@ -1,5 +1,184 @@
 0.7.0:
- - Huge refactor [Joshua Harlow]
+ - unified binary that activates the various stages
+   - Now using argparse + subcommands to specify the various CLI options
+ - a stage module that clearly separates the stages of the different
+   components (also described how they are used and in what order in the
+   new unified binary)
+ - user_data is now a module that just does user data processing while the
+   actual activation and 'handling' of the processed user data is done via
+   a separate set of files (and modules) with the main 'init' stage being the
+   controller of this
+   - creation of boot_hook, cloud_config, shell_script, upstart_job version 2
+     modules (with classes that perform there functionality) instead of those
+     having functionality that is attached to the cloudinit object (which
+     reduces reuse and limits future functionality, and makes testing harder)
+ - removal of global config that defined paths, shared config, now this is
+   via objects making unit testing testing and global side-effects a non issue
+ - creation of a 'helpers.py' 
+   - this contains an abstraction for the 'lock' like objects that the various 
+     module/handler running stages use to avoid re-running a given 
+     module/handler for a given frequency. this makes it separated from 
+     the actual usage of that object (thus helpful for testing and clear lines
+     usage and how the actual job is accomplished)
+     - a common 'runner' class is the main entrypoint using these locks to
+       run function objects passed in (along with there arguments) and there
+       frequency
+   - add in a 'paths' object that provides access to the previously global
+     and/or config based paths, this also adds in the ability to change the
+     path when constructing that path 'object' and adding in additional config
+     that can be used to alter the root paths of 'joins' (useful for testing
+     or possibly useful in chroots?)
+   - add a config parser subclass that will automatically add unknown sections
+     and return default values (instead of throwing exceptions for these cases)
+   - a new config merging class that will be the central object that knows
+     how to do the common configuration merging from the various configuration
+     sources. The order is the following:
+     - cli config files override environment config files
+       which override instance configs which override datasource
+       configs which override base configuration which overrides
+       default configuration.
+ - remove the passing around of the 'cloudinit' object as a 'cloud' variable
+   and instead pass around an 'interface' object that can be given to modules
+   and handlers as there cloud access layer while the backing of that
+   object can be varied (good for abstraction and testing)
+ - use a single set of functions to do importing of modules
+ - add a function in which will search for a given set of module names with
+   a given set of attributes and return those which are found
+ - refactor logging so that instead of using a single top level 'log' that
+   instead each component/module can use its own logger (if desired), this
+   should be backwards compatible with handlers and config modules that used
+   the passed in logger (its still passed in)
+   - ensure that all places where exception are caught and where applicable
+     that the util logexc() is called, so that no exceptions that may occur
+     are dropped without first being logged (where it makes sense for this 
+     to happen)
+ - add a 'requires' file that lists cloud-init dependencies
+   - applying it in package creation (bdeb and brpm) as well as using it
+     in the modified setup.py to ensure dependencies are installed when
+     using that method of packaging
+ - add a 'version.py' that lists the active version (in code) so that code
+   inside cloud-init can report the version in messaging and other config files
+ - cleanup of subprocess usage so that all subprocess calls go through the
+   subp() utility method, which now has an exception type that will provide
+   detailed information on python 2.6 and 2.7
+ - forced all code loading, moving, chmod, writing files and other system
+   level actions to go through standard set of util functions, this greatly 
+   helps in debugging and determining exactly which system actions cloud-init is
+   performing
+ - switching out the templating engine cheetah for tempita since tempita has
+   no external dependencies (minus python) while cheetah has many dependencies
+   which makes it more difficult to adopt cloud-init in distros that may not
+   have those dependencies
+ - adjust url fetching and url trying to go through a single function that
+   reads urls in the new 'url helper' file, this helps in tracing, debugging
+   and knowing which urls are being called and/or posted to from with-in 
+   cloud-init code
+   - add in the sending of a 'User-Agent' header for all urls fetched that
+     do not provide there own header mapping, derive this user-agent from
+     the following template, 'Cloud-Init/{version}' where the version is the
+     cloud-init version number
+ - using prettytable for netinfo 'debug' printing since it provides a standard
+   and defined output that should be easier to parse than a custom format
+ - add a set of distro specific classes, that handle distro specific actions
+   that modules and or handler code can use as needed, this is organized into
+   a base abstract class with child classes that implement the shared 
+   functionality. config determines exactly which subclass to load, so it can
+   be easily extended as needed.
+   - current functionality
+      - network interface config file writing
+      - hostname setting/updating
+      - locale/timezone/ setting
+      - updating of /etc/hosts (with templates or generically)
+      - package commands (ie installing, removing)/mirror finding
+      - interface up/down activating
+   - implemented a debian + ubuntu subclass
+   - implemented a redhat + fedora subclass
+ - adjust the root 'cloud.cfg' file to now have distrobution/path specific 
+   configuration values in it. these special configs are merged as the normal
+   config is, but the system level config is not passed into modules/handlers
+   - modules/handlers must go through the path and distro object instead
+ - have the cloudstack datasource test the url before calling into boto to 
+   avoid the long wait for boto to finish retrying and finally fail when
+   the gateway meta-data address is unavailable
+ - add a simple mock ec2 meta-data python based http server that can serve a
+   very simple set of ec2 meta-data back to callers
+      - useful for testing or for understanding what the ec2 meta-data 
+        service can provide in terms of data or functionality
+ - for ssh key and authorized key file parsing add in classes and util functions
+   that maintain the state of individual lines, allowing for a clearer 
+   separation of parsing and modification (useful for testing and tracing)
+ - add a set of 'base' init.d scripts that can be used on systems that do
+   not have full upstart or systemd support (or support that does not match
+   the standard fedora/ubuntu implementation)
+   - currently these are being tested on RHEL 6.2
+ - separate the datasources into there own subdirectory (instead of being
+   a top-level item), this matches how config 'modules' and user-data 'handlers'
+   are also in there own subdirectory (thus helping new developers and others
+   understand the code layout in a quicker manner)
+ - add the building of rpms based off a new cli tool and template 'spec' file
+   that will templatize and perform the necessary commands to create a source
+   and binary package to be used with a cloud-init install on a 'rpm' supporting
+   system
+   - uses the new standard set of requires and converts those pypi requirements
+     into a local set of package requirments (that are known to exist on RHEL
+     systems but should also exist on fedora systems)
+ - adjust the bdeb builder to be a python script (instead of a shell script) and
+   make its 'control' file a template that takes in the standard set of pypi 
+   dependencies and uses a local mapping (known to work on ubuntu) to create the
+   packages set of dependencies (that should also work on ubuntu-like systems)
+ - pythonify a large set of various pieces of code
+   - remove wrapping return statements with () when it has no effect
+   - upper case all constants used
+   - use os.path.join (and similar commands) instead of custom path creation
+   - use 'is None' instead of the frowned upon '== None' which picks up a large
+     set of 'true' cases than is typically desired (ie for objects that have
+     there own equality)
+   - use context managers on locks, tempdir, chdir, file, selinux, umask, 
+     unmounting commands so that these actions do not have to be closed and/or
+     cleaned up manually in finally blocks, which is typically not done and will
+     eventually be a bug in the future
+   - use the 'abc' module for abstract classes base where possible
+      - applied in the datasource root class, the distro root class, and the
+        user-data v2 root class
+ - when loading yaml, check that the 'root' type matches a predefined set of
+   valid types (typically just 'dict') and throw a type error if a mismatch
+   occurs, this seems to be a good idea to do when loading user config files
+ - when forking a long running task (ie resizing a filesytem) use a new util
+   function that will fork and then call a callback, instead of having to
+   implement all that code in a non-shared location (thus allowing it to be
+   used by others in the future)
+ - when writing out filenames, go through a util function that will attempt to
+   ensure that the given filename is 'filesystem' safe by replacing '/' with
+   '_' and removing characters which do not match a given whitelist of allowed
+   filename characters
+ - for the varying usages of the 'blkid' command make a function in the util
+   module that can be used as the single point of entry for interaction with
+   that command (and its results) instead of having X separate implementations
+ - place the rfc 8222 time formatting and uptime repeated pieces of code in the
+   util module as a set of function with the name 'time_rfc2822'/'uptime'
+ - separate the pylint+pep8 calling from one tool into two indivudal tools so
+   that they can be called independently, add make file sections that can be 
+   used to call these independently
+ - remove the support for the old style config that was previously located in
+   '/etc/ec2-init/ec2-config.cfg', no longer supported!
+ - instead of using a altered config parser that added its own 'dummy' section
+   on in the 'mcollective' module, use configobj which handles the parsing of
+   config without sections better (and it also maintains comments instead of
+   removing them)
+ - use the new defaulting config parser (that will not raise errors on sections
+   that do not exist or return errors when values are fetched that do not exist)
+   in the 'puppet' module
+ - for config 'modules' add in the ability for the module to provide a list of 
+   distro names which it is known to work with, if when ran and the distro being
+   used name does not match one of those in this list, a warning will be written
+   out saying that this module may not work correctly on this distrobution
+ - for all dynamically imported modules ensure that they are fixed up before 
+   they are used by ensuring that they have certain attributes, if they do not
+   have those attributes they will be set to a sensible set of defaults instead
+ - adjust all 'config' modules and handlers to use the adjusted util functions
+   and the new distro objects where applicable so that those pieces of code can 
+   benefit from the unified and enhanced functionality being provided in that
+   util module
 0.6.4:
  - support relative path in AuthorizedKeysFile (LP: #970071).
  - make apt-get update run with --quiet (suitable for logging) (LP: #1012613)

From 62e027b172b1eaa1cab8b3bf6383fdd36379f0bf Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 29 Jun 2012 18:29:45 -0700
Subject: [PATCH 408/434] Update the todo with comments on new actions to be
 fixed.

1. Use the netcf library instead of the ubuntu -> rhel format conversion occurring now
2. Replace the apt* like config 'modules' with generic ones that will
   use the new distro classes to handle the specific lower-level details
---
 TODO | 15 +++++++++++----
 1 file changed, 11 insertions(+), 4 deletions(-)

diff --git a/TODO b/TODO
index 568bdb07..50471774 100644
--- a/TODO
+++ b/TODO
@@ -1,14 +1,21 @@
-- consider 'failsafe' DataSource
+- Consider a 'failsafe' DataSource
   If all others fail, setting a default that
    - sets the user password, writing it to console
    - logs to console that this happened
-- consider 'previous' DataSource
+- Consider 'previous' DataSource
   If no other data source is found, fall back to the 'previous' one
   keep a indication of what instance id that is in /var/lib/cloud
-- rewrite "cloud-init-query"
-  have DataSource and cloudinit expose explicit fields
+- Rewrite "cloud-init-query" (currently not implemented)
+  Possibly have DataSource and cloudinit expose explicit fields
    - instance-id
    - hostname
    - mirror
    - release
    - ssh public keys
+- Remove the conversion of the ubuntu network interface format conversion
+  to a RH/fedora format and replace it with a top level format that uses
+  the netcf libraries format instead (which itself knows how to translate
+  into the specific formats)
+- Replace the 'apt*' modules with variants that now use the distro classes
+  to perform distro independent packaging commands (where possible)
+ 

From a353240c09ce98a0a5124757c7bb862785c05196 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 29 Jun 2012 20:37:46 -0700
Subject: [PATCH 409/434] Refactor the selinux guard to aid in mocking

1. Adjust the test_util after this mocking to be cleaner
---
 cloudinit/util.py            | 28 +++++++++++-----------
 tests/unittests/test_util.py | 46 +++++++++++++++++++++++-------------
 2 files changed, 44 insertions(+), 30 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 3ff3835a..0c592656 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -46,19 +46,13 @@ import urlparse
 
 import yaml
 
+from cloudinit import importer
 from cloudinit import log as logging
 from cloudinit import url_helper as uhelp
 
 from cloudinit.settings import (CFG_BUILTIN, CLOUD_CONFIG)
 
 
-try:
-    import selinux
-    HAVE_LIBSELINUX = True
-except ImportError:
-    HAVE_LIBSELINUX = False
-
-
 LOG = logging.getLogger(__name__)
 
 # Helps cleanup filenames to ensure they aren't FS incompatible
@@ -126,31 +120,37 @@ class ProcessExecutionError(IOError):
 
 class SeLinuxGuard(object):
     def __init__(self, path, recursive=False):
+        # Late import since it might not always
+        # be possible to use this
+        try:
+            self.selinux = importer.import_module('selinux')
+        except ImportError:
+            self.selinux = None
         self.path = path
         self.recursive = recursive
-        self.enabled = False
-        if HAVE_LIBSELINUX and selinux.is_selinux_enabled():
-            self.enabled = True
 
     def __enter__(self):
-        return self.enabled
+        if self.selinux:
+            return True
+        else:
+            return False
 
     def __exit__(self, excp_type, excp_value, excp_traceback):
-        if self.enabled:
+        if self.selinux:
             path = os.path.realpath(os.path.expanduser(self.path))
             do_restore = False
             try:
                 # See if even worth restoring??
                 stats = os.lstat(path)
                 if stat.ST_MODE in stats:
-                    selinux.matchpathcon(path, stats[stat.ST_MODE])
+                    self.selinux.matchpathcon(path, stats[stat.ST_MODE])
                     do_restore = True
             except OSError:
                 pass
             if do_restore:
                 LOG.debug("Restoring selinux mode for %s (recursive=%s)",
                           path, self.recursive)
-                selinux.restorecon(path, recursive=self.recursive)
+                self.selinux.restorecon(path, recursive=self.recursive)
 
 
 class MountFailedError(Exception):
diff --git a/tests/unittests/test_util.py b/tests/unittests/test_util.py
index 3be6e186..93979f06 100644
--- a/tests/unittests/test_util.py
+++ b/tests/unittests/test_util.py
@@ -5,6 +5,26 @@ from unittest import TestCase
 from mocker import MockerTestCase
 
 from cloudinit import util
+from cloudinit import importer
+
+
+class FakeSelinux(object):
+
+    def __init__(self, match_what):
+        self.match_what = match_what
+        self.restored = []
+
+    def matchpathcon(self, path, mode):
+        if path == self.match_what:
+            return
+        else:
+            raise OSError("No match!")
+
+    def is_selinux_enabled(self):
+        return True
+
+    def restorecon(self, path, recursive):
+        self.restored.append(path)
 
 
 class TestMergeDict(MockerTestCase):
@@ -159,22 +179,16 @@ class TestWriteFile(MockerTestCase):
 
     def test_restorecon_if_possible_is_called(self):
         """Make sure the selinux guard is called correctly."""
-        try:
-            # We can only mock these out if selinux actually
-            # exists, so thats why we catch the import
-            mock_restorecon = self.mocker.replace(
-                "selinux.restorecon", passthrough=False)
-            mock_is_selinux_enabled = self.mocker.replace(
-                "selinux.is_selinux_enabled", passthrough=False)
-            mock_is_selinux_enabled()
-            self.mocker.result(True)
-            mock_restorecon("/etc/hosts", recursive=False)
-            self.mocker.result(True)
-            self.mocker.replay()
-            with util.SeLinuxGuard("/etc/hosts") as is_on:
-                self.assertTrue(is_on)
-        except ImportError:
-            pass
+        import_mock = self.mocker.replace(importer.import_module,
+                                          passthrough=False)
+        import_mock('selinux')
+        fake_se = FakeSelinux('/etc/hosts')
+        self.mocker.result(fake_se)
+        self.mocker.replay()
+        with util.SeLinuxGuard("/etc/hosts") as is_on:
+            self.assertTrue(is_on)
+        self.assertEqual(1, len(fake_se.restored))
+        self.assertEqual('/etc/hosts', fake_se.restored[0])
 
 
 class TestDeleteDirContents(MockerTestCase):

From 8777acf770a67b52d2ef5c3e78dab2384ae2be93 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 29 Jun 2012 20:38:19 -0700
Subject: [PATCH 410/434] Include the helpers import.

---
 cloudinit/distros/rhel.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/cloudinit/distros/rhel.py b/cloudinit/distros/rhel.py
index 342d4c79..7fa69f03 100644
--- a/cloudinit/distros/rhel.py
+++ b/cloudinit/distros/rhel.py
@@ -23,6 +23,7 @@
 import os
 
 from cloudinit import distros
+from cloudinit import helpers
 from cloudinit import log as logging
 from cloudinit import util
 

From 0d075ec8e10899950500eaa59d7ad2d2d1f10a0e Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Fri, 29 Jun 2012 20:38:34 -0700
Subject: [PATCH 411/434] Add some more TODO to be done in the future.

---
 TODO | 15 +++++++++++++--
 1 file changed, 13 insertions(+), 2 deletions(-)

diff --git a/TODO b/TODO
index 50471774..30a52cae 100644
--- a/TODO
+++ b/TODO
@@ -2,7 +2,7 @@
   If all others fail, setting a default that
    - sets the user password, writing it to console
    - logs to console that this happened
-- Consider 'previous' DataSource
+- Consider a 'previous' DataSource
   If no other data source is found, fall back to the 'previous' one
   keep a indication of what instance id that is in /var/lib/cloud
 - Rewrite "cloud-init-query" (currently not implemented)
@@ -18,4 +18,15 @@
   into the specific formats)
 - Replace the 'apt*' modules with variants that now use the distro classes
   to perform distro independent packaging commands (where possible)
- 
+- Canonicalize the semaphore/lock name for modules and user data handlers
+  a. It is most likely a bug that currently exists that if a module in config
+     alters its name and it has already ran, then it will get ran again since
+     the lock name hasn't be canonicalized
+- Replace some the LOG.debug calls with a LOG.info where appropriate instead
+  of how right now there is really only 2 levels (WARN and DEBUG)
+- Remove the 'cc_' for config modules, either have them fully specified (ie
+  'cloudinit.config.resizefs') or by default only look in the 'cloudinit.config'
+  for these modules (or have a combination of the above), this avoids having
+  to understand where your modules are coming from (which can be altered by
+  the current python inclusion path)
+

From e7d50b8e0881c47ec0e861f3be673e6f4811e36a Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sat, 30 Jun 2012 16:18:00 -0700
Subject: [PATCH 412/434] Add comment about #includeonce/#include bug/change

---
 ChangeLog | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/ChangeLog b/ChangeLog
index 3d7dba0e..d55eac9c 100644
--- a/ChangeLog
+++ b/ChangeLog
@@ -179,6 +179,10 @@
    and the new distro objects where applicable so that those pieces of code can 
    benefit from the unified and enhanced functionality being provided in that
    util module
+ - fix a potential bug whereby when a #includeonce was encountered it would
+   enable checking of urls against a cache, if later a #include was encountered
+   it would continue checking against that cache, instead of refetching (which
+   would likely be the expected case)
 0.6.4:
  - support relative path in AuthorizedKeysFile (LP: #970071).
  - make apt-get update run with --quiet (suitable for logging) (LP: #1012613)

From 216d656c68886139ad7d267ff7de110ac3856980 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sat, 30 Jun 2012 16:56:14 -0700
Subject: [PATCH 413/434] Add in more comments about what has been
 changed/adjusted/reworked

---
 ChangeLog | 13 +++++++++----
 1 file changed, 9 insertions(+), 4 deletions(-)

diff --git a/ChangeLog b/ChangeLog
index d55eac9c..ecac7888 100644
--- a/ChangeLog
+++ b/ChangeLog
@@ -24,10 +24,14 @@
        run function objects passed in (along with there arguments) and there
        frequency
    - add in a 'paths' object that provides access to the previously global
-     and/or config based paths, this also adds in the ability to change the
-     path when constructing that path 'object' and adding in additional config
-     that can be used to alter the root paths of 'joins' (useful for testing
-     or possibly useful in chroots?)
+     and/or config based paths (thus providing a single entrypoint object/type
+     that provides path information)
+       - this also adds in the ability to change the path when constructing 
+       that path 'object' and adding in additional config that can be used to 
+       alter the root paths of 'joins' (useful for testing or possibly useful
+       in chroots?)
+        - config options now avaiable that can alter the 'write_root' and the 
+         'read_root' when backing code uses the paths join() function
    - add a config parser subclass that will automatically add unknown sections
      and return default values (instead of throwing exceptions for these cases)
    - a new config merging class that will be the central object that knows
@@ -129,6 +133,7 @@
  - pythonify a large set of various pieces of code
    - remove wrapping return statements with () when it has no effect
    - upper case all constants used
+   - correctly 'case' class and method names (where applicable)
    - use os.path.join (and similar commands) instead of custom path creation
    - use 'is None' instead of the frowned upon '== None' which picks up a large
      set of 'true' cases than is typically desired (ie for objects that have

From 55464e8512455934f5c34e9f75bf49d4137662c9 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Sun, 1 Jul 2012 00:19:49 -0700
Subject: [PATCH 414/434] Add a multi log function that can write to stderr,
 console and a log debug, useful in certain cases

---
 bin/cloud-init                         |  4 +---
 cloudinit/config/cc_final_message.py   |  6 +-----
 cloudinit/config/cc_keys_to_console.py |  6 +++---
 cloudinit/util.py                      | 11 +++++++++++
 4 files changed, 16 insertions(+), 11 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index 22901e15..fce4fe8c 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -86,9 +86,7 @@ def welcome(action):
         'timestamp': util.time_rfc2822(),
         'action': action,
     }
-    welcome_msg = "%s" % (templater.render_string(msg, tpl_params))
-    sys.stderr.write("%s\n" % (welcome_msg))
-    LOG.debug(welcome_msg)
+    util.multi_log("%s\n" % (templater.render_string(msg, tpl_params)))
 
 
 def extract_fns(args):
diff --git a/cloudinit/config/cc_final_message.py b/cloudinit/config/cc_final_message.py
index fd59aa1e..711e7b5b 100644
--- a/cloudinit/config/cc_final_message.py
+++ b/cloudinit/config/cc_final_message.py
@@ -18,8 +18,6 @@
 #    You should have received a copy of the GNU General Public License
 #    along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import sys
-
 from cloudinit import templater
 from cloudinit import util
 from cloudinit import version
@@ -57,9 +55,7 @@ def handle(_name, cfg, cloud, log, args):
             'timestamp': ts,
             'version': cver,
         }
-        # Use stdout, stderr or the logger??
-        content = templater.render_string(msg_in, subs)
-        sys.stderr.write("%s\n" % (content))
+        util.multi_log("%s\n" % (templater.render_string(msg_in, subs)))
     except Exception:
         util.logexc(log, "Failed to render final message template")
 
diff --git a/cloudinit/config/cc_keys_to_console.py b/cloudinit/config/cc_keys_to_console.py
index d4c877f7..da7d5219 100644
--- a/cloudinit/config/cc_keys_to_console.py
+++ b/cloudinit/config/cc_keys_to_console.py
@@ -29,7 +29,7 @@ frequency = PER_INSTANCE
 HELPER_TOOL = '/usr/lib/cloud-init/write-ssh-key-fingerprints'
 
 
-def handle(name, cfg, cloud, log, _args):
+def handle(name, cfg, _cloud, log, _args):
     if not os.path.exists(HELPER_TOOL):
         log.warn(("Unable to activate module %s,"
                   " helper tool not found at %s"), name, HELPER_TOOL)
@@ -46,7 +46,7 @@ def handle(name, cfg, cloud, log, _args):
         cmd.append(','.join(fp_blacklist))
         cmd.append(','.join(key_blacklist))
         (stdout, _stderr) = util.subp(cmd)
-        util.write_file(cloud.paths.join(False, '/dev/console'), stdout)
+        util.multi_log("%s\n" % (stdout.strip()), stderr=False)
     except:
-        log.warn("Writing keys to /dev/console failed!")
+        log.warn("Writing keys to the system console failed!")
         raise
diff --git a/cloudinit/util.py b/cloudinit/util.py
index 0c592656..e6219d66 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -271,6 +271,17 @@ def find_modules(root_dir):
     return entries
 
 
+def multi_log(text, console=True, stderr=True, log=None):
+    if stderr:
+        sys.stderr.write(text)
+    if console:
+        with open('/dev/console', 'wb') as wfh:
+            wfh.write(text)
+            wfh.flush()
+    if log:
+        log.debug(text)
+
+
 def is_ipv4(instr):
     """ determine if input string is a ipv4 address. return boolean"""
     toks = instr.split('.')

From 71a802b036fda4542c6a01cb201a4b0de650b6d8 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sun, 1 Jul 2012 12:08:08 -0700
Subject: [PATCH 415/434] 1. Rename util functions to is_true and is_false 2.
 Move the config loading functions to where they are used (in stages) 3.
 Adjust cc_set_passwords to use the is_true and is_false renamed functions 4.
 Adjust the init stage to have a _read_base_config function used to load   
 the base 'initial' configuration from the following locations    a. Kernel
 cmdline    b. Conf.d location (+ the cloud.cfg location)    c. Built-in
 configuration

---
 cloudinit/config/cc_set_passwords.py |  4 +-
 cloudinit/stages.py                  | 27 ++++++++++----
 cloudinit/util.py                    | 56 ++++++++--------------------
 3 files changed, 37 insertions(+), 50 deletions(-)

diff --git a/cloudinit/config/cc_set_passwords.py b/cloudinit/config/cc_set_passwords.py
index 5b72224b..ab266741 100644
--- a/cloudinit/config/cc_set_passwords.py
+++ b/cloudinit/config/cc_set_passwords.py
@@ -96,9 +96,9 @@ def handle(_name, cfg, cloud, log, args):
     pw_auth = None
     if 'ssh_pwauth' in cfg:
         change_pwauth = True
-        if util.is_true_str(cfg['ssh_pwauth']):
+        if util.is_true(cfg['ssh_pwauth']):
             pw_auth = 'yes'
-        if util.is_false_str(cfg['ssh_pwauth']):
+        if util.is_false(cfg['ssh_pwauth']):
             pw_auth = 'no'
 
     if change_pwauth:
diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 2f175934..79663b27 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -26,7 +26,7 @@ import copy
 import os
 import sys
 
-from cloudinit.settings import (PER_INSTANCE, FREQUENCIES)
+from cloudinit.settings import (PER_INSTANCE, FREQUENCIES, CLOUD_CONFIG)
 
 from cloudinit import handlers
 
@@ -146,16 +146,27 @@ class Init(object):
             self._cfg = self._read_cfg(extra_fns)
             # LOG.debug("Loaded 'init' config %s", self._cfg)
 
+    def _read_base_cfg(self):
+        base_cfgs = []
+        default_cfg = util.get_builtin_cfg()
+        kern_contents = util.read_cc_from_cmdline()
+        # Kernel/cmdline parameters override system config
+        if kern_contents:
+            base_cfgs.append(util.load_yaml(kern_contents, default={}))
+        # Anything in your conf.d location??
+        if os.path.isfile(CLOUD_CONFIG):
+            base_cfgs.append(util.read_conf_with_confd(CLOUD_CONFIG))
+        # And finally the default gets to play
+        if default_cfg:
+            base_cfgs.append(default_cfg)
+        return util.mergemanydict(base_cfgs)
+
     def _read_cfg(self, extra_fns):
-        try:
-            base_conf = util.get_base_cfg(builtin=util.get_builtin_cfg())
-        except Exception:
-            base_conf = util.get_builtin_cfg()
-        no_cfg_pths = helpers.Paths({}, self.datasource)
-        merger = helpers.ConfigMerger(paths=no_cfg_pths,
+        no_cfg_paths = helpers.Paths({}, self.datasource)
+        merger = helpers.ConfigMerger(paths=no_cfg_paths,
                                       datasource=self.datasource,
                                       additional_fns=extra_fns,
-                                      base_cfg=base_conf)
+                                      base_cfg=self._read_base_cfg())
         return merger.cfg
 
     def _restore_from_cache(self):
diff --git a/cloudinit/util.py b/cloudinit/util.py
index 0c592656..f07d22e7 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -50,7 +50,7 @@ from cloudinit import importer
 from cloudinit import log as logging
 from cloudinit import url_helper as uhelp
 
-from cloudinit.settings import (CFG_BUILTIN, CLOUD_CONFIG)
+from cloudinit.settings import (CFG_BUILTIN)
 
 
 LOG = logging.getLogger(__name__)
@@ -192,7 +192,9 @@ def fork_cb(child_cb, *args):
                   fid, obj_name(child_cb))
 
 
-def is_true_str(val, addons=None):
+def is_true(val, addons=None):
+    if isinstance(val, (bool)):
+        return val is True
     check_set = ['true', '1', 'on', 'yes']
     if addons:
         check_set = check_set + addons
@@ -201,7 +203,9 @@ def is_true_str(val, addons=None):
     return False
 
 
-def is_false_str(val, addons=None):
+def is_false(val, addons=None):
+    if isinstance(val, (bool)):
+        return val is False
     check_set = ['off', '0', 'no', 'false']
     if addons:
         check_set = check_set + addons
@@ -218,7 +222,7 @@ def translate_bool(val, addons=None):
     # If its already a boolean skip
     if isinstance(val, (bool)):
         return val
-    return is_true_str(val, addons)
+    return is_true(val, addons)
 
 
 def rand_str(strlen=32, select_from=None):
@@ -285,29 +289,6 @@ def is_ipv4(instr):
     return (len(toks) == 4)
 
 
-def merge_base_cfg(cfgfile, cfg_builtin=None):
-    syscfg = read_conf_with_confd(cfgfile)
-
-    kern_contents = read_cc_from_cmdline()
-    kerncfg = {}
-    if kern_contents:
-        kerncfg = load_yaml(kern_contents, default={})
-
-    # Kernel parameters override system config
-    if kerncfg:
-        combined = mergedict(kerncfg, syscfg)
-    else:
-        combined = syscfg
-
-    if cfg_builtin:
-        # Combined over-ride anything builtin
-        fin = mergedict(combined, cfg_builtin)
-    else:
-        fin = combined
-
-    return fin
-
-
 def get_cfg_option_bool(yobj, key, default=False):
     if key not in yobj:
         return default
@@ -622,15 +603,17 @@ def read_seeded(base="", ext="", timeout=5, retries=10, file_retries=0):
 
 
 def read_conf_d(confd):
-    # get reverse sorted list (later trumps newer)
+    # Get reverse sorted list (later trumps newer)
     confs = sorted(os.listdir(confd), reverse=True)
 
-    # remove anything not ending in '.cfg'
+    # Remove anything not ending in '.cfg'
     confs = [f for f in confs if f.endswith(".cfg")]
 
-    # remove anything not a file
-    confs = [f for f in confs if os.path.isfile(os.path.join(confd, f))]
+    # Remove anything not a file
+    confs = [f for f in confs
+             if os.path.isfile(os.path.join(confd, f))]
 
+    # Load them all so that they can be merged
     cfgs = []
     for fn in confs:
         cfgs.append(read_conf(os.path.join(confd, fn)))
@@ -658,7 +641,8 @@ def read_conf_with_confd(cfgfile):
         return cfg
 
     # Conf.d settings override input configuration
-    return mergedict(read_conf_d(confd), cfg)
+    confd_cfg = read_conf_d(confd)
+    return mergedict(confd_cfg, cfg)
 
 
 def read_cc_from_cmdline(cmdline=None):
@@ -1076,14 +1060,6 @@ def ensure_dir(path, mode=None):
         chmod(path, mode)
 
 
-def get_base_cfg(cfg_path=None, builtin=None):
-    if not cfg_path:
-        cfg_path = CLOUD_CONFIG
-    if not builtin:
-        builtin = get_builtin_cfg()
-    return merge_base_cfg(cfg_path, builtin)
-
-
 @contextlib.contextmanager
 def unmounter(umount):
     try:

From d8005335ca0555b493eb430f5bd08c41aa410cbe Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sun, 1 Jul 2012 12:11:21 -0700
Subject: [PATCH 416/434] Always read from the cloud config location + conf.d
 locations

---
 cloudinit/stages.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/cloudinit/stages.py b/cloudinit/stages.py
index 79663b27..8fd6aa5d 100644
--- a/cloudinit/stages.py
+++ b/cloudinit/stages.py
@@ -154,8 +154,8 @@ class Init(object):
         if kern_contents:
             base_cfgs.append(util.load_yaml(kern_contents, default={}))
         # Anything in your conf.d location??
-        if os.path.isfile(CLOUD_CONFIG):
-            base_cfgs.append(util.read_conf_with_confd(CLOUD_CONFIG))
+        # or the 'default' cloud.cfg location???
+        base_cfgs.append(util.read_conf_with_confd(CLOUD_CONFIG))
         # And finally the default gets to play
         if default_cfg:
             base_cfgs.append(default_cfg)

From b6739d04dcd683ec868ab15df1ee3d406e078504 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sun, 1 Jul 2012 12:43:33 -0700
Subject: [PATCH 417/434] Add a nova/openstack based extension to pep8 via
 hacking.py

---
 tools/hacking.py | 175 +++++++++++++++++++++++++++++++++++++++++++++++
 tools/run-pep8   |  13 +++-
 2 files changed, 185 insertions(+), 3 deletions(-)
 create mode 100755 tools/hacking.py

diff --git a/tools/hacking.py b/tools/hacking.py
new file mode 100755
index 00000000..d0c27d25
--- /dev/null
+++ b/tools/hacking.py
@@ -0,0 +1,175 @@
+#!/usr/bin/env python
+# vim: tabstop=4 shiftwidth=4 softtabstop=4
+
+# Copyright (c) 2012, Cloudscaling
+# All Rights Reserved.
+#
+#    Licensed under the Apache License, Version 2.0 (the "License"); you may
+#    not use this file except in compliance with the License. You may obtain
+#    a copy of the License at
+#
+#         http://www.apache.org/licenses/LICENSE-2.0
+#
+#    Unless required by applicable law or agreed to in writing, software
+#    distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
+#    WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
+#    License for the specific language governing permissions and limitations
+#    under the License.
+
+"""cloudinit HACKING file compliance testing (based off of nova hacking.py)
+
+built on top of pep8.py
+"""
+
+import inspect
+import logging
+import os
+import re
+import sys
+import tokenize
+import warnings
+
+import pep8
+
+# Silence all logging while linting; disable() expects a numeric level
+logging.disable(logging.CRITICAL)
+
+# N1xx comments
+# N2xx except
+# N3xx imports
+# N4xx docstrings
+# N[5-9]XX (future use)
+
+DOCSTRING_TRIPLE = ['"""', "'''"]
+VERBOSE_MISSING_IMPORT = False
+_missingImport = set([])
+
+
+def import_normalize(line):
+    """Rewrite 'from x import y [as z]' as 'import x.y'; else return line."""
+    # Physical lines inside docstrings/comments may start with "from " yet
+    # hold fewer than four words, so check the length before indexing.
+    split_line = line.split()
+    if (line.startswith("from ") and "," not in line and
+           len(split_line) in (4, 6) and
+           split_line[2] == "import" and split_line[3] != "*" and
+           split_line[1] != "__future__" and
+           (len(split_line) == 4 or split_line[4] == "as")):
+        return "import %s.%s" % (split_line[1], split_line[3])
+    return line
+
+
+def cloud_import_alphabetical(physical_line, line_number, lines):
+    """Check for imports in alphabetical order.
+
+    HACKING guide recommendation for imports:
+    imports in human alphabetical order
+    N306
+    """
+    # use .lower since capitalization shouldn't dictate order; line 1 has no
+    # predecessor (index -1 would wrap around to the last line of the file)
+    split_line = import_normalize(physical_line.strip()).lower().split()
+    previous = lines[line_number - 2] if line_number > 1 else ""
+    split_previous = import_normalize(previous).strip().lower().split()
+    # with or without "as y"
+    length = [2, 4]
+    if (len(split_line) in length and len(split_previous) in length and
+        split_line[0] == "import" and split_previous[0] == "import"):
+        if split_line[1] < split_previous[1]:
+            return (0, "N306: imports not in alphabetical order (%s, %s)"
+                % (split_previous[1], split_line[1]))
+
+
+def cloud_docstring_start_space(physical_line):
+    """Check that a docstring does not start with a space.
+
+    HACKING guide recommendation for docstring:
+    Docstring should not start with space
+    N401
+    """
+    pos = max([physical_line.find(i) for i in DOCSTRING_TRIPLE])  # start
+    if (pos != -1 and len(physical_line) > pos + 3):  # a char follows quotes
+        if (physical_line[pos + 3] == ' '):
+            return (pos, "N401: one line docstring should not start with"
+                " a space")
+
+
+def cloud_todo_format(physical_line):
+    """Check that a TODO in a comment names its owner.
+
+    HACKING guide recommendation for TODO:
+    Include your name with TODOs as in "#TODO(termie)"
+    N101
+    """
+    todo_at = physical_line.find('TODO')
+    named_todo_at = physical_line.find('TODO(')
+    hash_at = physical_line.find('#')  # make sure it's a comment
+    if 0 <= hash_at < todo_at and todo_at != named_todo_at:
+        return todo_at, "N101: Use TODO(NAME)"
+
+
+def cloud_docstring_one_line(physical_line):
+    """Check that a one line docstring ends in a period.
+
+    HACKING guide recommendation for one line docstring:
+    A one line docstring looks like this and ends in a period.
+    N402
+    """
+    start = max([physical_line.find(q) for q in DOCSTRING_TRIPLE])
+    closes = physical_line[-4:-1] in DOCSTRING_TRIPLE  # quotes before newline
+    if start != -1 and closes and len(physical_line) > start + 4:
+        if physical_line[-5] != '.':
+            return start, "N402: one line docstring needs a period"
+
+
+def cloud_docstring_multiline_end(physical_line):
+    """Check multi line docstring end.
+
+    HACKING guide recommendation for docstring:
+    Docstring should end on a new line
+    N403
+    """
+    pos = max([physical_line.find(i) for i in DOCSTRING_TRIPLE])  # start
+    if (pos != -1 and len(physical_line) == pos):
+        # NOTE(review): unreachable as written, find() is always < len()
+        if (physical_line[pos + 3] == ' '):
+            return (pos, "N403: multi line docstring end on new line")
+
+
+current_file = ""
+
+
+def readlines(filename):
+    """Record the current file being tested and return its lines."""
+    pep8.current_file = filename
+    with open(filename) as fh:
+        return fh.readlines()
+
+
+def add_cloud():
+    """Monkey patch pep8 for cloud-init guidelines.
+
+    Look for functions that start with cloud_
+    and add them to pep8 module.
+
+    Assumes you know how to write pep8.py checks
+    """
+    for name, function in globals().items():
+        if not inspect.isfunction(function):
+            continue
+        if name.startswith("cloud_"):
+            setattr(pep8, name, function)
+
+if __name__ == "__main__":
+    # Widen pep8's error-code pattern so the nova-style N### codes match too
+    pep8.ERRORCODE_REGEX = re.compile(r'[EWN]\d{3}')
+    add_cloud()
+    pep8.current_file = current_file
+    pep8.readlines = readlines
+    try:
+        pep8._main()
+    finally:  # nothing in this file adds to _missingImport, so this is inert
+        if len(_missingImport) > 0:
+            print >> sys.stderr, ("%i imports missing in this test environment"
+                    % len(_missingImport))
+
diff --git a/tools/run-pep8 b/tools/run-pep8
index e7707985..ea46c117 100755
--- a/tools/run-pep8
+++ b/tools/run-pep8
@@ -12,17 +12,24 @@ if [ $# -eq 0 ]; then
    done
 else
    files=( "$@" );
-fi 
+fi
+
+if [ -f 'hacking.py' ]
+then
+    base=`pwd`
+else
+    base=`pwd`/tools/
+fi
 
 cmd=(
-    pep8
+    ${base}/hacking.py
 
     --ignore=E501 # Line too long (these are caught by pylint)
 
     "${files[@]}"
 )
 
-echo -e "\nRunning pep8:"
+echo -e "\nRunning 'cloudinit' pep8:"
 echo "${cmd[@]}"
 "${cmd[@]}"
 

From 3cee0d84e9ffd8f6c23094227865e686cfbbd587 Mon Sep 17 00:00:00 2001
From: harlowja <harlowja@virtualbox.rhel>
Date: Sun, 1 Jul 2012 12:48:51 -0700
Subject: [PATCH 418/434] Adjust the changelog after adding 'hacking.py'

---
 ChangeLog | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/ChangeLog b/ChangeLog
index ecac7888..c3f71b9c 100644
--- a/ChangeLog
+++ b/ChangeLog
@@ -188,6 +188,9 @@
    enable checking of urls against a cache, if later a #include was encountered
    it would continue checking against that cache, instead of refetching (which
    would likely be the expected case)
+ - add a openstack/nova based pep8 extension utility ('hacking.py') that allows
+   for custom checks (along with the standard pep8 checks) to occur when running
+   'make pep8' and its derivatives
 0.6.4:
  - support relative path in AuthorizedKeysFile (LP: #970071).
  - make apt-get update run with --quiet (suitable for logging) (LP: #1012613)

From 2d960203854a91574628fdc91e35abedca51420a Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 2 Jul 2012 10:56:22 -0700
Subject: [PATCH 419/434] 1. Move the welcome message template string to a
 constant at the top of the module 2. Fix the usage of multi_log to log to
 only one of the places (for now) 3. Update comment about multi-log and why
 write_file isn't used in this case

---
 bin/cloud-init                         | 11 ++++++++---
 cloudinit/config/cc_final_message.py   |  3 ++-
 cloudinit/config/cc_keys_to_console.py |  3 ++-
 cloudinit/util.py                      |  7 +++++--
 4 files changed, 17 insertions(+), 7 deletions(-)

diff --git a/bin/cloud-init b/bin/cloud-init
index fce4fe8c..c7863db1 100755
--- a/bin/cloud-init
+++ b/bin/cloud-init
@@ -45,6 +45,10 @@ from cloudinit.settings import (PER_INSTANCE, PER_ALWAYS, PER_ONCE,
                                 CLOUD_CONFIG)
 
 
+# Pretty little welcome message template
+WELCOME_MSG_TPL = ("Cloud-init v. {{version}} running '{{action}}' at "
+                   "{{timestamp}}. Up {{uptime}} seconds.")
+
 # Module section template
 MOD_SECTION_TPL = "cloud_%s_modules"
 
@@ -56,6 +60,7 @@ QUERY_DATA_TYPES = [
 ]
 
 # Frequency shortname to full name
+# (so users don't have to remember the full name...)
 FREQ_SHORT_NAMES = {
     'instance': PER_INSTANCE,
     'always': PER_ALWAYS,
@@ -78,15 +83,15 @@ def print_exc(msg=''):
 
 
 def welcome(action):
-    msg = ("Cloud-init v. {{version}} running '{{action}}' at "
-           "{{timestamp}}. Up {{uptime}} seconds.")
     tpl_params = {
         'version': version.version_string(),
         'uptime': util.uptime(),
         'timestamp': util.time_rfc2822(),
         'action': action,
     }
-    util.multi_log("%s\n" % (templater.render_string(msg, tpl_params)))
+    tpl_msg = templater.render_string(WELCOME_MSG_TPL, tpl_params)
+    util.multi_log("%s\n" % (tpl_msg),
+                   console=False, stderr=True)
 
 
 def extract_fns(args):
diff --git a/cloudinit/config/cc_final_message.py b/cloudinit/config/cc_final_message.py
index 711e7b5b..b1caca47 100644
--- a/cloudinit/config/cc_final_message.py
+++ b/cloudinit/config/cc_final_message.py
@@ -55,7 +55,8 @@ def handle(_name, cfg, cloud, log, args):
             'timestamp': ts,
             'version': cver,
         }
-        util.multi_log("%s\n" % (templater.render_string(msg_in, subs)))
+        util.multi_log("%s\n" % (templater.render_string(msg_in, subs)),
+                       console=False, stderr=True)
     except Exception:
         util.logexc(log, "Failed to render final message template")
 
diff --git a/cloudinit/config/cc_keys_to_console.py b/cloudinit/config/cc_keys_to_console.py
index da7d5219..ed7af690 100644
--- a/cloudinit/config/cc_keys_to_console.py
+++ b/cloudinit/config/cc_keys_to_console.py
@@ -46,7 +46,8 @@ def handle(name, cfg, _cloud, log, _args):
         cmd.append(','.join(fp_blacklist))
         cmd.append(','.join(key_blacklist))
         (stdout, _stderr) = util.subp(cmd)
-        util.multi_log("%s\n" % (stdout.strip()), stderr=False)
+        util.multi_log("%s\n" % (stdout.strip()),
+                       stderr=False, console=True)
     except:
         log.warn("Writing keys to the system console failed!")
         raise
diff --git a/cloudinit/util.py b/cloudinit/util.py
index 6b23a0ee..4c29432b 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -275,15 +275,18 @@ def find_modules(root_dir):
     return entries
 
 
-def multi_log(text, console=True, stderr=True, log=None):
+def multi_log(text, console=True, stderr=True,
+              log=None, log_level=logging.DEBUG):
     if stderr:
         sys.stderr.write(text)
     if console:
+        # Don't use the write_file since
+        # this might be 'sensitive' info (not debug worthy?)
         with open('/dev/console', 'wb') as wfh:
             wfh.write(text)
             wfh.flush()
     if log:
-        log.debug(text)
+        log.log(log_level, text)
 
 
 def is_ipv4(instr):

From 545fd9c3b997850b1e4f106a7986142d53d42ae8 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 2 Jul 2012 15:40:51 -0700
Subject: [PATCH 420/434] 1. Fixup the setup.py to not include custom startup
 scripts, let the packaging solutions handle these 2. Get the cloud-init
 specfile working for the init.d case (with the right postun and post and
 install sections)    a. It works!!!

---
 packages/brpm                   | 104 +++----------------
 packages/redhat/cloud-init.spec | 177 +++++++++++++++++++++++++++-----
 setup.py                        |   8 --
 3 files changed, 169 insertions(+), 120 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index bbf30565..3abd9f15 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -71,6 +71,7 @@ def get_log_header(version):
 
 
 def format_change_line(ds, who, comment=None):
+    # Rpmbuild seems to be pretty strict about the date format
     d = ds.strftime("%a %b %d %Y")
     d += " - %s" % (who)
     if comment:
@@ -134,104 +135,31 @@ def generate_spec_contents(args, tmpl_fn):
             changelog_lines.append(line)
     subs['changelog'] = "\n".join(changelog_lines)
 
-    # See: http://www.zarb.org/~jasonc/macros.php
-    # Pickup any special files
-    docs = [
-        'TODO',
-        'LICENSE',
-        'ChangeLog',
-        'Requires',
-        '%{_defaultdocdir}/cloud-init/*',
-    ]
-    subs['docs'] = docs
-    configs = [
-        'cloud/cloud.cfg',
-        'cloud/cloud.cfg.d/*.cfg',
-        'cloud/cloud.cfg.d/README',
-        'cloud/templates/*',
-    ]
-    subs['configs'] = configs
-    other_files = [
-        '%{_bindir}/*',
-        '/usr/lib/cloud-init/*',
-    ]
+    if args.boot == 'initd':
+        subs['init_d'] = True
+        subs['init_d_local'] = False
+    elif args.boot == 'initd-local':
+        subs['init_d'] = True
+        subs['init_d_local'] = True
+    else:
+        subs['init_d'] = False
+        subs['init_d_local'] = False
+
+    if args.boot == 'systemd':
+        subs['systemd'] = True
+    else:
+        subs['systemd'] = False
 
-    # Since setup.py installs them all, we need to selectively
-    # remove the wrong ones and ensure the right one/s are kept
-    # for the boot mode that is desired...
-    boot_remove = { 
-        'initd': [
-            '/etc/init.d/cloud-init-local',
-            # Remove the other auto-start folders
-            '/etc/systemd/',
-            '/etc/init/',
-        ],
-        'initd-local': [
-            '/etc/init.d/cloud-init',
-            # Remove the other auto-start folders
-            '/etc/systemd/',
-            '/etc/init/',
-        ],
-        # It seems like systemd can work with
-        # all of its files being 'active' (and not have naming
-        # or event name conflicts??)
-        'systemd': [
-            # Remove the other auto-start folders
-            '/etc/init.d/',
-            '/etc/init/',
-        ],
-        'upstart': [
-            '/etc/init/cloud-init-nonet.conf',
-            '/etc/init/cloud-init-local.conf',
-            # Remove the other auto-start folders
-            '/etc/init.d/',
-            '/etc/systemd/',
-        ],
-        'upstart-local': [
-            '/etc/init/cloud-init.conf',
-            # Remove the other auto-start folders
-            '/etc/init.d/',
-            '/etc/systemd/',
-        ]
-    }
-    boot_keep = {
-        'systemd': [
-            '/etc/systemd/*',
-        ],
-        'upstart': [
-            '/etc/init/*',
-        ],
-        'upstart-local': [
-            '/etc/init/*',
-        ],
-        'initd-local': [
-            '/etc/init.d/*',
-        ],
-        'initd': [
-            '/etc/init.d/*',
-        ],
-    }
-    subs['post_remove'] = boot_remove[args.boot]
-    other_files.extend(boot_keep[args.boot])
-    subs['files'] = other_files
     return templater.render_from_file(tmpl_fn, params=subs)
 
 
-def archive_code():
-    (stdout, _stderr) = tiny_p([sys.executable, 
-                               join(os.getcwd(), 'make-tarball')])
-    (revno, version, bname, arc_fn) = stdout.split(None)
-    return (revno, version, arc_fn)
-
-
 def main():
     
     parser = argparse.ArgumentParser()
     parser.add_argument("-b", "--boot", dest="boot",
                         help="select boot type (default: %(default)s)", 
                         metavar="TYPE", default='initd',
-                        choices=('upstart', 'initd', 'systemd',
-                                 'upstart-local', 'initd-local'))
+                        choices=('initd', 'systemd', 'initd-local'))
     parser.add_argument("-v", "--verbose", dest="verbose",
                         help=("run verbosely"
                               " (default: %(default)s)"),
diff --git a/packages/redhat/cloud-init.spec b/packages/redhat/cloud-init.spec
index ddb6617d..e9ce087a 100644
--- a/packages/redhat/cloud-init.spec
+++ b/packages/redhat/cloud-init.spec
@@ -1,5 +1,9 @@
 %{!?python_sitelib: %global python_sitelib %(%{__python} -c "from distutils.sysconfig import get_python_lib; print get_python_lib()")}
 
+# See: See: http://www.zarb.org/~jasonc/macros.php
+# Or: http://fedoraproject.org/wiki/Packaging:ScriptletSnippets
+# Or: http://www.rpm.org/max-rpm/ch-rpm-inside.html
+
 Name:           cloud-init
 Version:        {{version}}
 Release:        {{release}}%{?dist}
@@ -10,27 +14,45 @@ License:        GPLv3
 URL:            http://launchpad.net/cloud-init
 
 Source0:        {{archive_name}}
-
 BuildArch:      noarch
-
 BuildRoot:      %{_tmppath}
 
+BuildRequires:        python-devel
+BuildRequires:        python-setuptools
 
-{{for r in bd_requires}}
-BuildRequires: {{r}}
-{{endfor}}
+# System util packages needed
+Requires:       shadow-utils
+Requires:       rsyslog
+Requires:       iproute
+Requires:       e2fsprogs
+Requires:       net-tools
+Requires:       procps
+Requires:       shadow-utils
 
-# Install requirements
+# Install pypi 'dynamic' requirements
 {{for r in requires}}
-Requires: {{r}}
+Requires:       {{r}}
 {{endfor}}
 
+{{if init_d}}
+Requires(post):       chkconfig
+Requires(postun):     initscripts
+Requires(preun):      chkconfig
+Requires(preun):      initscripts
+{{endif}}
+
+{{if systemd}}
+BuildRequires:  systemd-units
+Requires(post):   systemd-units
+Requires(postun): systemd-units
+Requires(preun):  systemd-units
+{{endif}}
+
 %description
 Cloud-init is a set of init scripts for cloud instances.  Cloud instances
 need special scripts to run during initialization to retrieve and install
 ssh keys and to let the user run various scripts.
 
-
 %prep
 %setup -q -n %{name}-%{version}-{{revno}}
 
@@ -41,32 +63,139 @@ ssh keys and to let the user run various scripts.
 rm -rf $RPM_BUILD_ROOT
 %{__python} setup.py install -O1 --skip-build --root $RPM_BUILD_ROOT
 
-# Remove anything after it was installed??
-{{for r in post_remove}}
-rm -rfv $RPM_BUILD_ROOT/{{r}}
-{{endfor}}
+# Note that /etc/rsyslog.d didn't exist by default until F15.
+# el6 request: https://bugzilla.redhat.com/show_bug.cgi?id=740420
+mkdir -p $RPM_BUILD_ROOT/%{_sysconfdir}/rsyslog.d
+cp -p tools/21-cloudinit.conf \
+                    $RPM_BUILD_ROOT/%{_sysconfdir}/rsyslog.d/21-cloudinit.conf
+
+{{if init_d}}
+mkdir -p $RPM_BUILD_ROOT/%{_initddir}/
+{{endif}}
+{{if init_d_local}}
+cp -p initd/cloud-init-local $RPM_BUILD_ROOT/%{_initddir}/
+cp -p initd/cloud-config $RPM_BUILD_ROOT/%{_initddir}/
+cp -p initd/cloud-final $RPM_BUILD_ROOT/%{_initddir}/
+{{elif init_d}}
+cp -p initd/cloud-init $RPM_BUILD_ROOT/%{_initddir}/
+cp -p initd/cloud-config $RPM_BUILD_ROOT/%{_initddir}/
+cp -p initd/cloud-final $RPM_BUILD_ROOT/%{_initddir}/
+{{endif}}
+
+{{if systemd}}
+mkdir -p        $RPM_BUILD_ROOT/%{_unitdir}
+cp -p systemd/* $RPM_BUILD_ROOT/%{_unitdir}
+{{endif}}
 
 %clean
 rm -rf $RPM_BUILD_ROOT
 
+%post
+
+{{if systemd}}
+if [ $1 -eq 1 ]
+then
+    /bin/systemctl enable cloud-config.service     >/dev/null 2>&1 || :
+    /bin/systemctl enable cloud-final.service      >/dev/null 2>&1 || :
+    /bin/systemctl enable cloud-init.service       >/dev/null 2>&1 || :
+    /bin/systemctl enable cloud-init-local.service >/dev/null 2>&1 || :
+fi
+{{endif}}
+
+{{if init_d_local}}
+/sbin/chkconfig --add /etc/rc.d/init.d/cloud-init-local
+{{elif init_d}}
+/sbin/chkconfig --add /etc/rc.d/init.d/cloud-init
+{{endif}}
+{{if init_d}}
+/sbin/chkconfig --add /etc/rc.d/init.d/cloud-config
+/sbin/chkconfig --add /etc/rc.d/init.d/cloud-final
+{{endif}}
+
+%preun
+
+{{if init_d_local}}
+if [ $1 -eq 0 ]
+then
+    /sbin/service cloud-init-local stop >/dev/null 2>&1
+    /sbin/chkconfig --del cloud-init-local
+fi
+{{elif init_d}}
+if [ $1 -eq 0 ]
+then
+    /sbin/service cloud-init stop >/dev/null 2>&1
+    /sbin/chkconfig --del cloud-init
+fi
+{{endif}}
+{{if init_d}}
+if [ $1 -eq 0 ]
+then
+    /sbin/service cloud-config stop >/dev/null 2>&1
+    /sbin/chkconfig --del cloud-config
+    /sbin/service cloud-final stop >/dev/null 2>&1
+    /sbin/chkconfig --del cloud-final
+fi
+{{endif}}
+
+{{if systemd}}
+if [ $1 -eq 0 ]
+then
+    /bin/systemctl --no-reload disable cloud-config.service >/dev/null 2>&1 || :
+    /bin/systemctl --no-reload disable cloud-final.service  >/dev/null 2>&1 || :
+    /bin/systemctl --no-reload disable cloud-init.service   >/dev/null 2>&1 || :
+    /bin/systemctl --no-reload disable cloud-init-local.service >/dev/null 2>&1 || :
+fi
+{{endif}}
+
+%postun
+
+{{if systemd}}
+/bin/systemctl daemon-reload >/dev/null 2>&1 || :
+{{endif}}
+
 %files
 
+{{if init_d}}
+%attr(0755, root, root) %{_initddir}/cloud-config
+%attr(0755, root, root) %{_initddir}/cloud-final
+{{endif}}
+{{if init_d_local}}
+%attr(0755, root, root) %{_initddir}/cloud-init-local
+{{elif init_d}}
+%attr(0755, root, root) %{_initddir}/cloud-init
+{{endif}}
+
+{{if systemd}}
+%{_unitdir}/cloud-config.service
+%{_unitdir}/cloud-config.target
+%{_unitdir}/cloud-init.service
+%{_unitdir}/cloud-init-local.service
+%{_unitdir}/cloud-final.service
+{{endif}}
+
+# Program binaries
+%{_bindir}/cloud-init*
+
+# There doesn't seem to be an agreed upon place for these
+# although it appears the standard says /usr/lib but rpmbuild
+# will try /usr/lib64 ??
+/usr/lib/%{name}/uncloud-init
+/usr/lib/%{name}/write-ssh-key-fingerprints
+
 # Docs
-{{for r in docs}}
-%doc {{r}}
-{{endfor}}
+%doc TODO LICENSE ChangeLog Requires
+%doc %{_defaultdocdir}/cloud-init/*
 
 # Configs
-{{for r in configs}}
-%config(noreplace) %{_sysconfdir}/{{r}}
-{{endfor}}
+%config(noreplace)      %{_sysconfdir}/cloud/cloud.cfg
+%dir                    %{_sysconfdir}/cloud/cloud.cfg.d
+%config(noreplace)      %{_sysconfdir}/cloud/cloud.cfg.d/*.cfg
+%config(noreplace)      %{_sysconfdir}/cloud/cloud.cfg.d/README
+%dir                    %{_sysconfdir}/cloud/templates
+%config(noreplace)      %{_sysconfdir}/cloud/templates/*
+%config(noreplace) %{_sysconfdir}/rsyslog.d/21-cloudinit.conf
 
-# Other files
-{{for r in files}}
-{{r}}
-{{endfor}}
-
-# Python sitelib
+# Python code is here...
 %{python_sitelib}/*
 
 %changelog
diff --git a/setup.py b/setup.py
index 810ebb48..d6253384 100755
--- a/setup.py
+++ b/setup.py
@@ -76,20 +76,12 @@ setuptools.setup(name='cloud-init',
       data_files=[('/etc/cloud', glob('config/*.cfg')),
                   ('/etc/cloud/cloud.cfg.d', glob('config/cloud.cfg.d/*')),
                   ('/etc/cloud/templates', glob('templates/*')),
-                  # Only really need for upstart based systems
-                  ('/etc/init', glob('upstart/*.conf')),
-                  # Only really need for systemd based systems
-                  ('/etc/systemd/system', glob('systemd/*.service')),
-                  # Only really need for init.d based system
-                  ('/etc/init.d', glob('initd/*')),
                   ('/usr/share/cloud-init', []),
                   ('/usr/lib/cloud-init',
                     ['tools/uncloud-init', 'tools/write-ssh-key-fingerprints']),
                   ('/usr/share/doc/cloud-init', filter(is_f, glob('doc/*'))),
                   ('/usr/share/doc/cloud-init/examples', filter(is_f, glob('doc/examples/*'))),
                   ('/usr/share/doc/cloud-init/examples/seed', filter(is_f, glob('doc/examples/seed/*'))),
-                  # ??
-                  # ('/etc/profile.d', ['tools/Z99-cloud-locale-test.sh']),
                   ],
       install_requires=read_requires(),
       )

From fd563c173cf9bf3fb57c2c2a1e0062b1efe0c114 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 2 Jul 2012 18:43:54 -0700
Subject: [PATCH 421/434] Add a sample yaml config to be used for testing.

---
 tests/configs/sample1.yaml | 53 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 53 insertions(+)
 create mode 100644 tests/configs/sample1.yaml

diff --git a/tests/configs/sample1.yaml b/tests/configs/sample1.yaml
new file mode 100644
index 00000000..24e874ee
--- /dev/null
+++ b/tests/configs/sample1.yaml
@@ -0,0 +1,53 @@
+#cloud-config
+#apt_update: false
+#apt_upgrade: true
+packages: [ bzr, pastebinit, ubuntu-dev-tools, ccache, bzr-builddeb, vim-nox, git-core, lftp ]
+
+#apt_sources:
+# - source: ppa:smoser/ppa
+
+#disable_root: False
+
+# mounts:
+#  - [ ephemeral0, /mnt ]
+#  - [ swap, none, swap, sw, 0, 0 ]
+
+ssh_import_id: [smoser ]
+
+#!/bin/sh
+
+output: {all: '| tee -a /var/log/cloud-init-output.log'}
+
+sm_misc:
+ - &user_setup |
+   set -x; exec > ~/user_setup.log 2>&1
+   echo "starting at $(date -R)"
+   echo "set -o vi" >> ~/.bashrc
+   cat >> ~/.profile <<"EOF"
+   export EDITOR=vi
+   export DEB_BUILD_OPTIONS=parallel=4
+   export PATH=/usr/lib/ccache:$PATH
+   EOF
+
+   mkdir ~/bin
+   chmod 755 ~/bin
+   cat > ~/bin/mdebuild <<"EOF"
+   #!/bin/sh
+   exec debuild --prepend-path /usr/lib/ccache "$@"
+   EOF
+   chmod 755 ~/bin/*
+
+   #byobu-launcher-install
+   byobu-ctrl-a screen 2>&1 || :
+
+   echo "pinging 8.8.8.8"
+   ping -c 4 8.8.8.8
+
+runcmd:
+ - [ sudo, -Hu, ubuntu, sh, -c, '[ -e /var/log/cloud-init.log ] || exit 0; grep "cloud-init.*running" /var/log/cloud-init.log > ~/runcmd.log' ]
+ - [ sudo, -Hu, ubuntu, sh, -c, 'read up sleep < /proc/uptime; echo $(date): runcmd up at $up | tee -a ~/runcmd.log' ]
+ - [ sudo, -Hu, ubuntu, sh, -c, *user_setup ]
+ 
+
+byobu_by_default: user
+output: {all: '| tee -a /var/log/cloud-init-output.log'}

From 739a994cda7ea97dd1062af1186c9767b4de555f Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 2 Jul 2012 19:02:16 -0700
Subject: [PATCH 422/434] Update the mock metadata server to return a file (or
 the default generated content) for the userdata blob.

---
 tools/mock-meta.py | 27 ++++++++++++++++++++-------
 1 file changed, 20 insertions(+), 7 deletions(-)

diff --git a/tools/mock-meta.py b/tools/mock-meta.py
index 0f13acd6..8a73b43c 100755
--- a/tools/mock-meta.py
+++ b/tools/mock-meta.py
@@ -196,18 +196,26 @@ class UserDataHandler(object):
         self.opts = opts
 
     def _get_user_blob(self, **kwargs):
-        blob_mp = {}
-        blob_mp['hostname'] = kwargs.get('who', '')
-        lines = []
-        lines.append("#cloud-config")
-        lines.append(yamlify(blob_mp))
-        blob = "\n".join(lines)
+        blob = None
+        if self.opts['user_data_file']:
+            with open(opts['user_data_file'], 'rb') as fh:
+                blob = fh.read()
+                blob = blob.strip()
+        if not blob:
+            blob_mp = {
+                'hostname': kwargs.get('who', 'localhost'),
+            }
+            lines = [
+                "#cloud-config",
+                yamlify(blob_mp),
+            ]
+            blob = "\n".join(lines)
         return blob.strip()
 
     def get_data(self, params, who, **kwargs):
         if not params:
             return self._get_user_blob(who=who)
-        return ''
+        return NOT_IMPL_RESPONSE
 
 
 # Seem to need to use globals since can't pass 
@@ -303,10 +311,15 @@ def extract_opts():
     parser = OptionParser()
     parser.add_option("-p", "--port", dest="port", action="store", type=int, default=80,
                   help="port from which to serve traffic (default: %default)", metavar="PORT")
+    parser.add_option("-f", '--user-data-file', dest='user_data_file', action='store',
+                      help="user data blob to serve back to incoming requests", metavar='FILE')
     (options, args) = parser.parse_args()
     out = dict()
     out['extra'] = args
     out['port'] = options.port
+    out['user_data_file'] = None
+    if options.user_data_file:
+        out['user_data_file'] = options.user_data_file
     return out
 
 

From fb95590638bd670970dbdd638982da05a21aaf18 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Mon, 2 Jul 2012 19:11:46 -0700
Subject: [PATCH 423/434] Add a check on the filename provided ensuring it
 actually exists.

---
 tools/mock-meta.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/tools/mock-meta.py b/tools/mock-meta.py
index 8a73b43c..5f421c98 100755
--- a/tools/mock-meta.py
+++ b/tools/mock-meta.py
@@ -8,6 +8,7 @@ import functools
 import httplib
 import json
 import logging
+import os
 import random
 import string
 import sys
@@ -312,13 +313,15 @@ def extract_opts():
     parser.add_option("-p", "--port", dest="port", action="store", type=int, default=80,
                   help="port from which to serve traffic (default: %default)", metavar="PORT")
     parser.add_option("-f", '--user-data-file', dest='user_data_file', action='store',
-                      help="user data blob to serve back to incoming requests", metavar='FILE')
+                      help="user data filename to serve back to incoming requests", metavar='FILE')
     (options, args) = parser.parse_args()
     out = dict()
     out['extra'] = args
     out['port'] = options.port
     out['user_data_file'] = None
     if options.user_data_file:
+        if not os.path.isfile(options.user_data_file):
+            parser.error("Option -f specified a non-existent file")
         out['user_data_file'] = options.user_data_file
     return out
 

From b40dfc6e9e28157c67db2157a443766fe56b5b12 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 3 Jul 2012 12:46:55 -0700
Subject: [PATCH 424/434] 1. Update the mock ec2 data with some of the pubkey
 code from smoser's ec2 metadata server. 2. Allow the setting of the ip addr
 (not just to 0.0.0.0) 3. Add comment as to how to use this for the 169
 'magic' addr

---
 tools/mock-meta.py | 78 +++++++++++++++++++++++++++++++++++++++++-----
 1 file changed, 70 insertions(+), 8 deletions(-)

diff --git a/tools/mock-meta.py b/tools/mock-meta.py
index 5f421c98..7c38ec48 100755
--- a/tools/mock-meta.py
+++ b/tools/mock-meta.py
@@ -4,6 +4,19 @@
 #
 # http://docs.amazonwebservices.com/AWSEC2/2007-08-29/DeveloperGuide/AESDG-chapter-instancedata.html
 
+"""
+To use this to mimic the EC2 metadata service entirely, run it like:
+  # Where 'eth0' is *some* interface.  
+  sudo ifconfig eth0:0 169.254.169.254 netmask 255.255.255.255
+
+  sudo ./mock-meta -a 169.254.169.254 -p 80
+
+Then:
+  wget -q http://169.254.169.254/latest/meta-data/instance-id -O -; echo
+  curl --silent http://169.254.169.254/latest/meta-data/instance-id ; echo
+  ec2metadata --instance-id
+"""
+
 import functools
 import httplib
 import json
@@ -20,7 +33,6 @@ from BaseHTTPServer import (HTTPServer, BaseHTTPRequestHandler)
 
 log = logging.getLogger('meta-server')
 
-# Constants
 EC2_VERSIONS = [
     '1.0',
     '2007-01-19',
@@ -69,6 +81,14 @@ META_CAPABILITIES = [
     'security-groups'
 ]
 
+PUB_KEYS = {
+    'brickies': [
+        'ssh-rsa AAAAB3NzaC1yc2EAAAABIwAAAQEA3I7VUf2l5gSn5uavROsc5HRDpZdQueUq5ozemNSj8T7enqKHOEaFoU2VoPgGEWC9RyzSQVeyD6s7APMcE82EtmW4skVEgEGSbDc1pvxzxtchBj78hJP6Cf5TCMFSXw+Fz5rF1dR23QDbN1mkHs7adr8GW4kSWqU7Q7NDwfIrJJtO7Hi42GyXtvEONHbiRPOe8stqUly7MvUoN+5kfjBM8Qqpfl2+FNhTYWpMfYdPUnE7u536WqzFmsaqJctz3gBxH9Ex7dFtrxR4qiqEr9Qtlu3xGn7Bw07/+i1D+ey3ONkZLN+LQ714cgj8fRS4Hj29SCmXp5Kt5/82cD/VN3NtHw== brickies',
+        '',
+    ],
+}
+
+
 INSTANCE_TYPES = [
     'm1.small',
     'm1.medium',
@@ -136,6 +156,8 @@ class MetaDataHandler(object):
 
     def get_data(self, params, who, **kwargs):
         if not params:
+            # Show the root level capabilities when
+            # no params are passed...
             caps = sorted(META_CAPABILITIES)
             return "\n".join(caps)
         action = params[0]
@@ -172,6 +194,43 @@ class MetaDataHandler(object):
             return "r-%s" % (id_generator(lower=True))
         elif action == 'product-codes':
             return "%s" % (id_generator(size=8))
+        elif action == 'public-keys':
+            nparams = params[1:]
+            # public-keys is messed up. a list of /latest/meta-data/public-keys/
+	        # shows something like: '0=brickies'
+	        # but a GET to /latest/meta-data/public-keys/0=brickies will fail
+	        # you have to know to get '/latest/meta-data/public-keys/0', then
+	        # from there you get a 'openssh-key', which you can get.
+	        # this hunk of code just re-works the object for that.
+            key_ids = sorted(list(PUB_KEYS.keys()))
+            if nparams:
+                mybe_key = nparams[0]
+                try:
+                    key_id = int(mybe_key)
+                    key_name = key_ids[key_id]
+                except:
+                    raise WebException(httplib.BAD_REQUEST, "Unknown key id %r" % mybe_key)
+                # Extract the possible sub-params
+                key_info = {
+                    "openssh-key": "\n".join(PUB_KEYS[key_name]),
+                }
+                result = dict(key_info)
+                for k in nparams[1:]:
+                    try:
+                        result = result.get(k)
+                    except (AttributeError, TypeError):
+                        result = None
+                        break
+                if isinstance(result, (dict)):
+                    result = json.dumps(result)
+                if result is None:
+                    result = ''
+                return str(result)
+            else:
+                contents = []
+                for (i, key_id) in enumerate(key_ids):
+                    contents.append("%s=%s" % (i, key_id))
+                return "\n".join(contents)
         elif action == 'placement':
             nparams = params[1:]
             if not nparams:
@@ -198,10 +257,8 @@ class UserDataHandler(object):
 
     def _get_user_blob(self, **kwargs):
         blob = None
-        if self.opts['user_data_file']:
-            with open(opts['user_data_file'], 'rb') as fh:
-                blob = fh.read()
-                blob = blob.strip()
+        if self.opts['user_data_file'] is not None:
+            blob = self.opts['user_data_file']
         if not blob:
             blob_mp = {
                 'hostname': kwargs.get('who', 'localhost'),
@@ -312,6 +369,8 @@ def extract_opts():
     parser = OptionParser()
     parser.add_option("-p", "--port", dest="port", action="store", type=int, default=80,
                   help="port from which to serve traffic (default: %default)", metavar="PORT")
+    parser.add_option("-a", "--addr", dest="address", action="store", type=str, default='0.0.0.0',
+                  help="address from which to serve traffic (default: %default)", metavar="ADDRESS")
     parser.add_option("-f", '--user-data-file', dest='user_data_file', action='store',
                       help="user data filename to serve back to incoming requests", metavar='FILE')
     (options, args) = parser.parse_args()
@@ -319,10 +378,12 @@ def extract_opts():
     out['extra'] = args
     out['port'] = options.port
     out['user_data_file'] = None
+    out['address'] = options.address
     if options.user_data_file:
         if not os.path.isfile(options.user_data_file):
             parser.error("Option -f specified a non-existent file")
-        out['user_data_file'] = options.user_data_file
+        with open(options.user_data_file, 'rb') as fh:
+            out['user_data_file'] = fh.read()
     return out
 
 
@@ -340,9 +401,10 @@ def run_server():
     setup_logging(logging.DEBUG)
     setup_fetchers(opts)
     log.info("CLI opts: %s", opts)
-    server = HTTPServer(('0.0.0.0', opts['port']), Ec2Handler)
+    server_address = (opts['address'], opts['port'])
+    server = HTTPServer(server_address, Ec2Handler)
     sa = server.socket.getsockname()
-    log.info("Serving server on %s using port %s ...", sa[0], sa[1])
+    log.info("Serving ec2 metadata on %s using port %s ...", sa[0], sa[1])
     server.serve_forever()
 
 

From d043d304f4f0865a49e166823c33cc31566b1be5 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 3 Jul 2012 16:04:58 -0700
Subject: [PATCH 425/434] Add the ability to have setup.py have a CLI option
 that specifies the daemon type which then later affects the installation of
 certain config files, which then can be extracted during package creation as
 needed.

---
 packages/brpm                   |  1 +
 packages/redhat/cloud-init.spec | 38 +++++------------
 setup.py                        | 72 +++++++++++++++++++++++++++++++--
 3 files changed, 78 insertions(+), 33 deletions(-)

diff --git a/packages/brpm b/packages/brpm
index 3abd9f15..1212b0e4 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -150,6 +150,7 @@ def generate_spec_contents(args, tmpl_fn):
     else:
         subs['systemd'] = False
 
+    subs['daemon_type'] = args.boot
     return templater.render_from_file(tmpl_fn, params=subs)
 
 
diff --git a/packages/redhat/cloud-init.spec b/packages/redhat/cloud-init.spec
index e9ce087a..df13bcb7 100644
--- a/packages/redhat/cloud-init.spec
+++ b/packages/redhat/cloud-init.spec
@@ -1,6 +1,6 @@
 %{!?python_sitelib: %global python_sitelib %(%{__python} -c "from distutils.sysconfig import get_python_lib; print get_python_lib()")}
 
-# See: See: http://www.zarb.org/~jasonc/macros.php
+# See: http://www.zarb.org/~jasonc/macros.php
 # Or: http://fedoraproject.org/wiki/Packaging:ScriptletSnippets
 # Or: http://www.rpm.org/max-rpm/ch-rpm-inside.html
 
@@ -61,7 +61,9 @@ ssh keys and to let the user run various scripts.
 
 %install
 rm -rf $RPM_BUILD_ROOT
-%{__python} setup.py install -O1 --skip-build --root $RPM_BUILD_ROOT
+%{__python} setup.py install -O1 \
+            --skip-build --root $RPM_BUILD_ROOT \
+            --daemon-type={{daemon_type}}
 
 # Note that /etc/rsyslog.d didn't exist by default until F15.
 # el6 request: https://bugzilla.redhat.com/show_bug.cgi?id=740420
@@ -69,24 +71,6 @@ mkdir -p $RPM_BUILD_ROOT/%{_sysconfdir}/rsyslog.d
 cp -p tools/21-cloudinit.conf \
                     $RPM_BUILD_ROOT/%{_sysconfdir}/rsyslog.d/21-cloudinit.conf
 
-{{if init_d}}
-mkdir -p $RPM_BUILD_ROOT/%{_initddir}/
-{{endif}}
-{{if init_d_local}}
-cp -p initd/cloud-init-local $RPM_BUILD_ROOT/%{_initddir}/
-cp -p initd/cloud-config $RPM_BUILD_ROOT/%{_initddir}/
-cp -p initd/cloud-final $RPM_BUILD_ROOT/%{_initddir}/
-{{elif init_d}}
-cp -p initd/cloud-init $RPM_BUILD_ROOT/%{_initddir}/
-cp -p initd/cloud-config $RPM_BUILD_ROOT/%{_initddir}/
-cp -p initd/cloud-final $RPM_BUILD_ROOT/%{_initddir}/
-{{endif}}
-
-{{if systemd}}
-mkdir -p        $RPM_BUILD_ROOT/%{_unitdir}
-cp -p systemd/* $RPM_BUILD_ROOT/%{_unitdir}
-{{endif}}
-
 %clean
 rm -rf $RPM_BUILD_ROOT
 
@@ -103,13 +87,13 @@ fi
 {{endif}}
 
 {{if init_d_local}}
-/sbin/chkconfig --add /etc/rc.d/init.d/cloud-init-local
+/sbin/chkconfig --add %{_initrddir}/cloud-init-local
 {{elif init_d}}
-/sbin/chkconfig --add /etc/rc.d/init.d/cloud-init
+/sbin/chkconfig --add %{_initrddir}/cloud-init
 {{endif}}
 {{if init_d}}
-/sbin/chkconfig --add /etc/rc.d/init.d/cloud-config
-/sbin/chkconfig --add /etc/rc.d/init.d/cloud-final
+/sbin/chkconfig --add %{_initrddir}/cloud-config
+/sbin/chkconfig --add %{_initrddir}/cloud-final
 {{endif}}
 
 %preun
@@ -166,11 +150,7 @@ fi
 {{endif}}
 
 {{if systemd}}
-%{_unitdir}/cloud-config.service
-%{_unitdir}/cloud-config.target
-%{_unitdir}/cloud-init.service
-%{_unitdir}/cloud-init-local.service
-%{_unitdir}/cloud-final.service
+%{_unitdir}/cloud-*
 {{endif}}
 
 # Program binaries
diff --git a/setup.py b/setup.py
index d6253384..50e95e9d 100755
--- a/setup.py
+++ b/setup.py
@@ -26,10 +26,45 @@ import os
 import re
 
 import setuptools
+from setuptools.command.install import install
+
+from distutils.command.install_data import install_data
+from distutils.errors import DistutilsArgError
 
 import subprocess
 
 
+def is_f(p):
+    return os.path.isfile(p)
+
+
+DAEMON_FILES = {
+    'initd': filter((lambda x: is_f(x)
+                     and x.find('local') == -1), glob('initd/*')),
+    'initd-local': filter((lambda x: is_f(x)
+                     and not x.endswith('cloud-init')), glob('initd/*')),
+    'systemd': filter((lambda x: is_f(x)), glob('systemd/*')),
+    'upstart': filter((lambda x: is_f(x)
+                     and x.find('local') == -1
+                     and x.find('nonet') == -1), glob('upstart/*')),
+    'upstart-nonet': filter((lambda x: is_f(x)
+                        and x.find('local') == -1
+                        and not x.endswith('cloud-init.conf')), glob('upstart/*')),
+    'upstart-local': filter((lambda x: is_f(x)
+                        and x.find('nonet') == -1
+                        and not x.endswith('cloud-init.conf')), glob('upstart/*')),
+}
+DAEMON_ROOTS = {
+    'initd': '/etc/rc.d/init.d',
+    'initd-local': '/etc/rc.d/init.d',
+    'systemd': '/etc/systemd/system/',
+    'upstart': '/etc/init/',
+    'upstart-nonet': '/etc/init/',
+    'upstart-local': '/etc/init/',
+}
+DAEMON_TYPES = sorted(list(DAEMON_ROOTS.keys()))
+
+
 def tiny_p(cmd, capture=True):
     # Darn python 2.6 doesn't have check_output (argggg)
     stdout = subprocess.PIPE
@@ -46,10 +81,6 @@ def tiny_p(cmd, capture=True):
     return (out, err)
 
 
-def is_f(p):
-    return os.path.isfile(p)
-
-
 def get_version():
     cmd = ['tools/read-version']
     (ver, _e) = tiny_p(cmd)
@@ -62,6 +93,34 @@ def read_requires():
     return deps.splitlines()
 
 
+# TODO: Is there a better way to do this??
+class DaemonInstallData(install):
+    user_options = install.user_options + [
+        # This will magically show up in member variable 'daemon_type'
+        ('daemon-type=', None,
+            ('daemon type to configure (%s) [default: None]') %
+                (", ".join(DAEMON_TYPES))
+        ),
+    ]
+
+    def initialize_options(self):
+        install.initialize_options(self)
+        self.daemon_type = None
+
+    def finalize_options(self):
+        install.finalize_options(self)
+        if self.daemon_type and self.daemon_type not in DAEMON_TYPES:
+                raise DistutilsArgError(
+                    ("You must specify one of (%s) when"
+                     " specifying a daemon type!") % (", ".join(DAEMON_TYPES))
+                )
+        elif self.daemon_type:
+            self.distribution.data_files.append((DAEMON_ROOTS[self.daemon_type], 
+                                                 DAEMON_FILES[self.daemon_type]))
+            # Force that command to reinitalize (with new file list)
+            self.distribution.reinitialize_command('install_data', True)
+
+
 setuptools.setup(name='cloud-init',
       version=get_version(),
       description='EC2 initialisation magic',
@@ -84,4 +143,9 @@ setuptools.setup(name='cloud-init',
                   ('/usr/share/doc/cloud-init/examples/seed', filter(is_f, glob('doc/examples/seed/*'))),
                   ],
       install_requires=read_requires(),
+      cmdclass = {
+          # Use a subclass for install that handles
+          # adding on the right daemon configuration files
+          'install': DaemonInstallData,
+      },
       )

From bbbb06faa2715c379a1ab8253a46eb15f788fd21 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 3 Jul 2012 19:59:04 -0700
Subject: [PATCH 426/434] 1. Cleanup of some mock functionality 2. Adding in
 returning the 'public-keys' to the metadata 'list' response 3. Adding in
 sending back the running user's keys (useful for testing) along with
 'brickies' 4. Add in a traverse function that can walk down a dictionary (if
 possible)

---
 tools/mock-meta.py | 103 +++++++++++++++++++++++++++++----------------
 1 file changed, 66 insertions(+), 37 deletions(-)

diff --git a/tools/mock-meta.py b/tools/mock-meta.py
index 7c38ec48..5bbe62cc 100755
--- a/tools/mock-meta.py
+++ b/tools/mock-meta.py
@@ -43,16 +43,15 @@ EC2_VERSIONS = [
     '2008-02-01',
     '2008-09-01',
     '2009-04-04',
-    'latest',
 ]
 
 BLOCK_DEVS = [
     'ami',
-    'root',
     'ephemeral0',
+    'root',
 ]
 
-DEV_PREFIX = 'v'
+DEV_PREFIX = 'v'  # This seems to vary alot depending on images...
 DEV_MAPPINGS = {
     'ephemeral0': '%sda2' % (DEV_PREFIX),
     'root': '/dev/%sda1' % (DEV_PREFIX),
@@ -77,22 +76,28 @@ META_CAPABILITIES = [
     'product-codes',
     'public-hostname',
     'public-ipv4',
+    'public-keys/',
     'reservation-id',
     'security-groups'
 ]
 
 PUB_KEYS = {
     'brickies': [
-        'ssh-rsa AAAAB3NzaC1yc2EAAAABIwAAAQEA3I7VUf2l5gSn5uavROsc5HRDpZdQueUq5ozemNSj8T7enqKHOEaFoU2VoPgGEWC9RyzSQVeyD6s7APMcE82EtmW4skVEgEGSbDc1pvxzxtchBj78hJP6Cf5TCMFSXw+Fz5rF1dR23QDbN1mkHs7adr8GW4kSWqU7Q7NDwfIrJJtO7Hi42GyXtvEONHbiRPOe8stqUly7MvUoN+5kfjBM8Qqpfl2+FNhTYWpMfYdPUnE7u536WqzFmsaqJctz3gBxH9Ex7dFtrxR4qiqEr9Qtlu3xGn7Bw07/+i1D+ey3ONkZLN+LQ714cgj8fRS4Hj29SCmXp5Kt5/82cD/VN3NtHw== brickies',
+        ('ssh-rsa '
+         'AAAAB3NzaC1yc2EAAAABIwAAAQEA3I7VUf2l5gSn5uavROsc5HRDpZdQueUq5ozemNSj8T'
+         '7enqKHOEaFoU2VoPgGEWC9RyzSQVeyD6s7APMcE82EtmW4skVEgEGSbDc1pvxzxtchBj78'
+         'hJP6Cf5TCMFSXw+Fz5rF1dR23QDbN1mkHs7adr8GW4kSWqU7Q7NDwfIrJJtO7Hi42GyXtv'
+         'EONHbiRPOe8stqUly7MvUoN+5kfjBM8Qqpfl2+FNhTYWpMfYdPUnE7u536WqzFmsaqJctz'
+         '3gBxH9Ex7dFtrxR4qiqEr9Qtlu3xGn7Bw07/+i1D+ey3ONkZLN+LQ714cgj8fRS4Hj29SC'
+         'mXp5Kt5/82cD/VN3NtHw== brickies'),
         '',
     ],
 }
 
-
 INSTANCE_TYPES = [
-    'm1.small',
-    'm1.medium',
     'm1.large',
+    'm1.medium',
+    'm1.small',
     'm1.xlarge',
 ]
 
@@ -100,10 +105,10 @@ AVAILABILITY_ZONES = [
     "us-east-1a",
     "us-east-1b",
     "us-east-1c",
-    'us-west-1',
     "us-east-1d",
     'eu-west-1a',
     'eu-west-1b',
+    'us-west-1',
 ]
 
 PLACEMENT_CAPABILITIES = {
@@ -139,6 +144,17 @@ def format_text(text):
     return "\n".join(nlines)
 
 
+def traverse(keys, mp):
+    result = dict(mp)
+    for k in keys:
+        try:
+            result = result.get(k)
+        except (AttributeError, TypeError):
+            result = None
+            break
+    return result
+
+
 ID_CHARS = [c for c in (string.ascii_uppercase + string.digits)]
 def id_generator(size=6, lower=False):
     txt = ''.join(random.choice(ID_CHARS) for x in range(size))
@@ -148,6 +164,23 @@ def id_generator(size=6, lower=False):
         return txt
 
 
+def get_ssh_keys():
+    keys = {}
+    keys.update(PUB_KEYS)
+
+    # Nice helper to add in the 'running' users key (if they have one)
+    key_pth = os.path.expanduser('~/.ssh/id_rsa.pub')
+    if not os.path.isfile(key_pth):
+        key_pth = os.path.expanduser('~/.ssh/id_dsa.pub')
+
+    if os.path.isfile(key_pth):
+        with open(key_pth, 'rb') as fh:
+            contents = fh.read()
+        keys[os.getlogin()] = [contents, '']
+
+    return keys
+
+
 class MetaDataHandler(object):
 
     def __init__(self, opts):
@@ -165,7 +198,7 @@ class MetaDataHandler(object):
         if action == 'instance-id':
             return 'i-%s' % (id_generator(lower=True))
         elif action == 'ami-launch-index':
-            return "%s" % random.choice([0,1,2,3])
+            return "%s" % random.choice([0, 1, 2, 3])
         elif action == 'aki-id':
             return 'aki-%s' % (id_generator(lower=True))
         elif action == 'ami-id':
@@ -175,11 +208,15 @@ class MetaDataHandler(object):
         elif action == 'block-device-mapping':
             nparams = params[1:]
             if not nparams:
-                devs = sorted(BLOCK_DEVS)
-                return "\n".join(devs)
+                return "\n".join(BLOCK_DEVS)
             else:
-                return "%s" % (DEV_MAPPINGS.get(nparams[0].strip(), ''))
+                subvalue = traverse(nparams, DEV_MAPPINGS)
+                if not subvalue:
+                    return "\n".join(sorted(list(DEV_MAPPINGS.keys())))
+                else:
+                    return str(subvalue)
         elif action in ['hostname', 'local-hostname', 'public-hostname']:
+            # Just echo back there own hostname that they called in on..
             return "%s" % (who)
         elif action == 'instance-type':
             return random.choice(INSTANCE_TYPES)
@@ -188,21 +225,23 @@ class MetaDataHandler(object):
         elif action == 'security-groups':
             return 'default'
         elif action in ['local-ipv4', 'public-ipv4']:
-            there_ip = kwargs.get('client_ip', '10.0.0.1')
-            return "%s" % (there_ip)
+            # Just echo back there own ip that they called in on...
+            return "%s" % (kwargs.get('client_ip', '10.0.0.1'))
         elif action == 'reservation-id':
             return "r-%s" % (id_generator(lower=True))
         elif action == 'product-codes':
             return "%s" % (id_generator(size=8))
         elif action == 'public-keys':
             nparams = params[1:]
-            # public-keys is messed up. a list of /latest/meta-data/public-keys/
+            # This is a weird kludge, why amazon why!!!
+            # public-keys is messed up, a list of /latest/meta-data/public-keys/
 	        # shows something like: '0=brickies'
 	        # but a GET to /latest/meta-data/public-keys/0=brickies will fail
 	        # you have to know to get '/latest/meta-data/public-keys/0', then
 	        # from there you get a 'openssh-key', which you can get.
 	        # this hunk of code just re-works the object for that.
-            key_ids = sorted(list(PUB_KEYS.keys()))
+            avail_keys = get_ssh_keys()
+            key_ids = sorted(list(avail_keys.keys()))
             if nparams:
                 mybe_key = nparams[0]
                 try:
@@ -211,21 +250,15 @@ class MetaDataHandler(object):
                 except:
                     raise WebException(httplib.BAD_REQUEST, "Unknown key id %r" % mybe_key)
                 # Extract the possible sub-params
-                key_info = {
-                    "openssh-key": "\n".join(PUB_KEYS[key_name]),
-                }
-                result = dict(key_info)
-                for k in nparams[1:]:
-                    try:
-                        result = result.get(k)
-                    except (AttributeError, TypeError):
-                        result = None
-                        break
+                result = traverse(nparams[1:], {
+                    "openssh-key": "\n".join(avail_keys[key_name]),
+                })
                 if isinstance(result, (dict)):
-                    result = json.dumps(result)
-                if result is None:
+                    # TODO: This might not be right??
+                    result = "\n".join(sorted(result.keys()))
+                if not result:
                     result = ''
-                return str(result)
+                return result
             else:
                 contents = []
                 for (i, key_id) in enumerate(key_ids):
@@ -286,12 +319,7 @@ user_fetcher = None
 class Ec2Handler(BaseHTTPRequestHandler):
 
     def _get_versions(self):
-        versions = []
-        for v in EC2_VERSIONS:
-            if v == 'latest':
-                continue
-            else:
-                versions.append(v)
+        versions = ['latest'] + EC2_VERSIONS
         versions = sorted(versions)
         return "\n".join(versions)
 
@@ -308,11 +336,12 @@ class Ec2Handler(BaseHTTPRequestHandler):
             'meta-data': meta_fetcher.get_data,
         }
         segments = [piece for piece in path.split('/') if len(piece)]
+        log.info("Received segments %s", segments)
         if not segments:
             return self._get_versions
         date = segments[0].strip().lower()
-        if date not in EC2_VERSIONS:
-            raise WebException(httplib.BAD_REQUEST, "Unknown date format %r" % date)
+        if date not in self._get_versions():
+            raise WebException(httplib.BAD_REQUEST, "Unknown version format %r" % date)
         if len(segments) < 2:
             raise WebException(httplib.BAD_REQUEST, "No action provided")
         look_name = segments[1].lower()

From d96be3c2af59ef992ba445c62c8e1eb9344566cd Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 3 Jul 2012 20:14:57 -0700
Subject: [PATCH 427/434] When the hostname is also the ip (thus no hostname)
 just use 'localhost'

---
 tools/mock-meta.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/tools/mock-meta.py b/tools/mock-meta.py
index 5bbe62cc..247cff14 100755
--- a/tools/mock-meta.py
+++ b/tools/mock-meta.py
@@ -349,10 +349,14 @@ class Ec2Handler(BaseHTTPRequestHandler):
             raise WebException(httplib.BAD_REQUEST, "Unknown requested data %r" % look_name)
         base_func = func_mapping[look_name]
         who = self.address_string()
+        ip_from = self.client_address[0]
+        if who == ip_from:
+            # Nothing resolved, so just use 'localhost'
+            who = 'localhost'
         kwargs = {
             'params': list(segments[2:]),
-            'who': self.address_string(),
-            'client_ip': self.client_address[0],
+            'who': who,
+            'client_ip': ip_from,
         }
         return functools.partial(base_func, **kwargs)
 

From 6f45663ca6f70ef533f2a3f90fe535e4cadb3b80 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 3 Jul 2012 20:24:01 -0700
Subject: [PATCH 428/434] Add a check on 'chownbyname' that catches the
 KeyError and logs it (instead of failing)

---
 cloudinit/util.py | 17 ++++++++++++-----
 1 file changed, 12 insertions(+), 5 deletions(-)

diff --git a/cloudinit/util.py b/cloudinit/util.py
index 4c29432b..d7dd20b5 100644
--- a/cloudinit/util.py
+++ b/cloudinit/util.py
@@ -917,7 +917,8 @@ def pipe_in_out(in_fh, out_fh, chunk_size=1024, chunk_cb=None):
 
 
 def chownbyid(fname, uid=None, gid=None):
-    if uid is None and gid is None:
+    if uid in [None, -1] and gid in [None, -1]:
+        # Nothing to do
         return
     LOG.debug("Changing the ownership of %s to %s:%s", fname, uid, gid)
     os.chown(fname, uid, gid)
@@ -926,11 +927,17 @@ def chownbyid(fname, uid=None, gid=None):
 def chownbyname(fname, user=None, group=None):
     uid = -1
     gid = -1
-    if user:
-        uid = pwd.getpwnam(user).pw_uid
-    if group:
-        gid = grp.getgrnam(group).gr_gid
+    try:
+        if user:
+            uid = pwd.getpwnam(user).pw_uid
+        if group:
+            gid = grp.getgrnam(group).gr_gid
+    except KeyError:
+        logexc(LOG, ("Failed changing the ownership of %s using username %s and"
+                     " groupname %s (do they exist?)"), fname, user, group)
+        return False
     chownbyid(fname, uid, gid)
+    return True
 
 
 # Always returns well formated values

From c1c2ffb1cc088f9194330f04a72bbaf721ad2b40 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Tue, 3 Jul 2012 20:29:36 -0700
Subject: [PATCH 429/434] Remove the useless function printout.

---
 tools/mock-meta.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/tools/mock-meta.py b/tools/mock-meta.py
index 247cff14..4548e4ae 100755
--- a/tools/mock-meta.py
+++ b/tools/mock-meta.py
@@ -365,7 +365,6 @@ class Ec2Handler(BaseHTTPRequestHandler):
         log.info("Got a call from %s for path %s", who, self.path)
         try:
             func = self._find_method(self.path)
-            log.info("Calling into func %s to get your data.", func)
             data = func()
             if not data:
                 data = ''

From b1d357c708af4d96e6684de5c6ea44b36441a3de Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Wed, 4 Jul 2012 13:52:34 -0700
Subject: [PATCH 430/434] 1. Make the debian rules file a template (and pass in
 the daemon-type) 2. Adjust the bddeb to pass this in (as well as other output
 statements being added) 3. Adjust make-tarball to only archive the bzr
 versioned files (using --recursive)

---
 packages/bddeb        | 37 +++++++++++++++-----
 packages/debian/rules |  3 ++
 packages/make-tarball | 80 +++++++++++++++++++++++++++----------------
 3 files changed, 82 insertions(+), 38 deletions(-)

diff --git a/packages/bddeb b/packages/bddeb
index eeb64434..b5a70dd8 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -29,7 +29,7 @@ PKG_MP = {
 }
 
 
-def write_debian_folder(root, version, revno):
+def write_debian_folder(root, version, revno, daemon_type):
     deb_dir = util.abs_join(root, 'debian')
     os.makedirs(deb_dir)
     
@@ -65,8 +65,12 @@ def write_debian_folder(root, version, revno):
                              util.abs_join(deb_dir, 'control'),
                              params={'requires': requires})
     
+    templater.render_to_file(util.abs_join('debian', 'rules'),
+                             util.abs_join(deb_dir, 'rules'),
+                             params={'daemon_type': daemon_type})
+    
     # Just copy the following directly
-    for base_fn in ['dirs', 'copyright', 'compat', 'pycompat', 'rules']:
+    for base_fn in ['dirs', 'copyright', 'compat', 'pycompat']:
         shutil.copy(util.abs_join('debian', base_fn),
                     util.abs_join(deb_dir, base_fn))
 
@@ -84,6 +88,10 @@ def main():
                               " (default: %(default)s)"),
                         default=False,
                         action='store_true')
+    parser.add_argument("-b", "--boot", dest="boot",
+                        help="select boot type (default: %(default)s)", 
+                        metavar="TYPE", default='upstart',
+                        choices=('upstart', 'upstart-local'))
     args = parser.parse_args()
 
     capture = True
@@ -101,25 +109,33 @@ def main():
         (sysout, _stderr) = util.subp(cmd)
         revno = sysout.strip()
         
+        # This is really only a temporary archive
+        # since we will extract it then add in the debian
+        # folder, then re-archive it for debian happiness
+        print("Creating a temporary tarball using the 'make-tarball' helper")
         cmd = [sys.executable,
                 util.abs_join(os.getcwd(), 'make-tarball')]
         (sysout, _stderr) = util.subp(cmd)
         arch_fn = sysout.strip()
-
         tmp_arch_fn = util.abs_join(tdir, os.path.basename(arch_fn))
         shutil.move(arch_fn, tmp_arch_fn)
 
+        print("Extracting temporary tarball %r" % (tmp_arch_fn))
         cmd = ['tar', '-xvzf', tmp_arch_fn, '-C', tdir]
-        util.subp(cmd)
-        
+        util.subp(cmd, capture=capture)
         base_name = os.path.basename(arch_fn)[:-len(".tar.gz")]
         shutil.move(util.abs_join(tdir, base_name), 
                     util.abs_join(tdir, 'cloud-init'))
 
+        print("Creating a debian/ folder in %r" % 
+             (util.abs_join(tdir, 'cloud-init')))
         write_debian_folder(util.abs_join(tdir, 'cloud-init'),
-                            version, revno)
+                            version, revno, args.boot)
 
+        # The naming here seems to follow some debian standard
+        # so it will whine if it is changed...
         tar_fn = "cloud-init_%s~%s.orig.tar.gz" % (version, revno)
+        print("Archiving that new folder into %r" % (tar_fn))
         cmd = ['tar', '-czvf', 
                util.abs_join(tdir, tar_fn), 
                '-C', util.abs_join(tdir, 'cloud-init')]
@@ -127,7 +143,8 @@ def main():
         util.subp(cmd, capture=capture)
         shutil.copy(util.abs_join(tdir, tar_fn), tar_fn)
         print("Wrote out archive %r" % (util.abs_join(tar_fn)))
-        
+
+        print("Running 'debuild' in %r" % (util.abs_join(tdir, 'cloud-init')))
         with util.chdir(util.abs_join(tdir, 'cloud-init')):
             cmd = ['debuild']
             if not args.sign:
@@ -137,14 +154,16 @@ def main():
         globs = [] 
         globs.extend(glob.glob("%s/*.deb" %
                      (os.path.join(tdir))))
+        link_fn = os.path.join(os.getcwd(), 'cloud-init_all.deb')
         for fn in globs:
             base_fn = os.path.basename(fn)
             shutil.move(fn, base_fn)
             print("Wrote out debian package %r" % (base_fn))
             if fn.endswith('_all.deb'):
                 # Add in the local link
-                util.del_file('cloud-init_all.deb')
-                os.symlink(base_fn, 'cloud-init_all.deb')
+                util.del_file(link_fn)
+                os.symlink(base_fn, link_fn)
+                print("Linked %r to %r" % (base_fn, link_fn))
 
     return 0
 
diff --git a/packages/debian/rules b/packages/debian/rules
index 1739f4cf..6814974f 100755
--- a/packages/debian/rules
+++ b/packages/debian/rules
@@ -7,8 +7,11 @@ binary-install/cloud-init::cloud-init-fixups
 include /usr/share/cdbs/1/rules/debhelper.mk
 include /usr/share/cdbs/1/class/python-distutils.mk
 
+DEB_PYTHON_INSTALL_ARGS_ALL += --daemon-type={{daemon_type}}
+
 DEB_DH_INSTALL_SOURCEDIR := debian/tmp
 
 cloud-init-fixups:
 	install -d $(DEB_DESTDIR)/etc/rsyslog.d
 	cp tools/21-cloudinit.conf $(DEB_DESTDIR)/etc/rsyslog.d/21-cloudinit.conf
+	
diff --git a/packages/make-tarball b/packages/make-tarball
index 479e11af..43a6fc33 100755
--- a/packages/make-tarball
+++ b/packages/make-tarball
@@ -7,6 +7,8 @@ import subprocess
 import sys
 import tempfile
 
+import optparse
+
 
 # Use the util functions from cloudinit
 possible_topdir = os.path.normpath(os.path.join(os.path.abspath(
@@ -17,51 +19,71 @@ if os.path.exists(os.path.join(possible_topdir, "cloudinit", "__init__.py")):
 from cloudinit import util
 
 
-def main(args):
+def find_versioned_files():
+    (stdout, _stderr) = util.subp(['bzr', 'ls', '--versioned', '--recursive'])
+    fns = [fn for fn in stdout.splitlines() 
+                  if fn and not fn.startswith('.')]
+    fns.sort()
+    return fns
 
-    base_fn = None
-    if args:
-        base_fn = args[0]
+
+def copy(fn, where_to, verbose):
+    if verbose:
+        print("Copying %r --> %r" % (fn, where_to))
+    if os.path.isfile(fn):
+        shutil.copy(fn, where_to)
+    elif os.path.isdir(fn) and not os.path.isdir(where_to):
+        os.makedirs(where_to)
+    else:
+        raise RuntimeError("Do not know how to copy %s" % (fn))
+
+
+def main():
+
+    parser = optparse.OptionParser()
+    parser.add_option("-f", "--file", dest="filename",
+                      help="write archive to FILE", metavar="FILE")
+    parser.add_option("-v", "--verbose",
+                  action="store_true", dest="verbose", default=False,
+                  help="show verbose messaging")
+
+    (options, args) = parser.parse_args()
+
+    base_fn = options.filename
+    if not base_fn:
+        (stdout, _stderr) = util.subp(['bzr', 'revno'])
+        revno = stdout.strip()
+        cmd = [sys.executable,
+               util.abs_join(os.pardir, 'tools', 'read-version')]
+        (stdout, _stderr) = util.subp(cmd)
+        version = stdout.strip()
+        base_fn = 'cloud-init-%s-%s' % (version, revno)
 
     with util.tempdir() as tdir:
-
-        if not base_fn:
-            (stdout, _stderr) = util.subp(['bzr', 'revno'])
-            revno = stdout.strip()
-    
-            cmd = [sys.executable,
-                   util.abs_join(os.pardir, 'tools', 'read-version')]
-            (stdout, _stderr) = util.subp(cmd)
-            version = stdout.strip()
-            base_fn = 'cloud-init-%s-%s' % (version, revno)
-
         util.ensure_dir(util.abs_join(tdir, base_fn))
         arch_fn = '%s.tar.gz' % (base_fn)
 
         with util.chdir(os.pardir):
-            (stdout, _stderr) = util.subp(['bzr', 'ls', '--versioned'])
-            fns = [fn for fn in stdout.splitlines() 
-                          if fn and not fn.startswith('.')]
-            # TODO - only copy the right files
-            # ie do a recursive versioned...
+            fns =  find_versioned_files()
             for fn in fns:
-                if os.path.isfile(fn):
-                    shutil.copy(fn, util.abs_join(tdir, base_fn, fn))
-                else:
-                    shutil.copytree(fn, util.abs_join(tdir, base_fn, fn))
+                copy(fn, util.abs_join(tdir, base_fn, fn),
+                     verbose=options.verbose)
 
-        cmd = ['tar', '-czf',
-                util.abs_join(tdir, arch_fn), 
-                '-C', tdir, base_fn]
-        util.subp(cmd)
+        arch_full_fn = util.abs_join(tdir, arch_fn)
+        cmd = ['tar', '-czvf', arch_full_fn, '-C', tdir, base_fn]
+        if options.verbose:
+            print("Creating an archive from directory %r to %r" %
+                  (util.abs_join(tdir, base_fn), arch_full_fn))
 
+        util.subp(cmd, capture=(not options.verbose))
         shutil.move(util.abs_join(tdir, arch_fn),
                     util.abs_join(os.getcwd(), arch_fn))
+
         print(os.path.abspath(arch_fn))
         
     return 0
 
 
 if __name__ == '__main__':
-    sys.exit(main(sys.argv[1:]))
+    sys.exit(main())
 

From 0d23f61e5473ff6309bef304ea8f24bb86941595 Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 6 Jul 2012 10:47:19 -0700
Subject: [PATCH 431/434] Updated so that if no mirror is found, the
 module stops running.

---
 cloudinit/config/cc_apt_update_upgrade.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/cloudinit/config/cc_apt_update_upgrade.py b/cloudinit/config/cc_apt_update_upgrade.py
index 42b6f3e9..5c5e510c 100644
--- a/cloudinit/config/cc_apt_update_upgrade.py
+++ b/cloudinit/config/cc_apt_update_upgrade.py
@@ -45,13 +45,16 @@ EXPORT_GPG_KEYID = """
 """
 
 
-def handle(_name, cfg, cloud, log, _args):
+def handle(name, cfg, cloud, log, _args):
     update = util.get_cfg_option_bool(cfg, 'apt_update', False)
     upgrade = util.get_cfg_option_bool(cfg, 'apt_upgrade', False)
 
     release = get_release()
-
     mirror = find_apt_mirror(cloud, cfg)
+    if not mirror:
+        log.debug(("Skipping module named %s,"
+                   " no package 'mirror' located"), name)
+        return
 
     log.debug("Selected mirror at: %s" % mirror)
 

From df76bcdaf0c0cf8a02b0ffb45009e43fdf3df5bd Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 6 Jul 2012 10:53:35 -0700
Subject: [PATCH 432/434] Add comment about keeping track of what people think
 about the 'read' and 'write' root, and if it confuses them, remove it later
 and just recommend a more 'natural' way of doing it (ie 'chroot').

---
 TODO | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/TODO b/TODO
index 30a52cae..1725db00 100644
--- a/TODO
+++ b/TODO
@@ -29,4 +29,9 @@
   for these modules (or have a combination of the above), this avoids having
   to understand where your modules are coming from (which can be altered by
   the current python inclusion path)
-
+- Depending on if people think the wrapper around 'os.path.join' provided
+  by the 'paths' object is useful (allowing us to modify based off a 'read'
+  and 'write' configuration based 'root') or is just too confusing, it might be
+  something to remove later, and just recommend using 'chroot' instead (or the X
+  different other options which are similar to 'chroot'), which might be more
+  natural and less confusing...

From 833740407eff9b21a206f0a6bffe31c355a84b22 Mon Sep 17 00:00:00 2001
From: Scott Moser <smoser@ubuntu.com>
Date: Fri, 6 Jul 2012 17:03:11 -0400
Subject: [PATCH 433/434] setup.py: rename "daemon type" to "init system"

This brings with it other changes, and also makes an install
install all of the requisite init files. (ie, cloud-init needs the -local and
the non-local)
---
 packages/bddeb                       |  4 +--
 packages/brpm                        |  2 +-
 packages/debian/rules                |  2 +-
 packages/redhat/cloud-init.spec      |  2 +-
 setup.py                             | 52 ++++++++++------------------
 {initd => sysvinit}/cloud-config     |  0
 {initd => sysvinit}/cloud-final      |  0
 {initd => sysvinit}/cloud-init       |  0
 {initd => sysvinit}/cloud-init-local |  0
 9 files changed, 24 insertions(+), 38 deletions(-)
 rename {initd => sysvinit}/cloud-config (100%)
 rename {initd => sysvinit}/cloud-final (100%)
 rename {initd => sysvinit}/cloud-init (100%)
 rename {initd => sysvinit}/cloud-init-local (100%)

diff --git a/packages/bddeb b/packages/bddeb
index b5a70dd8..10ad08b3 100755
--- a/packages/bddeb
+++ b/packages/bddeb
@@ -29,7 +29,7 @@ PKG_MP = {
 }
 
 
-def write_debian_folder(root, version, revno, daemon_type):
+def write_debian_folder(root, version, revno, init_sys):
     deb_dir = util.abs_join(root, 'debian')
     os.makedirs(deb_dir)
     
@@ -67,7 +67,7 @@ def write_debian_folder(root, version, revno, daemon_type):
     
     templater.render_to_file(util.abs_join('debian', 'rules'),
                              util.abs_join(deb_dir, 'rules'),
-                             params={'daemon_type': daemon_type})
+                             params={'init_sys': init_sys})
     
     # Just copy the following directly
     for base_fn in ['dirs', 'copyright', 'compat', 'pycompat']:
diff --git a/packages/brpm b/packages/brpm
index 1212b0e4..1d05bd2a 100755
--- a/packages/brpm
+++ b/packages/brpm
@@ -150,7 +150,7 @@ def generate_spec_contents(args, tmpl_fn):
     else:
         subs['systemd'] = False
 
-    subs['daemon_type'] = args.boot
+    subs['init_sys'] = args.boot
     return templater.render_from_file(tmpl_fn, params=subs)
 
 
diff --git a/packages/debian/rules b/packages/debian/rules
index 6814974f..87cd6538 100755
--- a/packages/debian/rules
+++ b/packages/debian/rules
@@ -7,7 +7,7 @@ binary-install/cloud-init::cloud-init-fixups
 include /usr/share/cdbs/1/rules/debhelper.mk
 include /usr/share/cdbs/1/class/python-distutils.mk
 
-DEB_PYTHON_INSTALL_ARGS_ALL += --daemon-type={{daemon_type}}
+DEB_PYTHON_INSTALL_ARGS_ALL += --init-system={{init_sys}}
 
 DEB_DH_INSTALL_SOURCEDIR := debian/tmp
 
diff --git a/packages/redhat/cloud-init.spec b/packages/redhat/cloud-init.spec
index df13bcb7..d0f83a4b 100644
--- a/packages/redhat/cloud-init.spec
+++ b/packages/redhat/cloud-init.spec
@@ -63,7 +63,7 @@ ssh keys and to let the user run various scripts.
 rm -rf $RPM_BUILD_ROOT
 %{__python} setup.py install -O1 \
             --skip-build --root $RPM_BUILD_ROOT \
-            --daemon-type={{daemon_type}}
+            --init-system={{init_sys}}
 
 # Note that /etc/rsyslog.d didn't exist by default until F15.
 # el6 request: https://bugzilla.redhat.com/show_bug.cgi?id=740420
diff --git a/setup.py b/setup.py
index 50e95e9d..458d1a9e 100755
--- a/setup.py
+++ b/setup.py
@@ -38,31 +38,17 @@ def is_f(p):
     return os.path.isfile(p)
 
 
-DAEMON_FILES = {
-    'initd': filter((lambda x: is_f(x)
-                     and x.find('local') == -1), glob('initd/*')),
-    'initd-local': filter((lambda x: is_f(x)
-                     and not x.endswith('cloud-init')), glob('initd/*')),
+INITSYS_FILES = {
+    'sysvinit': filter((lambda x: is_f(x)), glob('sysvinit/*')),
     'systemd': filter((lambda x: is_f(x)), glob('systemd/*')),
-    'upstart': filter((lambda x: is_f(x)
-                     and x.find('local') == -1
-                     and x.find('nonet') == -1), glob('upstart/*')),
-    'upstart-nonet': filter((lambda x: is_f(x)
-                        and x.find('local') == -1
-                        and not x.endswith('cloud-init.conf')), glob('upstart/*')),
-    'upstart-local': filter((lambda x: is_f(x)
-                        and x.find('nonet') == -1
-                        and not x.endswith('cloud-init.conf')), glob('upstart/*')),
+    'upstart': filter((lambda x: is_f(x)), glob('upstart/*')),
 }
-DAEMON_ROOTS = {
-    'initd': '/etc/rc.d/init.d',
-    'initd-local': '/etc/rc.d/init.d',
+INITSYS_ROOTS = {
+    'sysvinit': '/etc/rc.d/init.d',
     'systemd': '/etc/systemd/system/',
     'upstart': '/etc/init/',
-    'upstart-nonet': '/etc/init/',
-    'upstart-local': '/etc/init/',
 }
-DAEMON_TYPES = sorted(list(DAEMON_ROOTS.keys()))
+INITSYS_TYPES = sorted(list(INITSYS_ROOTS.keys()))
 
 
 def tiny_p(cmd, capture=True):
@@ -94,29 +80,29 @@ def read_requires():
 
 
 # TODO: Is there a better way to do this??
-class DaemonInstallData(install):
+class InitsysInstallData(install):
     user_options = install.user_options + [
-        # This will magically show up in member variable 'daemon_type'
-        ('daemon-type=', None,
-            ('daemon type to configure (%s) [default: None]') %
-                (", ".join(DAEMON_TYPES))
+        # This will magically show up in member variable 'init_sys'
+        ('init-system=', None,
+            ('init system to configure (%s) [default: None]') %
+                (", ".join(INITSYS_TYPES))
         ),
     ]
 
     def initialize_options(self):
         install.initialize_options(self)
-        self.daemon_type = None
+        self.initsys = None
 
     def finalize_options(self):
         install.finalize_options(self)
-        if self.daemon_type and self.daemon_type not in DAEMON_TYPES:
+        if self.initsys and self.initsys not in INITSYS_TYPES:
                 raise DistutilsArgError(
                     ("You must specify one of (%s) when"
-                     " specifying a daemon type!") % (", ".join(DAEMON_TYPES))
+                     " specifying a init system!") % (", ".join(INITSYS_TYPES))
                 )
-        elif self.daemon_type:
-            self.distribution.data_files.append((DAEMON_ROOTS[self.daemon_type], 
-                                                 DAEMON_FILES[self.daemon_type]))
+        elif self.initsys:
+            self.distribution.data_files.append((INITSYS_ROOTS[self.initsys], 
+                                                 INITSYS_FILES[self.initsys]))
             # Force that command to reinitalize (with new file list)
             self.distribution.reinitialize_command('install_data', True)
 
@@ -145,7 +131,7 @@ setuptools.setup(name='cloud-init',
       install_requires=read_requires(),
       cmdclass = {
           # Use a subclass for install that handles
-          # adding on the right daemon configuration files
-          'install': DaemonInstallData,
+          # adding on the right init system configuration files
+          'install': InitsysInstallData,
       },
       )
diff --git a/initd/cloud-config b/sysvinit/cloud-config
similarity index 100%
rename from initd/cloud-config
rename to sysvinit/cloud-config
diff --git a/initd/cloud-final b/sysvinit/cloud-final
similarity index 100%
rename from initd/cloud-final
rename to sysvinit/cloud-final
diff --git a/initd/cloud-init b/sysvinit/cloud-init
similarity index 100%
rename from initd/cloud-init
rename to sysvinit/cloud-init
diff --git a/initd/cloud-init-local b/sysvinit/cloud-init-local
similarity index 100%
rename from initd/cloud-init-local
rename to sysvinit/cloud-init-local

From 26b36823a5cb5af16c63106392b3d9819c50edab Mon Sep 17 00:00:00 2001
From: Joshua Harlow <harlowja@yahoo-inc.com>
Date: Fri, 6 Jul 2012 14:13:19 -0700
Subject: [PATCH 434/434] Fix the initsys variable, setuptools/distutils will
 automatically assign to a variable of the name 'init_system' instead due to
 the param name being 'init-system'.

---
 setup.py | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/setup.py b/setup.py
index 458d1a9e..06b897a5 100755
--- a/setup.py
+++ b/setup.py
@@ -91,18 +91,18 @@ class InitsysInstallData(install):
 
     def initialize_options(self):
         install.initialize_options(self)
-        self.initsys = None
+        self.init_system = None
 
     def finalize_options(self):
         install.finalize_options(self)
-        if self.initsys and self.initsys not in INITSYS_TYPES:
+        if self.init_system and self.init_system not in INITSYS_TYPES:
                 raise DistutilsArgError(
                     ("You must specify one of (%s) when"
                      " specifying a init system!") % (", ".join(INITSYS_TYPES))
                 )
-        elif self.initsys:
-            self.distribution.data_files.append((INITSYS_ROOTS[self.initsys], 
-                                                 INITSYS_FILES[self.initsys]))
+        elif self.init_system:
+            self.distribution.data_files.append((INITSYS_ROOTS[self.init_system], 
+                                                 INITSYS_FILES[self.init_system]))
             # Force that command to reinitalize (with new file list)
             self.distribution.reinitialize_command('install_data', True)