
diagnostics: complete refactor

Master/node/client subcommands went away in favor of client/cluster/host diagnostic builders.
Diagnostic logging was completely refactored.
Diagnostics now return a result object instead of logging
directly, so that they can be run in parallel (though they don't yet).
Updated the help accordingly.

Luke Meyer authored on 2015/07/20 18:25:08
Showing 35 changed files
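
For orientation, a minimal sketch of the result-object pattern this commit introduces, reconstructed from how the code in the diffs below calls it (Name/Description/CanRun/Check on diagnostics; Logs/Warnings/Errors on results). The real definitions live in pkg/diagnostics/types and pkg/diagnostics/log, so the exact shapes here are assumptions, not the commit's actual source:

    // Sketch only: inferred from call sites in this diff, not copied from
    // pkg/diagnostics/types.
    package types

    // LogEntry stands in for whatever pkg/diagnostics/log passes to
    // Logger.LogEntry; its concrete type is not shown in this diff.
    type LogEntry interface{}

    // DiagnosticError matches the []types.DiagnosticError values that
    // detectClientConfig returns; its real definition is also not shown.
    type DiagnosticError error

    // Diagnostic is what the client/cluster/host builders produce and what
    // DiagnosticsOptions.Run iterates over.
    type Diagnostic interface {
        Name() string
        Description() string
        CanRun() (canRun bool, reason error)
        Check() DiagnosticResult
    }

    // DiagnosticResult carries a diagnostic's findings back to the caller
    // instead of writing to a shared logger, which is what would let
    // diagnostics run in parallel later.
    type DiagnosticResult interface {
        Logs() []LogEntry
        Warnings() []DiagnosticError
        Errors() []DiagnosticError
    }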
... ...
@@ -2,135 +2,44 @@ package diagnostics
 
 import (
 	"fmt"
-	"io"
-	"os"
 
-	"github.com/spf13/cobra"
-
-	kclient "github.com/GoogleCloudPlatform/kubernetes/pkg/client"
-	kclientcmdapi "github.com/GoogleCloudPlatform/kubernetes/pkg/client/clientcmd/api"
-	kcmdutil "github.com/GoogleCloudPlatform/kubernetes/pkg/kubectl/cmd/util"
+	clientcmdapi "github.com/GoogleCloudPlatform/kubernetes/pkg/client/clientcmd/api"
 	"github.com/GoogleCloudPlatform/kubernetes/pkg/util"
 
-	diagnosticflags "github.com/openshift/origin/pkg/cmd/experimental/diagnostics/options"
-	osclientcmd "github.com/openshift/origin/pkg/cmd/util/clientcmd"
 	clientdiagnostics "github.com/openshift/origin/pkg/diagnostics/client"
-	"github.com/openshift/origin/pkg/diagnostics/log"
-	diagnostictypes "github.com/openshift/origin/pkg/diagnostics/types/diagnostic"
+	"github.com/openshift/origin/pkg/diagnostics/types"
 )
 
-const ClientDiagnosticsRecommendedName = "client"
+const (
+	ConfigContexts = "ConfigContexts"
+)
 
 var (
-	AvailableClientDiagnostics = util.NewStringSet("ConfigContexts", "NodeDefinitions")
+	AvailableClientDiagnostics = util.NewStringSet(ConfigContexts) // add more diagnostics as they are defined
 )
 
-// user options for openshift-diagnostics client command
-type ClientDiagnosticsOptions struct {
-	RequestedDiagnostics util.StringList
-
-	KubeClient *kclient.Client
-	KubeConfig *kclientcmdapi.Config
-
-	LogOptions *log.LoggerOptions
-	Logger     *log.Logger
-}
+func (o DiagnosticsOptions) buildClientDiagnostics(rawConfig *clientcmdapi.Config) ([]types.Diagnostic, bool /* ok */, error) {
 
-const longClientDescription = `
-OpenShift Diagnostics
-
-This command helps you understand and troubleshoot OpenShift as a user. It is
-intended to be run from the same context as an OpenShift client
-("openshift cli" or "osc") and with the same configuration options.
-
-    $ %s
-`
-
-func NewClientCommand(name string, fullName string, out io.Writer) *cobra.Command {
-	o := &ClientDiagnosticsOptions{
-		RequestedDiagnostics: AvailableClientDiagnostics.List(),
-		LogOptions:           &log.LoggerOptions{Out: out},
+	osClient, kubeClient, clientErr := o.Factory.Clients()
+	_ = osClient   // remove once a diagnostic makes use of OpenShift client
+	_ = kubeClient // remove once a diagnostic makes use of kube client
+	if clientErr != nil {
+		o.Logger.Notice("clLoadDefaultFailed", "Failed creating client from config; client diagnostics will be limited to config testing")
+		AvailableClientDiagnostics = util.NewStringSet(ConfigContexts)
 	}
 
-	var factory *osclientcmd.Factory
-
-	cmd := &cobra.Command{
-		Use:   name,
-		Short: "Troubleshoot using the OpenShift v3 client.",
-		Long:  fmt.Sprintf(longClientDescription, fullName),
-		Run: func(c *cobra.Command, args []string) {
-			kcmdutil.CheckErr(o.Complete())
-
-			_, kubeClient, err := factory.Clients()
-			kcmdutil.CheckErr(err)
-
-			kubeConfig, err := factory.OpenShiftClientConfig.RawConfig()
-			kcmdutil.CheckErr(err)
-
-			o.KubeClient = kubeClient
-			o.KubeConfig = &kubeConfig
-
-			failed, err := o.RunDiagnostics()
-			o.Logger.Summary()
-			o.Logger.Finish()
-
-			kcmdutil.CheckErr(err)
-			if failed {
-				os.Exit(255)
-			}
-
-		},
-	}
-	cmd.SetOutput(out)                     // for output re: usage / help
-	factory = osclientcmd.New(cmd.Flags()) // side effect: add standard persistent flags for openshift client
-	diagnosticflags.BindLoggerOptionFlags(cmd.Flags(), o.LogOptions, diagnosticflags.RecommendedLoggerOptionFlags())
-	diagnosticflags.BindDiagnosticFlag(cmd.Flags(), &o.RequestedDiagnostics, diagnosticflags.NewRecommendedDiagnosticFlag())
-
-	return cmd
-}
-
-func (o *ClientDiagnosticsOptions) Complete() error {
-	var err error
-	o.Logger, err = o.LogOptions.NewLogger()
-	if err != nil {
-		return err
-	}
-
-	return nil
-}
-
-func (o ClientDiagnosticsOptions) RunDiagnostics() (bool, error) {
-	diagnostics := map[string]diagnostictypes.Diagnostic{}
-
-	for _, diagnosticName := range o.RequestedDiagnostics {
+	diagnostics := []types.Diagnostic{}
+	requestedDiagnostics := intersection(util.NewStringSet(o.RequestedDiagnostics...), AvailableClientDiagnostics).List()
+	for _, diagnosticName := range requestedDiagnostics {
 		switch diagnosticName {
-		case "ConfigContexts":
-			for contextName, _ := range o.KubeConfig.Contexts {
-				diagnostics[diagnosticName+"["+contextName+"]"] = clientdiagnostics.ConfigContext{o.KubeConfig, contextName, o.Logger}
+		case ConfigContexts:
+			for contextName := range rawConfig.Contexts {
+				diagnostics = append(diagnostics, clientdiagnostics.ConfigContext{rawConfig, contextName})
 			}
 
-		case "NodeDefinitions":
-			diagnostics[diagnosticName] = clientdiagnostics.NodeDefinition{o.KubeClient, o.Logger}
-
 		default:
-			return false, fmt.Errorf("unknown diagnostic: %v", diagnosticName)
-		}
-	}
-
-	for name, diagnostic := range diagnostics {
-
-		if canRun, reason := diagnostic.CanRun(); !canRun {
-			if reason == nil {
-				o.Logger.Noticem(log.Message{ID: "diagSkip", Template: "Skipping diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}", TemplateData: map[string]string{"area": "client", "name": name, "diag": diagnostic.Description()}})
-			} else {
-				o.Logger.Noticem(log.Message{ID: "diagSkip", Template: "Skipping diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}\nBecause: {{.reason}}", TemplateData: map[string]string{"area": "client", "name": name, "diag": diagnostic.Description(), "reason": reason.Error()}})
-			}
-			continue
+			return nil, false, fmt.Errorf("unknown diagnostic: %v", diagnosticName)
 		}
-
-		o.Logger.Noticem(log.Message{ID: "diagRun", Template: "Running diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}", TemplateData: map[string]string{"area": "client", "name": name, "diag": diagnostic.Description()}})
-		diagnostic.Check()
 	}
-
-	return o.Logger.ErrorsSeen(), nil
+	return diagnostics, true, clientErr
 }
new file mode 100644
... ...
@@ -0,0 +1,111 @@
+package diagnostics
+
+import (
+	"fmt"
+	"strings"
+
+	kclient "github.com/GoogleCloudPlatform/kubernetes/pkg/client"
+	clientcmd "github.com/GoogleCloudPlatform/kubernetes/pkg/client/clientcmd"
+	clientcmdapi "github.com/GoogleCloudPlatform/kubernetes/pkg/client/clientcmd/api"
+	"github.com/GoogleCloudPlatform/kubernetes/pkg/util"
+
+	authorizationapi "github.com/openshift/origin/pkg/authorization/api"
+	"github.com/openshift/origin/pkg/client"
+	osclientcmd "github.com/openshift/origin/pkg/cmd/util/clientcmd"
+
+	clustdiags "github.com/openshift/origin/pkg/diagnostics/cluster"
+	"github.com/openshift/origin/pkg/diagnostics/types"
+)
+
+var (
+	AvailableClusterDiagnostics = util.NewStringSet("NodeDefinitions")
+)
+
+func (o DiagnosticsOptions) buildClusterDiagnostics(rawConfig *clientcmdapi.Config) ([]types.Diagnostic, bool /* ok */, error) {
+	requestedDiagnostics := intersection(util.NewStringSet(o.RequestedDiagnostics...), AvailableClusterDiagnostics).List()
+	if len(requestedDiagnostics) == 0 { // no diagnostics to run here
+		return nil, true, nil // don't waste time on discovery
+	}
+
+	var clusterClient *client.Client
+	var kclusterClient *kclient.Client
+
+	clusterClient, kclusterClient, found, err := o.findClusterClients(rawConfig)
+	if !found {
+		o.Logger.Notice("noClustCtx", "No cluster-admin client config found; skipping cluster diagnostics.")
+		return nil, false, err
+	}
+
+	diagnostics := []types.Diagnostic{}
+	for _, diagnosticName := range requestedDiagnostics {
+		switch diagnosticName {
+		case "NodeDefinitions":
+			diagnostics = append(diagnostics, clustdiags.NodeDefinitions{kclusterClient})
+
+		default:
+			return nil, false, fmt.Errorf("unknown diagnostic: %v", diagnosticName)
+		}
+	}
+	return diagnostics, true, nil
+}
+
+func (o DiagnosticsOptions) findClusterClients(rawConfig *clientcmdapi.Config) (*client.Client, *kclient.Client, bool, error) {
+	if o.ClientClusterContext != "" { // user has specified cluster context to use
+		if context, exists := rawConfig.Contexts[o.ClientClusterContext]; !exists {
+			configErr := fmt.Errorf("Specified '%s' as cluster-admin context, but it was not found in your client configuration.", o.ClientClusterContext)
+			o.Logger.Error("discClustCtx", configErr.Error())
+			return nil, nil, false, configErr
+		} else if os, kube, found, err := o.makeClusterClients(rawConfig, o.ClientClusterContext, context); found {
+			return os, kube, true, err
+		} else {
+			return nil, nil, false, err
+		}
+	}
+	currentContext, exists := rawConfig.Contexts[rawConfig.CurrentContext]
+	if !exists { // config specified cluster admin context that doesn't exist; complain and quit
+		configErr := fmt.Errorf("Current context '%s' not found in client configuration; will not attempt cluster diagnostics.", rawConfig.CurrentContext)
+		o.Logger.Errorf("discClustCtx", configErr.Error())
+		return nil, nil, false, configErr
+	}
+	// check if current context is already cluster admin
+	if os, kube, found, err := o.makeClusterClients(rawConfig, rawConfig.CurrentContext, currentContext); found {
+		return os, kube, true, err
+	}
+	// otherwise, for convenience, search for a context with the same server but with the system:admin user
+	for name, context := range rawConfig.Contexts {
+		if context.Cluster == currentContext.Cluster && name != rawConfig.CurrentContext && strings.HasPrefix(context.AuthInfo, "system:admin/") {
+			if os, kube, found, err := o.makeClusterClients(rawConfig, name, context); found {
+				return os, kube, true, err
+			} else {
+				return nil, nil, false, err // don't try more than one such context, they'll probably fail the same
+			}
+		}
+	}
+	return nil, nil, false, nil
+}
+
+func (o DiagnosticsOptions) makeClusterClients(rawConfig *clientcmdapi.Config, contextName string, context *clientcmdapi.Context) (*client.Client, *kclient.Client, bool, error) {
+	overrides := &clientcmd.ConfigOverrides{Context: *context}
+	clientConfig := clientcmd.NewDefaultClientConfig(*rawConfig, overrides)
+	factory := osclientcmd.NewFactory(clientConfig)
+	o.Logger.Debugf("discClustCtxStart", "Checking if context is cluster-admin: '%s'", contextName)
+	if osClient, kubeClient, err := factory.Clients(); err != nil {
+		o.Logger.Debugf("discClustCtx", "Error creating client for context '%s':\n%v", contextName, err)
+		return nil, nil, false, nil
+	} else {
+		subjectAccessReview := authorizationapi.SubjectAccessReview{
+			// we assume if you can list nodes, you're the cluster admin.
+			Verb:     "list",
+			Resource: "nodes",
+		}
+		if resp, err := osClient.SubjectAccessReviews("default").Create(&subjectAccessReview); err != nil {
+			o.Logger.Errorf("discClustCtx", "Error testing cluster-admin access for context '%s':\n%v", contextName, err)
+			return nil, nil, false, err
+		} else if resp.Allowed {
+			o.Logger.Infof("discClustCtxFound", "Using context for cluster-admin access: '%s'", contextName)
+			return osClient, kubeClient, true, nil
+		}
+	}
+	o.Logger.Debugf("discClustCtx", "Context does not have cluster-admin access: '%s'", contextName)
+	return nil, nil, false, nil
+}
new file mode 100644
... ...
@@ -0,0 +1,29 @@
+package diagnostics
+
+import (
+	clientcmdapi "github.com/GoogleCloudPlatform/kubernetes/pkg/client/clientcmd/api"
+	"github.com/openshift/origin/pkg/cmd/cli/config"
+
+	clientdiagnostics "github.com/openshift/origin/pkg/diagnostics/client"
+	"github.com/openshift/origin/pkg/diagnostics/log"
+	"github.com/openshift/origin/pkg/diagnostics/types"
+)
+
+func (o DiagnosticsOptions) detectClientConfig() (bool, []types.DiagnosticError, []types.DiagnosticError) {
+	diagnostic := &clientdiagnostics.ConfigLoading{ConfFlagName: config.OpenShiftConfigFlagName, ClientFlags: o.ClientFlags}
+	o.Logger.Noticet("diagRun", "Determining if client configuration exists for client/cluster diagnostics",
+		log.Hash{"area": "client", "name": diagnostic.Name(), "diag": diagnostic.Description()})
+	result := diagnostic.Check()
+	for _, entry := range result.Logs() {
+		o.Logger.LogEntry(entry)
+	}
+	return diagnostic.SuccessfulLoad(), result.Warnings(), result.Errors()
+}
+
+func (o DiagnosticsOptions) buildRawConfig() (*clientcmdapi.Config, error) {
+	kubeConfig, configErr := o.Factory.OpenShiftClientConfig.RawConfig()
+	if len(kubeConfig.Contexts) == 0 {
+		return nil, configErr
+	}
+	return &kubeConfig, configErr
+}
... ...
@@ -2,89 +2,80 @@ package diagnostics
 
 import (
 	"fmt"
+	"github.com/spf13/cobra"
+	flag "github.com/spf13/pflag"
 	"io"
 	"os"
 
-	"github.com/spf13/cobra"
-
 	kcmdutil "github.com/GoogleCloudPlatform/kubernetes/pkg/kubectl/cmd/util"
 	"github.com/GoogleCloudPlatform/kubernetes/pkg/util"
 	kutilerrors "github.com/GoogleCloudPlatform/kubernetes/pkg/util/errors"
-
-	diagnosticflags "github.com/openshift/origin/pkg/cmd/experimental/diagnostics/options"
-	"github.com/openshift/origin/pkg/cmd/templates"
+	"github.com/openshift/origin/pkg/cmd/cli/config"
+	"github.com/openshift/origin/pkg/cmd/flagtypes"
 	osclientcmd "github.com/openshift/origin/pkg/cmd/util/clientcmd"
-	"github.com/openshift/origin/pkg/diagnostics/log"
-)
 
-var (
-	AvailableOverallDiagnostics = util.NewStringSet()
+	"github.com/openshift/origin/pkg/cmd/experimental/diagnostics/options"
+	"github.com/openshift/origin/pkg/diagnostics/log"
+	"github.com/openshift/origin/pkg/diagnostics/types"
 )
 
-func init() {
-	AvailableOverallDiagnostics.Insert(AvailableClientDiagnostics.List()...)
-	AvailableOverallDiagnostics.Insert(AvailableMasterDiagnostics.List()...)
-	AvailableOverallDiagnostics.Insert(AvailableNodeDiagnostics.List()...)
-}
-
-type OverallDiagnosticsOptions struct {
+type DiagnosticsOptions struct {
 	RequestedDiagnostics util.StringList
 
 	MasterConfigLocation string
 	NodeConfigLocation   string
+	ClientClusterContext string
+	IsHost               bool
 
-	Factory *osclientcmd.Factory
+	ClientFlags *flag.FlagSet
+	Factory     *osclientcmd.Factory
 
 	LogOptions *log.LoggerOptions
 	Logger     *log.Logger
 }
 
-const longAllDescription = `
+const longDescription = `
 OpenShift Diagnostics
 
-This command helps you understand and troubleshoot OpenShift. It is
-intended to be run from the same context as an OpenShift client or running
-master / node in order to troubleshoot from the perspective of each.
+This command helps you understand and troubleshoot OpenShift. It runs
+diagnostics against an OpenShift cluster as a client, and/or against the
+state of a running master / node host.
 
     $ %[1]s
 
-If run without flags or subcommands, it will check for config files for
-client, master, and node, and if found, use them for troubleshooting
-those components. If master/node config files are not found, the tool
-assumes they are not present and does diagnostics only as a client.
-
-You may also specify config files explicitly with flags below, in which
-case you will receive an error if they are invalid or not found.
+If run without flags, it will check for standard config files for
+client, master, and node, and if found, use them for diagnostics.
+You may also specify config files explicitly with flags, in which case
+you will receive an error if they are not found. For example:
 
     $ %[1]s --master-config=/etc/openshift/master/master-config.yaml
 
-Subcommands may be used to scope the troubleshooting to a particular
-component and are not limited to using config files; you can and should
-use the same flags that are actually set on the command line for that
-component to configure the diagnostic.
+* If master/node config files are not found and the --host flag is not
+  present, host diagnostics are skipped.
+* If the client has cluster-admin access, this enables cluster
+  diagnostics that regular users cannot run.
+* If a client config file is not found, client and cluster diagnostics
+  are skipped.
 
-    $ %[1]s node --hostname='node.example.com' --kubeconfig=...
-
-NOTE: This is an alpha version of diagnostics and will change significantly.
-NOTE: Global flags (from the 'options' subcommand) are ignored here but
-can be used with subcommands.
+NOTE: This is a beta version of diagnostics and may still evolve in a
+different direction.
 `
 
 func NewCommandDiagnostics(name string, fullName string, out io.Writer) *cobra.Command {
-	o := &OverallDiagnosticsOptions{
-		RequestedDiagnostics: AvailableOverallDiagnostics.List(),
+	o := &DiagnosticsOptions{
+		RequestedDiagnostics: util.StringList{},
 		LogOptions:           &log.LoggerOptions{Out: out},
 	}
 
 	cmd := &cobra.Command{
 		Use:   name,
 		Short: "This utility helps you understand and troubleshoot OpenShift v3.",
-		Long:  fmt.Sprintf(longAllDescription, fullName),
+		Long:  fmt.Sprintf(longDescription, fullName),
 		Run: func(c *cobra.Command, args []string) {
 			kcmdutil.CheckErr(o.Complete())
 
-			failed, err := o.RunDiagnostics()
-			o.Logger.Summary()
+			failed, err, warnCount, errorCount := o.RunDiagnostics()
+			o.Logger.Summary(warnCount, errorCount)
 			o.Logger.Finish()
 
 			kcmdutil.CheckErr(err)
... ...
@@ -96,21 +87,22 @@ func NewCommandDiagnostics(name string, fullName string, out io.Writer) *cobra.C
 	}
 	cmd.SetOutput(out) // for output re: usage / help
 
-	o.Factory = osclientcmd.New(cmd.Flags()) // side effect: add standard persistent flags for openshift client
-	cmd.Flags().StringVar(&o.MasterConfigLocation, "master-config", "", "path to master config file")
-	cmd.Flags().StringVar(&o.NodeConfigLocation, "node-config", "", "path to node config file")
-	diagnosticflags.BindLoggerOptionFlags(cmd.Flags(), o.LogOptions, diagnosticflags.RecommendedLoggerOptionFlags())
-	diagnosticflags.BindDiagnosticFlag(cmd.Flags(), &o.RequestedDiagnostics, diagnosticflags.NewRecommendedDiagnosticFlag())
-
-	cmd.AddCommand(NewClientCommand(ClientDiagnosticsRecommendedName, name+" "+ClientDiagnosticsRecommendedName, out))
-	cmd.AddCommand(NewMasterCommand(MasterDiagnosticsRecommendedName, name+" "+MasterDiagnosticsRecommendedName, out))
-	cmd.AddCommand(NewNodeCommand(NodeDiagnosticsRecommendedName, name+" "+NodeDiagnosticsRecommendedName, out))
-	cmd.AddCommand(NewOptionsCommand())
+	o.ClientFlags = flag.NewFlagSet("client", flag.ContinueOnError) // hide the extensive set of client flags
+	o.Factory = osclientcmd.New(o.ClientFlags)                      // that would otherwise be added to this command
+	cmd.Flags().AddFlag(o.ClientFlags.Lookup(config.OpenShiftConfigFlagName))
+	cmd.Flags().AddFlag(o.ClientFlags.Lookup("context")) // TODO: find k8s constant
+	cmd.Flags().StringVar(&o.ClientClusterContext, options.FlagClusterContextName, "", "client context to use for cluster administrator")
+	cmd.Flags().StringVar(&o.MasterConfigLocation, options.FlagMasterConfigName, "", "path to master config file (implies --host)")
+	cmd.Flags().StringVar(&o.NodeConfigLocation, options.FlagNodeConfigName, "", "path to node config file (implies --host)")
+	cmd.Flags().BoolVar(&o.IsHost, options.FlagIsHostName, false, "look for systemd and journald units even without master/node config")
+	flagtypes.GLog(cmd.Flags())
+	options.BindLoggerOptionFlags(cmd.Flags(), o.LogOptions, options.RecommendedLoggerOptionFlags())
+	options.BindDiagnosticFlag(cmd.Flags(), &o.RequestedDiagnostics, options.NewRecommendedDiagnosticFlag())
 
 	return cmd
 }
 
-func (o *OverallDiagnosticsOptions) Complete() error {
+func (o *DiagnosticsOptions) Complete() error {
 	var err error
 	o.Logger, err = o.LogOptions.NewLogger()
 	if err != nil {
... ...
@@ -120,112 +112,129 @@ func (o *OverallDiagnosticsOptions) Complete() error {
 	return nil
 }
 
-func (o OverallDiagnosticsOptions) RunDiagnostics() (bool, error) {
+func (o DiagnosticsOptions) RunDiagnostics() (bool, error, int, int) {
 	failed := false
+	warnings := []error{}
 	errors := []error{}
-
-	masterFailed, err := o.CheckMaster()
-	failed = failed && masterFailed
-	if err != nil {
-		errors = append(errors, err)
-	}
-
-	nodeFailed, err := o.CheckNode()
-	failed = failed && nodeFailed
-	if err != nil {
-		errors = append(errors, err)
-	}
-
-	clientFailed, err := o.CheckClient()
-	failed = failed && clientFailed
-	if err != nil {
-		errors = append(errors, err)
-	}
-
-	return failed, kutilerrors.NewAggregate(errors)
-}
-
-func (o OverallDiagnosticsOptions) CheckClient() (bool, error) {
-	runClientChecks := true
-
-	_, kubeClient, err := o.Factory.Clients()
-	if err != nil {
-		runClientChecks = false
+	diagnostics := map[string][]types.Diagnostic{}
+	AvailableDiagnostics := util.NewStringSet()
+	AvailableDiagnostics.Insert(AvailableClientDiagnostics.List()...)
+	AvailableDiagnostics.Insert(AvailableClusterDiagnostics.List()...)
+	AvailableDiagnostics.Insert(AvailableHostDiagnostics.List()...)
+	if len(o.RequestedDiagnostics) == 0 {
+		o.RequestedDiagnostics = AvailableDiagnostics.List()
+	} else if common := intersection(util.NewStringSet(o.RequestedDiagnostics...), AvailableDiagnostics); len(common) == 0 {
+		o.Logger.Errort("emptyReqDiag", "None of the requested diagnostics are available:\n  {{.requested}}\nPlease try from the following:\n  {{.available}}",
+			log.Hash{"requested": o.RequestedDiagnostics, "available": AvailableDiagnostics.List()})
+		return false, fmt.Errorf("No requested diagnostics available"), 0, 1
+	} else if len(common) < len(o.RequestedDiagnostics) {
+		errors = append(errors, fmt.Errorf("Not all requested diagnostics are available"))
+		o.Logger.Errort("notAllReqDiag", `
+Of the requested diagnostics:
+    {{.requested}}
+only these are available:
+    {{.common}}
+The list of all possible is:
+    {{.available}}
+		`, log.Hash{"requested": o.RequestedDiagnostics, "common": common.List(), "available": AvailableDiagnostics.List()})
 	}
 
-	kubeConfig, err := o.Factory.OpenShiftClientConfig.RawConfig()
-	if err != nil {
-		runClientChecks = false
-	}
-
-	if runClientChecks {
-		clientDiagnosticOptions := &ClientDiagnosticsOptions{
-			RequestedDiagnostics: intersection(util.NewStringSet(o.RequestedDiagnostics...), AvailableClientDiagnostics).List(),
-			KubeClient:           kubeClient,
-			KubeConfig:           &kubeConfig,
-			LogOptions:           o.LogOptions,
-			Logger:               o.Logger,
+	func() { // don't trust discovery/build of diagnostics; wrap panic nicely in case of developer error
+		defer func() {
+			if r := recover(); r != nil {
+				failed = true
+				errors = append(errors, fmt.Errorf("While building the diagnostics, a panic was encountered.\nThis is a bug in diagnostics. Stack trace follows : \n%v", r))
+			}
+		}()
+		detected, detectWarnings, detectErrors := o.detectClientConfig() // may log and return problems
+		for _, warn := range detectWarnings {
+			warnings = append(warnings, warn)
 		}
+		for _, err := range detectErrors {
+			errors = append(errors, err)
+		}
+		if !detected { // there just plain isn't any client config file available
+			o.Logger.Notice("discNoClientConf", "No client configuration specified; skipping client and cluster diagnostics.")
+		} else if rawConfig, err := o.buildRawConfig(); rawConfig == nil { // client config is totally broken - won't parse etc (problems may have been detected and logged)
+			o.Logger.Errorf("discBrokenClientConf", "Client configuration failed to load; skipping client and cluster diagnostics due to error: {{.error}}", log.Hash{"error": err.Error()})
+			errors = append(errors, err)
+		} else {
+			if err != nil { // error encountered, proceed with caution
+				o.Logger.Errorf("discClientConfErr", "Client configuration loading encountered an error, but proceeding anyway. Error was:\n{{.error}}", log.Hash{"error": err.Error()})
+				errors = append(errors, err)
+			}
+			if clientDiags, ok, err := o.buildClientDiagnostics(rawConfig); ok {
+				diagnostics["client"] = clientDiags
+			} else if err != nil {
+				failed = true
+				errors = append(errors, err)
+			}
 
-		return clientDiagnosticOptions.RunDiagnostics()
-	}
-
-	return false, nil
-}
-
-func (o OverallDiagnosticsOptions) CheckNode() (bool, error) {
-	if len(o.NodeConfigLocation) == 0 {
-		if _, err := os.Stat(StandardNodeConfigPath); !os.IsNotExist(err) {
-			o.NodeConfigLocation = StandardNodeConfigPath
+			if clusterDiags, ok, err := o.buildClusterDiagnostics(rawConfig); ok {
+				diagnostics["cluster"] = clusterDiags
+			} else if err != nil {
+				failed = true
+				errors = append(errors, err)
+			}
 		}
-	}
 
-	if len(o.NodeConfigLocation) != 0 {
-		masterDiagnosticOptions := &NodeDiagnosticsOptions{
-			RequestedDiagnostics: intersection(util.NewStringSet(o.RequestedDiagnostics...), AvailableNodeDiagnostics).List(),
-			NodeConfigLocation:   o.NodeConfigLocation,
-			LogOptions:           o.LogOptions,
-			Logger:               o.Logger,
+		if hostDiags, ok, err := o.buildHostDiagnostics(); ok {
+			diagnostics["host"] = hostDiags
+		} else if err != nil {
+			failed = true
+			errors = append(errors, err)
 		}
+	}()
 
-		return masterDiagnosticOptions.RunDiagnostics()
+	if failed {
+		return failed, kutilerrors.NewAggregate(errors), len(warnings), len(errors)
 	}
 
-	return false, nil
+	failed, err, numWarnings, numErrors := o.Run(diagnostics)
+	numWarnings += len(warnings)
+	numErrors += len(errors)
+	return failed, err, numWarnings, numErrors
 }
 
-func (o OverallDiagnosticsOptions) CheckMaster() (bool, error) {
-	if len(o.MasterConfigLocation) == 0 {
-		if _, err := os.Stat(StandardMasterConfigPath); !os.IsNotExist(err) {
-			o.MasterConfigLocation = StandardMasterConfigPath
+func (o DiagnosticsOptions) Run(diagnostics map[string][]types.Diagnostic) (bool, error, int, int) {
+	warnCount := 0
+	errorCount := 0
+	for area, areaDiagnostics := range diagnostics {
+		for _, diagnostic := range areaDiagnostics {
+			func() { // wrap diagnostic panic nicely in case of developer error
+				defer func() {
+					if r := recover(); r != nil {
+						errorCount += 1
+						o.Logger.Errort("diagPanic",
+							"While running the {{.area}}.{{.name}} diagnostic, a panic was encountered.\nThis is a bug in diagnostics. Stack trace follows : \n{{.error}}",
+							log.Hash{"area": area, "name": diagnostic.Name(), "error": fmt.Sprintf("%v", r)})
+					}
+				}()
+
+				if canRun, reason := diagnostic.CanRun(); !canRun {
+					if reason == nil {
+						o.Logger.Noticet("diagSkip", "Skipping diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}",
+							log.Hash{"area": area, "name": diagnostic.Name(), "diag": diagnostic.Description()})
+					} else {
+						o.Logger.Noticet("diagSkip", "Skipping diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}\nBecause: {{.reason}}",
+							log.Hash{"area": area, "name": diagnostic.Name(), "diag": diagnostic.Description(), "reason": reason.Error()})
+					}
+					return
+				}
+
+				o.Logger.Noticet("diagRun", "Running diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}",
+					log.Hash{"area": area, "name": diagnostic.Name(), "diag": diagnostic.Description()})
+				r := diagnostic.Check()
+				for _, entry := range r.Logs() {
+					o.Logger.LogEntry(entry)
+				}
+				warnCount += len(r.Warnings())
+				errorCount += len(r.Errors())
+			}()
 		}
-	}
-
-	if len(o.MasterConfigLocation) != 0 {
-		masterDiagnosticOptions := &MasterDiagnosticsOptions{
-			RequestedDiagnostics: intersection(util.NewStringSet(o.RequestedDiagnostics...), AvailableMasterDiagnostics).List(),
-			MasterConfigLocation: o.MasterConfigLocation,
-			LogOptions:           o.LogOptions,
-			Logger:               o.Logger,
-		}
-
-		return masterDiagnosticOptions.RunDiagnostics()
-	}
-
-	return false, nil
-}
 
-func NewOptionsCommand() *cobra.Command {
-	cmd := &cobra.Command{
-		Use: "options",
-		Run: func(cmd *cobra.Command, args []string) {
-			cmd.Usage()
-		},
 	}
-
-	templates.UseOptionsTemplates(cmd)
-
-	return cmd
+	return errorCount > 0, nil, warnCount, errorCount
 }
 
 // TODO move upstream
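
Note: the builders above all filter requests through an intersection helper whose body falls outside this excerpt (the trailing "// TODO move upstream" comment introduces it). A plausible minimal version, inferred from its call sites and not taken from the commit itself:

    // Hypothetical sketch of the elided helper: the set of names present in
    // both StringSets, matching calls like
    // intersection(util.NewStringSet(o.RequestedDiagnostics...), AvailableClientDiagnostics).List()
    func intersection(s1 util.StringSet, s2 util.StringSet) util.StringSet {
        result := util.NewStringSet()
        for _, item := range s1.List() {
            if s2.Has(item) {
                result.Insert(item)
            }
        }
        return result
    }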
new file mode 100644
... ...
@@ -0,0 +1,76 @@
+package diagnostics
+
+import (
+	"fmt"
+	"github.com/GoogleCloudPlatform/kubernetes/pkg/util"
+	"github.com/openshift/origin/pkg/diagnostics/host"
+	systemddiagnostics "github.com/openshift/origin/pkg/diagnostics/systemd"
+	"github.com/openshift/origin/pkg/diagnostics/types"
+	"os"
+)
+
+const (
+	StandardMasterConfigPath string = "/etc/openshift/master/master-config.yaml"
+	StandardNodeConfigPath   string = "/etc/openshift/node/node-config.yaml"
+)
+
+var (
+	AvailableHostDiagnostics = util.NewStringSet("AnalyzeLogs", "UnitStatus", "MasterConfigCheck", "NodeConfigCheck")
+)
+
+func (o DiagnosticsOptions) buildHostDiagnostics() ([]types.Diagnostic, bool /* ok */, error) {
+	requestedDiagnostics := intersection(util.NewStringSet(o.RequestedDiagnostics...), AvailableHostDiagnostics).List()
+	if len(requestedDiagnostics) == 0 { // no diagnostics to run here
+		return nil, true, nil // don't waste time on discovery
+	}
+	isHost := o.IsHost
+	// check for standard host config paths if not given
+	if len(o.MasterConfigLocation) == 0 {
+		if _, err := os.Stat(StandardMasterConfigPath); !os.IsNotExist(err) {
+			o.MasterConfigLocation = StandardMasterConfigPath
+			isHost = true
+		}
+	} else {
+		isHost = true
+	}
+	if len(o.NodeConfigLocation) == 0 {
+		if _, err := os.Stat(StandardNodeConfigPath); !os.IsNotExist(err) {
+			o.NodeConfigLocation = StandardNodeConfigPath
+			isHost = true
+		}
+	} else {
+		isHost = true
+	}
+
+	// If we're not looking at a host, don't try the diagnostics
+	if !isHost {
+		return nil, true, nil
+	}
+
+	diagnostics := []types.Diagnostic{}
+	systemdUnits := systemddiagnostics.GetSystemdUnits(o.Logger)
+	for _, diagnosticName := range requestedDiagnostics {
+		switch diagnosticName {
+		case "AnalyzeLogs":
+			diagnostics = append(diagnostics, systemddiagnostics.AnalyzeLogs{systemdUnits})
+
+		case "UnitStatus":
+			diagnostics = append(diagnostics, systemddiagnostics.UnitStatus{systemdUnits})
+
+		case "MasterConfigCheck":
+			if len(o.MasterConfigLocation) > 0 {
+				diagnostics = append(diagnostics, host.MasterConfigCheck{o.MasterConfigLocation})
+			}
+
+		case "NodeConfigCheck":
+			if len(o.NodeConfigLocation) > 0 {
+				diagnostics = append(diagnostics, host.NodeConfigCheck{o.NodeConfigLocation})
+			}
+
+		default:
+			return diagnostics, false, fmt.Errorf("unknown diagnostic: %v", diagnosticName)
+		}
+	}
+
+	return diagnostics, true, nil
+}
deleted file mode 100644
... ...
@@ -1,143 +0,0 @@
-package diagnostics
-
-import (
-	"fmt"
-	"io"
-	"os"
-
-	"github.com/spf13/cobra"
-
-	kcmdutil "github.com/GoogleCloudPlatform/kubernetes/pkg/kubectl/cmd/util"
-	"github.com/GoogleCloudPlatform/kubernetes/pkg/util"
-
-	diagnosticflags "github.com/openshift/origin/pkg/cmd/experimental/diagnostics/options"
-	"github.com/openshift/origin/pkg/diagnostics/log"
-	masterdiagnostics "github.com/openshift/origin/pkg/diagnostics/master"
-	systemddiagnostics "github.com/openshift/origin/pkg/diagnostics/systemd"
-	diagnostictypes "github.com/openshift/origin/pkg/diagnostics/types/diagnostic"
-)
-
-const (
-	MasterDiagnosticsRecommendedName = "master"
-
-	StandardMasterConfigPath string = "/etc/openshift/master/master-config.yaml"
-)
-
-var (
-	AvailableMasterDiagnostics = util.NewStringSet("AnalyzeLogs", "UnitStatus", "MasterConfigCheck")
-)
-
-// user options for openshift-diagnostics client command
-type MasterDiagnosticsOptions struct {
-	RequestedDiagnostics util.StringList
-
-	MasterConfigLocation string
-
-	LogOptions *log.LoggerOptions
-	Logger     *log.Logger
-}
-
-const longMasterDescription = `
-OpenShift Diagnostics
-
-This command helps you understand and troubleshoot a running OpenShift
-master. It is intended to be run from the same context as the master
-(where "openshift start" or "openshift start master" is run, possibly from
-systemd or inside a container) and with the same configuration options.
-
-    $ %s
-`
-
-func NewMasterCommand(name string, fullName string, out io.Writer) *cobra.Command {
-	o := &MasterDiagnosticsOptions{
-		RequestedDiagnostics: AvailableMasterDiagnostics.List(),
-		LogOptions:           &log.LoggerOptions{Out: out},
-	}
-
-	cmd := &cobra.Command{
-		Use:   name,
-		Short: "Troubleshoot an OpenShift v3 master.",
-		Long:  fmt.Sprintf(longMasterDescription, fullName),
-		Run: func(c *cobra.Command, args []string) {
-			kcmdutil.CheckErr(o.Complete())
-
-			failed, err := o.RunDiagnostics()
-			o.Logger.Summary()
-			o.Logger.Finish()
-
-			kcmdutil.CheckErr(err)
-			if failed {
-				os.Exit(255)
-			}
-		},
-	}
-
-	cmd.SetOutput(out) // for output re: usage / help
-
-	cmd.Flags().StringVar(&o.MasterConfigLocation, "master-config", "", "path to master config file")
-	diagnosticflags.BindLoggerOptionFlags(cmd.Flags(), o.LogOptions, diagnosticflags.RecommendedLoggerOptionFlags())
-	diagnosticflags.BindDiagnosticFlag(cmd.Flags(), &o.RequestedDiagnostics, diagnosticflags.NewRecommendedDiagnosticFlag())
-
-	return cmd
-}
-
-func (o *MasterDiagnosticsOptions) Complete() error {
-	// set the master config location if it hasn't been set and we find it in an expected location
-	if len(o.MasterConfigLocation) == 0 {
-		if _, err := os.Stat(StandardMasterConfigPath); !os.IsNotExist(err) {
-			o.MasterConfigLocation = StandardMasterConfigPath
-		}
-
-	}
-
-	var err error
-	o.Logger, err = o.LogOptions.NewLogger()
-	if err != nil {
-		return err
-	}
-
-	return nil
-}
-
-func (o MasterDiagnosticsOptions) RunDiagnostics() (bool, error) {
-	diagnostics := map[string]diagnostictypes.Diagnostic{}
-
-	// if we don't have a master config file, then there's no work to do
-	if len(o.MasterConfigLocation) == 0 {
-		// TODO remove MasterConfigCheck from the list
-	}
-
-	systemdUnits := systemddiagnostics.GetSystemdUnits(o.Logger)
-
-	for _, diagnosticName := range o.RequestedDiagnostics {
-		switch diagnosticName {
-		case "AnalyzeLogs":
-			diagnostics[diagnosticName] = systemddiagnostics.AnalyzeLogs{systemdUnits, o.Logger}
-
-		case "UnitStatus":
-			diagnostics[diagnosticName] = systemddiagnostics.UnitStatus{systemdUnits, o.Logger}
-
-		case "MasterConfigCheck":
-			diagnostics[diagnosticName] = masterdiagnostics.MasterConfigCheck{o.MasterConfigLocation, o.Logger}
-
-		default:
-			return false, fmt.Errorf("unknown diagnostic: %v", diagnosticName)
-		}
-	}
-
-	for name, diagnostic := range diagnostics {
-		if canRun, reason := diagnostic.CanRun(); !canRun {
-			if reason == nil {
-				o.Logger.Noticem(log.Message{ID: "diagSkip", Template: "Skipping diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}", TemplateData: map[string]string{"area": "master", "name": name, "diag": diagnostic.Description()}})
-			} else {
-				o.Logger.Noticem(log.Message{ID: "diagSkip", Template: "Skipping diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}\nBecause: {{.reason}}", TemplateData: map[string]string{"area": "master", "name": name, "diag": diagnostic.Description(), "reason": reason.Error()}})
-			}
-			continue
-		}
-
-		o.Logger.Noticem(log.Message{ID: "diagRun", Template: "Running diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}", TemplateData: map[string]string{"area": "master", "name": name, "diag": diagnostic.Description()}})
-		diagnostic.Check()
-	}
-
-	return o.Logger.ErrorsSeen(), nil
-}
deleted file mode 100644
... ...
@@ -1,142 +0,0 @@
-package diagnostics
-
-import (
-	"fmt"
-	"io"
-	"os"
-
-	"github.com/spf13/cobra"
-
-	kcmdutil "github.com/GoogleCloudPlatform/kubernetes/pkg/kubectl/cmd/util"
-	"github.com/GoogleCloudPlatform/kubernetes/pkg/util"
-
-	diagnosticflags "github.com/openshift/origin/pkg/cmd/experimental/diagnostics/options"
-	"github.com/openshift/origin/pkg/diagnostics/log"
-	nodediagnostics "github.com/openshift/origin/pkg/diagnostics/node"
-	systemddiagnostics "github.com/openshift/origin/pkg/diagnostics/systemd"
-	diagnostictypes "github.com/openshift/origin/pkg/diagnostics/types/diagnostic"
-)
-
-const (
-	NodeDiagnosticsRecommendedName = "node"
-
-	StandardNodeConfigPath string = "/etc/openshift/node/node-config.yaml"
-)
-
-var (
-	AvailableNodeDiagnostics = util.NewStringSet("AnalyzeLogs", "UnitStatus", "NodeConfigCheck")
-)
-
-// user options for openshift-diagnostics client command
-type NodeDiagnosticsOptions struct {
-	RequestedDiagnostics util.StringList
-
-	NodeConfigLocation string
-
-	LogOptions *log.LoggerOptions
-	Logger     *log.Logger
-}
-
-const longNodeDescription = `
-OpenShift Diagnostics
-
-This command helps you understand and troubleshoot a running OpenShift
-node. It is intended to be run from the same context as the node
-(where "openshift start" or "openshift start node" is run, possibly from
-systemd or inside a container) and with the same configuration options.
-
-    $ %s
-`
-
-func NewNodeCommand(name string, fullName string, out io.Writer) *cobra.Command {
-	o := &NodeDiagnosticsOptions{
-		RequestedDiagnostics: AvailableNodeDiagnostics.List(),
-		LogOptions:           &log.LoggerOptions{Out: out},
-	}
-
-	cmd := &cobra.Command{
-		Use:   name,
-		Short: "Troubleshoot an OpenShift v3 node.",
-		Long:  fmt.Sprintf(longNodeDescription, fullName),
-		Run: func(c *cobra.Command, args []string) {
-			kcmdutil.CheckErr(o.Complete())
-
-			failed, err := o.RunDiagnostics()
-			o.Logger.Summary()
-			o.Logger.Finish()
-
-			kcmdutil.CheckErr(err)
-			if failed {
-				os.Exit(255)
-			}
-		},
-	}
-
-	cmd.SetOutput(out) // for output re: usage / help
-
-	cmd.Flags().StringVar(&o.NodeConfigLocation, "node-config", "", "path to node config file")
-	diagnosticflags.BindLoggerOptionFlags(cmd.Flags(), o.LogOptions, diagnosticflags.RecommendedLoggerOptionFlags())
-	diagnosticflags.BindDiagnosticFlag(cmd.Flags(), &o.RequestedDiagnostics, diagnosticflags.NewRecommendedDiagnosticFlag())
-
-	return cmd
-}
-
-func (o *NodeDiagnosticsOptions) Complete() error {
-	// set the node config location if it hasn't been set and we find it in an expected location
-	if len(o.NodeConfigLocation) == 0 {
-		if _, err := os.Stat(StandardNodeConfigPath); !os.IsNotExist(err) {
-			o.NodeConfigLocation = StandardNodeConfigPath
-		}
-	}
-
-	var err error
-	o.Logger, err = o.LogOptions.NewLogger()
-	if err != nil {
-		return err
-	}
-
-	return nil
-}
-
-func (o NodeDiagnosticsOptions) RunDiagnostics() (bool, error) {
-	diagnostics := map[string]diagnostictypes.Diagnostic{}
-
-	// if we don't have a node config file, then there's no work to do
-	if len(o.NodeConfigLocation) == 0 {
-		// TODO remove NodeConfigCheck from the list
-	}
-
-	systemdUnits := systemddiagnostics.GetSystemdUnits(o.Logger)
-
-	for _, diagnosticName := range o.RequestedDiagnostics {
-		switch diagnosticName {
-		case "AnalyzeLogs":
-			diagnostics[diagnosticName] = systemddiagnostics.AnalyzeLogs{systemdUnits, o.Logger}
-
-		case "UnitStatus":
-			diagnostics[diagnosticName] = systemddiagnostics.UnitStatus{systemdUnits, o.Logger}
-
-		case "NodeConfigCheck":
-			diagnostics[diagnosticName] = nodediagnostics.NodeConfigCheck{o.NodeConfigLocation, o.Logger}
-
-		default:
-			return false, fmt.Errorf("unknown diagnostic: %v", diagnosticName)
-		}
-	}
-
-	for name, diagnostic := range diagnostics {
-		if canRun, reason := diagnostic.CanRun(); !canRun {
-			if reason == nil {
-				o.Logger.Noticem(log.Message{ID: "diagSkip", Template: "Skipping diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}", TemplateData: map[string]string{"area": "node", "name": name, "diag": diagnostic.Description()}})
-			} else {
-				o.Logger.Noticem(log.Message{ID: "diagSkip", Template: "Skipping diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}\nBecause: {{.reason}}", TemplateData: map[string]string{"area": "node", "name": name, "diag": diagnostic.Description(), "reason": reason.Error()}})
-			}
-			continue
-		}
-
-		o.Logger.Noticem(log.Message{ID: "diagRun", Template: "Running diagnostic: {{.area}}.{{.name}}\nDescription: {{.diag}}", TemplateData: map[string]string{"area": "node", "name": name, "diag": diagnostic.Description()}})
-		diagnostic.Check()
-	}
-
-	return o.Logger.ErrorsSeen(), nil
-}
... ...
@@ -8,27 +8,27 @@ import (
 	"github.com/openshift/origin/pkg/diagnostics/log"
 )
 
-type RecommendedLoggerOptionsFlags struct {
+type LoggerOptionFlags struct {
 	Level  FlagInfo
 	Format FlagInfo
 }
 
 // default overrideable flag specifications to be bound to options.
-func RecommendedLoggerOptionFlags() RecommendedLoggerOptionsFlags {
-	return RecommendedLoggerOptionsFlags{
+func RecommendedLoggerOptionFlags() LoggerOptionFlags {
+	return LoggerOptionFlags{
 		Level:  FlagInfo{FlagLevelName, "l", "1", "Level of diagnostic output: 4: Error, 3: Warn, 2: Notice, 1: Info, 0: Debug"},
 		Format: FlagInfo{FlagFormatName, "o", "text", "Output format: text|json|yaml"},
 	}
 }
 
-func BindLoggerOptionFlags(cmdFlags *pflag.FlagSet, loggerOptions *log.LoggerOptions, flags RecommendedLoggerOptionsFlags) {
+func BindLoggerOptionFlags(cmdFlags *pflag.FlagSet, loggerOptions *log.LoggerOptions, flags LoggerOptionFlags) {
 	flags.Level.BindIntFlag(cmdFlags, &loggerOptions.Level)
 	flags.Format.BindStringFlag(cmdFlags, &loggerOptions.Format)
 }
 
 // default overrideable flag specifications to be bound to options.
 func NewRecommendedDiagnosticFlag() FlagInfo {
-	return FlagInfo{FlagDiagnosticsName, "d", "", `comma-separated list of diagnostic names to run, e.g. "systemd.AnalyzeLogs"`}
+	return FlagInfo{FlagDiagnosticsName, "d", "", `comma-separated list of diagnostic names to run, e.g. "AnalyzeLogs"`}
 }
 
 func BindDiagnosticFlag(cmdFlags *pflag.FlagSet, diagnostics *util.StringList, flagInfo FlagInfo) {
... ...
@@ -14,10 +14,11 @@ type FlagInfo kclientcmd.FlagInfo // reuse to add methods
 // with tweaked definitions in different contexts if necessary.
 
 func (i FlagInfo) BindStringFlag(flags *pflag.FlagSet, target *string) {
-	// assume flags with no longname are not desired
-	if len(i.LongName) > 0 {
-		flags.StringVarP(target, i.LongName, i.ShortName, i.Default, i.Description)
-	}
+	kclientcmd.FlagInfo(i).BindStringFlag(flags, target)
+}
+
+func (i FlagInfo) BindBoolFlag(flags *pflag.FlagSet, target *bool) {
+	kclientcmd.FlagInfo(i).BindBoolFlag(flags, target)
 }
 
 func (i FlagInfo) BindIntFlag(flags *pflag.FlagSet, target *int) {
... ...
@@ -29,15 +30,6 @@ func (i FlagInfo) BindIntFlag(flags *pflag.FlagSet, target *int) {
 	}
 }
 
-func (i FlagInfo) BindBoolFlag(flags *pflag.FlagSet, target *bool) {
-	// assume flags with no longname are not desired
-	if len(i.LongName) > 0 {
-		// try to parse Default as a bool.  If it fails, assume false
-		boolVal, _ := strconv.ParseBool(i.Default)
-		flags.BoolVarP(target, i.LongName, i.ShortName, boolVal, i.Description)
-	}
-}
-
 func (i FlagInfo) BindListFlag(flags *pflag.FlagSet, target *kutil.StringList) {
 	// assume flags with no longname are not desired
 	if len(i.LongName) > 0 {
... ...
@@ -46,12 +38,11 @@ func (i FlagInfo) BindListFlag(flags *pflag.FlagSet, target *kutil.StringList) {
 }
 
 const (
-	FlagAllClientConfigName = "client-config"
-	FlagAllMasterConfigName = "master-config"
-	FlagAllNodeConfigName   = "node-config"
-	FlagDiagnosticsName     = "diagnostics"
-	FlagLevelName           = "diaglevel"
-	FlagFormatName          = "output"
-	FlagMasterConfigName    = "config"
-	FlagNodeConfigName      = "config"
+	FlagMasterConfigName   = "master-config"
+	FlagNodeConfigName     = "node-config"
+	FlagClusterContextName = "cluster-context"
+	FlagDiagnosticsName    = "diagnostics"
+	FlagLevelName          = "diaglevel"
+	FlagFormatName         = "output"
+	FlagIsHostName         = "host"
 )
... ...
@@ -2,7 +2,7 @@ OpenShift v3 Diagnostics
 ========================
 
 This is a tool to help administrators and users resolve common problems
-that occur with OpenShift v3 deployments. It is currently (May 2015)
+that occur with OpenShift v3 deployments. It will likely remain
 under continuous development as the OpenShift Origin project progresses.
 
 The goals of the diagnostics tool are summarized in this [Trello
... ...
@@ -22,32 +22,21 @@ added to the `openshift` binary itself so that wherever there is an
 OpenShift server or client, the diagnostics can run in the exact same
 environment.
 
-`openshift ex diagnostics` subcommands for master, node, and client
-provide flags to mimic the configurations for those respective components,
-so that running diagnostics against a component should be as simple as
-supplying the same flags that would invoke the component. So,
-for example, if a master is started with:
-
-    openshift start master --public-hostname=...
-
-Then diagnostics against that master would simply be run as:
-
-    openshift ex diagnostics master --public-hostname=...
-
-In this way it should be possible to invoke diagnostics against any
-given environment.
+Diagnostics looks for config files in standard locations. If not found,
+related diagnostics are just skipped. Non-standard locations can be
+specified with flags.
 
 Host environment
 ================
 
-However, master/node diagnostics will be most useful in a specific
-target environment, which is a deployment using Enterprise RPMs and
-ansible deployment logic. This provides two major benefits:
+Master/node diagnostics will be most useful in a specific target
+environment, which is a deployment using RPMs and ansible deployment
+logic. This provides two major benefits:
 
 * master/node configuration is based on a configuration file in a standard location
 * all components log to journald
 
-Having configuration file in standard locations means you will generally
+Having configuration files in standard locations means you will generally
 not even need to specify where to find them. Running:
 
     openshift ex diagnostics
... ...
@@ -71,14 +60,54 @@ Client environment
 ==================
 
 The user may only have access as an ordinary user, as a cluster-admin
-user, or may have admin on a host where OpenShift master or node services
-are operating. The diagnostics will attempt to use as much access as
-the user has available.
+user, and/or may be running on a host where OpenShift master or node
+services are operating. The diagnostics will attempt to use as much
+access as the user has available.
 
 A client with ordinary access should be able to diagnose its connection
-to the master and look for problems in builds and deployments.
-
-A client with cluster-admin access should be able to diagnose the same
-things for every project in the deployment, as well as infrastructure
-status.
+to the master and look for problems in builds and deployments for the
+current context.
+
+A client with cluster-admin access should be able to diagnose the
+status of infrastructure.
+
+Writing diagnostics
+===================
+
+Developers are encouraged to add to the available diagnostics as they
+encounter problems that are not easily communicated in the normal
+operations of the program, for example components with misconfigured
+connections, problems that are buried in logs, etc. The sanity you
+save may be your own.
+
+A diagnostic is an object that conforms to the Diagnostic interface
+(see pkg/diagnostics/types/diagnostic.go). The diagnostic object should
+be built in one of the builders in the pkg/cmd/experimental/diagnostics
+package (based on whether it depends on client, cluster-admin, or host
+configuration). When executed, the diagnostic logs its findings into
+a result object. It should be assumed that they may run in parallel.
+
+Diagnostics should prefer providing information over perfect accuracy,
+as they are the first line of (self-)support for users. On the other
+hand, judgment should be exercised to prevent sending users down useless
+paths or flooding them with non-issues that obscure real problems.
+
+* Errors should be reserved for things that are almost certainly broken
+  or causing problems, for example a broken URL.
+* Warnings indicate issues that may be a problem but could be valid for
+  some configurations / situations, for example a node being disabled.
+
+Enabling automation
+===================
+
+Diagnostic messages are designed to be logged either for human consumption
+("text" format) or for scripting/automation ("yaml" or "json" formats). So
+messages should:
+
+* Have an ID that is unique and unchanging, such that automated alerts
+  could filter on specific IDs rather than rely on message text or level.
+* Log any data that might be relevant in an automated alert as
+  template data; for example, when a node is down, include the name of
+  the node so that automation could decide how important it is.
+* Not put anything in message template data that cannot be serialized.
 
... ...
@@ -3,14 +3,25 @@ package client
 import (
 	"errors"
 	"fmt"
+	"regexp"
+	"strings"
 
 	kapi "github.com/GoogleCloudPlatform/kubernetes/pkg/api"
+	kclientcmd "github.com/GoogleCloudPlatform/kubernetes/pkg/client/clientcmd"
 	kclientcmdapi "github.com/GoogleCloudPlatform/kubernetes/pkg/client/clientcmd/api"
+	"github.com/GoogleCloudPlatform/kubernetes/pkg/fields"
+	"github.com/GoogleCloudPlatform/kubernetes/pkg/labels"
 
+	osclientcmd "github.com/openshift/origin/pkg/cmd/util/clientcmd"
 	"github.com/openshift/origin/pkg/diagnostics/log"
-	"github.com/openshift/origin/pkg/diagnostics/types/diagnostic"
+	"github.com/openshift/origin/pkg/diagnostics/types"
 )
 
+type ConfigContext struct {
+	RawConfig   *kclientcmdapi.Config
+	ContextName string
+}
+
 const (
 	currentContextMissing = `Your client config specifies a current context of '{{.context}}'
 which is not defined; it is likely that a mistake was introduced while
... ...
@@ -22,20 +33,145 @@ useful to use this as a base if available.`
22 22
 	currentContextSummary = `The current context from client config is '{{.context}}'
23 23
 This will be used by default to contact your OpenShift server.
24 24
 `
25
+	contextDesc = `
26
+For client config context '{{.context}}':
27
+The server URL is '{{.server}}'
28
+The user authentication is '{{.user}}'
29
+The current project is '{{.project}}'
30
+`
31
+	currContextDesc = `
32
+The current client config context is '{{.context}}':
33
+The server URL is '{{.server}}'
34
+The user authentication is '{{.user}}'
35
+The current project is '{{.project}}'
36
+`
37
+	clientNoResolve = `
38
+This usually means that the hostname does not resolve to an IP.
39
+Hostnames should usually be resolved via DNS or an /etc/hosts file.
40
+Ensure that the hostname resolves correctly from your host before proceeding.
41
+Of course, your config could also simply have the wrong hostname specified.
42
+`
43
+	clientUnknownCa = `
44
+This means that we cannot validate the certificate in use by the
45
+OpenShift API server, so we cannot securely communicate with it.
46
+Connections could be intercepted and your credentials stolen.
47
+
48
+Since the server certificate we see when connecting is not validated
49
+by public certificate authorities (CAs), you probably need to specify a
50
+certificate from a private CA to validate the connection.
51
+
52
+Your config may be specifying the wrong CA cert, or none, or there
53
+could actually be a man-in-the-middle attempting to intercept your
54
+connection.  If you are unconcerned about any of this, you can add the
55
+--insecure-skip-tls-verify flag to bypass secure (TLS) verification,
56
+but this is risky and should not be necessary.
57
+** Connections could be intercepted and your credentials stolen. **
58
+`
59
+	clientUnneededCa = `
60
+This means that for client connections to the OpenShift API server, you
61
+(or your kubeconfig) specified both a validating certificate authority
62
+and that the client should bypass connection security validation.
63
+
64
+This is not allowed because it is likely to be a mistake.
65
+
66
+If you want to use --insecure-skip-tls-verify to bypass security (which
67
+is usually a bad idea anyway), then you need to also clear the CA cert
68
+from your command line options or kubeconfig file(s). Of course, it
69
+would be far better to obtain and use a correct CA cert.
70
+`
71
+	clientInvCertName = `
72
+This means that the certificate in use by the OpenShift API server
73
+(master) does not match the hostname by which you are addressing it:
74
+  %s
75
+so a secure connection is not allowed. In theory, this *could* mean that
76
+someone is intercepting your connection and presenting a certificate
77
+that is valid but for a different server, which is why secure validation
78
+fails in this case.
79
+
80
+However, the most likely explanation is that the server certificate
81
+needs to be updated to include the name you are using to reach it.
82
+
83
+If the OpenShift server is generating its own certificates (which
84
+is default), then the --public-master flag on the OpenShift master is
85
+usually the easiest way to do this. If you need something more complicated
86
+(for instance, multiple public addresses for the API, or your own CA),
87
+then you will need to custom-generate the server certificate with the
88
+right names yourself.
89
+
90
+If you are unconcerned about any of this, you can add the
91
+--insecure-skip-tls-verify flag to bypass secure (TLS) verification,
92
+but this is risky and should not be necessary.
93
+** Connections could be intercepted and your credentials stolen. **
94
+`
95
+	clientConnRefused = `
96
+This means that when we tried to connect to the OpenShift API
97
+server (master), we reached the host, but nothing accepted the port
98
+connection. This could mean that the OpenShift master is stopped, or
99
+that a firewall or security policy is blocking access at that port.
100
+
101
+You will not be able to connect or do anything at all with OpenShift
102
+until this server problem is resolved or you specify a corrected
103
+server address.`
104
+
105
+	clientConnTimeout = `
106
+This means that when we tried to connect to the OpenShift API server
107
+(master), we could not reach the host at all.
108
+* You may have specified the wrong host address.
109
+* This could mean the host is completely unavailable (down).
110
+* This could indicate a routing problem or a firewall that simply
111
+  drops requests rather than responding by resetting the connection.
112
+* It does not generally mean that DNS name resolution failed (which
113
+  would be a different error) though the problem could be that it
114
+  gave the wrong address.`
115
+	clientMalformedHTTP = `
116
+This means that when we tried to connect to the OpenShift API server
117
+(master) with a plain HTTP connection, the server did not speak
118
+HTTP back to us. The most common explanation is that a secure server
119
+is listening but you specified an http: connection instead of https:.
120
+There could also be another service listening at the intended port
121
+speaking some other protocol entirely.
122
+
123
+You will not be able to connect or do anything at all with OpenShift
124
+until this server problem is resolved or you specify a corrected
125
+server address.`
126
+	clientMalformedTLS = `
127
+This means that when we tried to connect to the OpenShift API server
128
+(master) with a secure HTTPS connection, the server did not speak
129
+HTTPS back to us. The most common explanation is that the server
130
+listening at that port is not the secure server you expected - it
131
+may be a non-secure HTTP server or the wrong service may be
132
+listening there, or you may have specified an incorrect port.
133
+
134
+You will not be able to connect or do anything at all with OpenShift
135
+until this server problem is resolved or you specify a corrected
136
+server address.`
137
+	clientUnauthn = `
138
+This means that when we tried to make a request to the OpenShift API
139
+server, your kubeconfig did not present valid credentials to
140
+authenticate your client. Credentials generally consist of a client
141
+key/certificate or an access token. Your kubeconfig may not have
142
+presented any, or they may be invalid.`
143
+	clientUnauthz = `
144
+This means that when we tried to make a request to the OpenShift API
145
+server, the request required credentials that were not presented.
146
+This can happen when an authentication token expires. Try logging in
147
+with this user again.`
25 148
 )
26 149
 
27
-type ConfigContext struct {
28
-	KubeConfig  *kclientcmdapi.Config
29
-	ContextName string
150
+var (
151
+	invalidCertNameRx = regexp.MustCompile("x509: certificate is valid for (\\S+, )+not (\\S+)")
152
+)
30 153
 
31
-	Log *log.Logger
154
+func (d ConfigContext) Name() string {
155
+	return fmt.Sprintf("ConfigContext[%s]", d.ContextName)
32 156
 }
33 157
 
34 158
 func (d ConfigContext) Description() string {
35
-	return "Test that client config contexts have no undefined references"
159
+	return "Validate client config context is complete and has connectivity"
36 160
 }
161
+
37 162
 func (d ConfigContext) CanRun() (bool, error) {
38
-	if d.KubeConfig == nil {
163
+	if d.RawConfig == nil {
39 164
 		// TODO make prettier?
40 165
 		return false, errors.New("There is no client config file")
41 166
 	}
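
The shape every diagnostic shares after this refactor (Name and Description to identify it, CanRun to gate it, Check returning a result object instead of logging directly) can be exercised in isolation. A minimal sketch follows; the Result type here is a deliberately simplified stand-in for types.DiagnosticResult, which carries full log entries, so only the control flow is faithful:

    package main

    import "fmt"

    // Result is a simplified stand-in for types.DiagnosticResult:
    // it accumulates findings rather than logging them immediately.
    type Result struct {
        Origin string
        Errors []string
    }

    func (r *Result) Errorf(format string, a ...interface{}) {
        r.Errors = append(r.Errors, fmt.Sprintf(format, a...))
    }

    // Diagnostic mirrors the method set used throughout this commit.
    type Diagnostic interface {
        Name() string
        Description() string
        CanRun() (bool, error)
        Check() *Result
    }

    // alwaysBroken is a toy diagnostic that always reports a problem.
    type alwaysBroken struct{}

    func (alwaysBroken) Name() string          { return "AlwaysBroken" }
    func (alwaysBroken) Description() string   { return "Always finds a problem" }
    func (alwaysBroken) CanRun() (bool, error) { return true, nil }
    func (d alwaysBroken) Check() *Result {
        r := &Result{Origin: d.Name()}
        r.Errorf("something is wrong")
        return r
    }

    func main() {
        errorsSeen := 0
        for _, d := range []Diagnostic{alwaysBroken{}} {
            if ok, err := d.CanRun(); !ok {
                fmt.Printf("skipping %s: %v\n", d.Name(), err)
                continue
            }
            r := d.Check() // touches no shared state; log results afterward
            errorsSeen += len(r.Errors)
            for _, e := range r.Errors {
                fmt.Printf("ERROR [%s]: %s\n", r.Origin, e)
            }
        }
        fmt.Printf("Errors seen: %d\n", errorsSeen)
    }

Because Check only returns data and touches no shared state, results from several diagnostics could in principle be computed concurrently and logged in order afterward.
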
... ...
@@ -46,13 +182,13 @@ func (d ConfigContext) CanRun() (bool, error) {
46 46
 
47 47
 	return true, nil
48 48
 }
49
-func (d ConfigContext) Check() (bool, []log.Message, []error, []error) {
50
-	if _, err := d.CanRun(); err != nil {
51
-		return false, nil, nil, []error{err}
52
-	}
53 49
 
54
-	isDefaultContext := d.KubeConfig.CurrentContext == d.ContextName
50
+func (d ConfigContext) Check() *types.DiagnosticResult {
51
+	r := types.NewDiagnosticResult("ConfigContext")
55 52
 
53
+	isDefaultContext := d.RawConfig.CurrentContext == d.ContextName
54
+
55
+	// prepare bad news message
56 56
 	errorKey := "clientCfgError"
57 57
 	unusableLine := fmt.Sprintf("The client config context '%s' is unusable", d.ContextName)
58 58
 	if isDefaultContext {
... ...
@@ -60,40 +196,92 @@ func (d ConfigContext) Check() (bool, []log.Message, []error, []error) {
60 60
 		unusableLine = fmt.Sprintf("The current client config context '%s' is unusable", d.ContextName)
61 61
 	}
62 62
 
63
-	context, exists := d.KubeConfig.Contexts[d.ContextName]
63
+	// check that the context and its constituents are defined in the kubeconfig
64
+	context, exists := d.RawConfig.Contexts[d.ContextName]
64 65
 	if !exists {
65
-		err := diagnostic.NewDiagnosticError(errorKey, "", fmt.Errorf(unusableLine+":\n Client config context '%s' is not defined.", d.ContextName))
66
-		d.Log.Error(err.ID, err.Cause.Error())
67
-		return false, nil, nil, []error{err}
66
+		r.Errorf(errorKey, nil, "%s:\n Client config context '%s' is not defined.", unusableLine, d.ContextName)
67
+		return r
68 68
 	}
69
-
70 69
 	clusterName := context.Cluster
71
-	cluster, exists := d.KubeConfig.Clusters[clusterName]
70
+	cluster, exists := d.RawConfig.Clusters[clusterName]
72 71
 	if !exists {
73
-
74
-		err := diagnostic.NewDiagnosticError(errorKey, "", fmt.Errorf(unusableLine+":\n Client config context '%s' has a cluster '%s' which is not defined.", d.ContextName, clusterName))
75
-		d.Log.Error(err.ID, err.Cause.Error())
76
-		return false, nil, nil, []error{err}
72
+		r.Errorf(errorKey, nil, "%s:\n Client config context '%s' has a cluster '%s' which is not defined.", unusableLine, d.ContextName, clusterName)
73
+		return r
77 74
 	}
78 75
 	authName := context.AuthInfo
79
-	if _, exists := d.KubeConfig.AuthInfos[authName]; !exists {
80
-
81
-		err := diagnostic.NewDiagnosticError(errorKey, "", fmt.Errorf(unusableLine+":\n Client config context '%s' has a user identity '%s' which is not defined.", d.ContextName, authName))
82
-		d.Log.Error(err.ID, err.Cause.Error())
83
-		return false, nil, nil, []error{err}
76
+	if _, exists := d.RawConfig.AuthInfos[authName]; !exists {
77
+		r.Errorf(errorKey, nil, "%s:\n Client config context '%s' has a user identity '%s' which is not defined.", unusableLine, d.ContextName, authName)
78
+		return r
84 79
 	}
85 80
 
81
+	// we found a fully-defined context
86 82
 	project := context.Namespace
87 83
 	if project == "" {
88 84
 		project = kapi.NamespaceDefault // OpenShift/k8s fills this in if missing
85
+	}
86
+	msgData := log.Hash{"context": d.ContextName, "server": cluster.Server, "user": authName, "project": project}
87
+	msgText := contextDesc
88
+	if isDefaultContext {
89
+		msgText = currContextDesc
90
+	}
89 91
 
92
+	// Actually send a request to see if context has connectivity.
93
+	// Note: we cannot reuse factories as they cache the clients, so build new factory for each context.
94
+	osClient, _, err := osclientcmd.NewFactory(kclientcmd.NewDefaultClientConfig(*d.RawConfig, &kclientcmd.ConfigOverrides{Context: *context})).Clients()
95
+	// client creation now fails if it cannot connect to the server, so address connectivity errors below
96
+	if err == nil {
97
+		if projects, projerr := osClient.Projects().List(labels.Everything(), fields.Everything()); projerr != nil {
98
+			err = projerr
99
+		} else { // success!
100
+			list := []string{}
101
+			for i, project := range projects.Items {
102
+				if i > 9 {
103
+					list = append(list, "...")
104
+					break
105
+				}
106
+				list = append(list, project.Name)
107
+			}
108
+			msgData["projects"] = list
109
+			if len(list) == 0 {
110
+				r.Infot("CCctxSuccess", msgText+"Successfully requested project list, but it is empty, so user has no access to anything.", msgData)
111
+			} else {
112
+				r.Infot("CCctxSuccess", msgText+"Successfully requested project list; has access to project(s):\n  {{.projects}}", msgData)
113
+			}
114
+			return r
115
+		}
90 116
 	}
91 117
 
92
-	// TODO: actually send a request to see if can connect
93
-	message := log.Message{EvaluatedText: fmt.Sprintf("For client config context '%s':\n The server URL is '%s'\nThe user authentication is '%s'\nThe current project is '%s'", d.ContextName, cluster.Server, authName, project)}
94
-	if isDefaultContext {
95
-		message = log.Message{EvaluatedText: fmt.Sprintf("The current client config context is '%s':\n The server URL is '%s'\nThe user authentication is '%s'\nThe current project is '%s'", d.ContextName, cluster.Server, authName, project)}
118
+	// something went wrong; couldn't create client or get project list.
119
+	// interpret the terse error messages with helpful info.
120
+	errMsg := err.Error()
121
+	msgData["errMsg"] = fmt.Sprintf("(%T) %[1]v", err)
122
+	var reason, errId string
123
+	switch {
124
+	case regexp.MustCompile("dial tcp: lookup (\\S+): no such host").MatchString(errMsg):
125
+		errId, reason = "clientNoResolve", clientNoResolve
126
+	case strings.Contains(errMsg, "x509: certificate signed by unknown authority"):
127
+		errId, reason = "clientUnknownCa", clientUnknownCa
128
+	case strings.Contains(errMsg, "specifying a root certificates file with the insecure flag is not allowed"):
129
+		errId, reason = "clientUnneededCa", clientUnneededCa
130
+	case invalidCertNameRx.MatchString(errMsg):
131
+		match := invalidCertNameRx.FindStringSubmatch(errMsg)
132
+		serverHost := match[len(match)-1]
133
+		errId, reason = "clientInvCertName", fmt.Sprintf(clientInvCertName, serverHost)
134
+	case regexp.MustCompile("dial tcp (\\S+): connection refused").MatchString(errMsg):
135
+		errId, reason = "clientConnRefused", clientConnRefused
136
+	case regexp.MustCompile("dial tcp (\\S+): (?:connection timed out|i/o timeout|no route to host)").MatchString(errMsg):
137
+		errId, reason = "clientConnTimeout", clientConnTimeout
138
+	case strings.Contains(errMsg, "malformed HTTP response"):
139
+		errId, reason = "clientMalformedHTTP", clientMalformedHTTP
140
+	case strings.Contains(errMsg, "tls: oversized record received with length"):
141
+		errId, reason = "clientMalformedTLS", clientMalformedTLS
142
+	case strings.Contains(errMsg, `403 Forbidden: Forbidden: "/osapi/v1beta1/projects?namespace=" denied by default`):
143
+		errId, reason = "clientUnauthn", clientUnauthn
144
+	case regexp.MustCompile("401 Unauthorized: Unauthorized$").MatchString(errMsg):
145
+		errId, reason = "clientUnauthz", clientUnauthz
146
+	default:
147
+		errId, reason = "clientUnknownConnErr", `Diagnostics does not have an explanation for what this means. Please report this error so one can be added.`
96 148
 	}
97
-	d.Log.LogMessage(log.InfoLevel, message)
98
-	return true, []log.Message{message}, nil, nil
149
+	r.Errort(errId, err, msgText+"{{.errMsg}}\n"+reason, msgData)
150
+	return r
99 151
 }
100 152
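
The long switch above is essentially a first-match table from raw error text to a stable ID plus a human explanation. Here is a standalone sketch of the same technique using only the standard library; the patterns are a subset of those in the diff, and the hostname in main is hypothetical:

    package main

    import (
        "errors"
        "fmt"
        "regexp"
        "strings"
    )

    // matcher pairs a recognizer with an error ID and an explanation.
    type matcher struct {
        match   func(string) bool
        id      string
        explain string
    }

    // Compiling the regexps once up front avoids the cost of the
    // MustCompile-per-call pattern used by some cases in the diff.
    var matchers = []matcher{
        {regexp.MustCompile(`dial tcp: lookup (\S+): no such host`).MatchString,
            "clientNoResolve", "the hostname does not resolve to an IP"},
        {func(s string) bool {
            return strings.Contains(s, "x509: certificate signed by unknown authority")
        }, "clientUnknownCa", "the server certificate could not be validated"},
        {regexp.MustCompile(`dial tcp (\S+): connection refused`).MatchString,
            "clientConnRefused", "the host was reached but nothing accepted the port"},
    }

    // classify returns the first matching ID and explanation, with a default.
    func classify(err error) (string, string) {
        msg := err.Error()
        for _, m := range matchers {
            if m.match(msg) {
                return m.id, m.explain
            }
        }
        return "clientUnknownConnErr", "no explanation known for this error"
    }

    func main() {
        id, why := classify(errors.New("dial tcp: lookup master.example.com: no such host"))
        fmt.Printf("%s: %s\n", id, why) // clientNoResolve: the hostname does not resolve to an IP
    }
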
new file mode 100644
... ...
@@ -0,0 +1,151 @@
0
+package client
1
+
2
+import (
3
+	"fmt"
4
+	"io/ioutil"
5
+	"os"
6
+
7
+	"github.com/GoogleCloudPlatform/kubernetes/pkg/client/clientcmd"
8
+	flag "github.com/spf13/pflag"
9
+
10
+	"github.com/openshift/origin/pkg/cmd/cli/config"
11
+	"github.com/openshift/origin/pkg/diagnostics/log"
12
+	"github.com/openshift/origin/pkg/diagnostics/types"
13
+)
14
+
15
+// This diagnostic is a little special in that it is run separately as a precondition
16
+// in order to determine whether we can run other dependent diagnostics
17
+
18
+type ConfigLoading struct {
19
+	ConfFlagName   string
20
+	ClientFlags    *flag.FlagSet
21
+	successfulLoad bool // set if at least one file loaded
22
+}
23
+
24
+func (d *ConfigLoading) Name() string {
25
+	return "ConfigLoading"
26
+}
27
+
28
+func (d *ConfigLoading) Description() string {
29
+	return "Try to load client config file(s) and report what happens"
30
+}
31
+
32
+func (d *ConfigLoading) CanRun() (bool, error) {
33
+	return true, nil
34
+}
35
+
36
+func (d *ConfigLoading) SuccessfulLoad() bool {
37
+	return d.successfulLoad
38
+}
39
+
40
+func (d *ConfigLoading) Check() *types.DiagnosticResult {
41
+	r := types.NewDiagnosticResult("ConfigLoading")
42
+	confFlagValue := d.ClientFlags.Lookup(d.ConfFlagName).Value.String()
43
+
44
+	var foundPath string
45
+	rules := config.NewOpenShiftClientConfigLoadingRules()
46
+	paths := append([]string{confFlagValue}, rules.Precedence...)
47
+	for index, path := range paths {
48
+		errmsg := ""
49
+		switch index {
50
+		case 0:
51
+			errmsg = fmt.Sprintf("--%s specified that client config should be at %s\n", d.ConfFlagName, path)
52
+		case len(paths) - 1: // config in ~/.kube
53
+		// no error message if it is not there; the user didn't say it would be
54
+		default: // can be multiple paths from the env var in theory; all cases should go here
55
+			if len(os.Getenv(config.OpenShiftConfigPathEnvVar)) != 0 {
56
+				errmsg = fmt.Sprintf("Env var %s specified that client config could be at %s\n", config.OpenShiftConfigPathEnvVar, path)
57
+			}
58
+		}
59
+
60
+		if d.canOpenConfigFile(path, errmsg, r) && foundPath == "" {
61
+			d.successfulLoad = true
62
+			foundPath = path
63
+		}
64
+	}
65
+	if foundPath != "" {
66
+		if confFlagValue != "" && confFlagValue != foundPath {
67
+			// found config but not where --config said
68
+			r.Errorf("discCCnotFlag", nil, `
69
+The client configuration file was not found where the --%s flag indicated:
70
+  %s
71
+A config file was found at the following location:
72
+  %s
73
+If you wish to use this file for client configuration, you can specify it
74
+with the --%[1]s flag, or just not specify the flag.
75
+			`, d.ConfFlagName, confFlagValue, foundPath)
76
+		}
77
+	} else { // not found, check for master-generated ones to recommend
78
+		if confFlagValue != "" {
79
+			r.Errorf("discCCnotFlag", nil, "Did not find config file where --%s=%s indicated", d.ConfFlagName, confFlagValue)
80
+		}
81
+		adminWarningF := `
82
+No client config file was available; however, one exists at
83
+    %[2]s
84
+which may have been generated automatically by the master.
85
+If you want to use this config, you should copy it to the
86
+standard location (%[3]s),
87
+or you can set the environment variable %[1]s:
88
+    export %[1]s=%[2]s
89
+If not, obtain a config file and place it in the standard
90
+location for use by the client and diagnostics.
91
+`
92
+		adminPaths := []string{
93
+			"/etc/openshift/master/admin.kubeconfig",           // enterprise
94
+			"/openshift.local.config/master/admin.kubeconfig",  // origin systemd
95
+			"./openshift.local.config/master/admin.kubeconfig", // origin binary
96
+		}
97
+		// look for it in auto-generated locations when not found properly
98
+		for _, path := range adminPaths {
99
+			msg := fmt.Sprintf("Looking for a possible client config at %s\n", path)
100
+			if d.canOpenConfigFile(path, msg, r) {
101
+				r.Warnf("discCCautoPath", nil, adminWarningF, config.OpenShiftConfigPathEnvVar, path, config.RecommendedHomeFile)
102
+				break
103
+			}
104
+		}
105
+	}
106
+	return r
107
+}
108
+
109
+// ----------------------------------------------------------
110
+// Attempt to open file at path as client config
111
+// If there is a problem and errmsg is set, log an error
112
+func (d ConfigLoading) canOpenConfigFile(path string, errmsg string, r *types.DiagnosticResult) bool {
113
+	var file *os.File
114
+	var err error
115
+	if path == "" { // empty param/envvar
116
+		return false
117
+	} else if file, err = os.Open(path); err == nil {
118
+		r.Debugt("discOpenCC", "Reading client config at {{.path}}", log.Hash{"path": path})
119
+	} else if errmsg == "" {
120
+		r.Debugf("discOpenCCNo", "Could not read client config at %s:\n%#v", path, err)
121
+	} else if os.IsNotExist(err) {
122
+		r.Debug("discOpenCCNoExist", errmsg+"but that file does not exist.")
123
+	} else if os.IsPermission(err) {
124
+		r.Error("discOpenCCNoPerm", err, errmsg+"but lack permission to read that file.")
125
+	} else {
126
+		r.Errorf("discOpenCCErr", err, "%sbut there was an error opening it:\n%#v", errmsg, err)
127
+	}
128
+	if file != nil { // it is open for reading
129
+		defer file.Close()
130
+		if buffer, err := ioutil.ReadAll(file); err != nil {
131
+			r.Errorf("discCCReadErr", err, "Unexpected error while reading client config file (%s): %v", path, err)
132
+		} else if _, err := clientcmd.Load(buffer); err != nil {
133
+			r.Errorf("discCCYamlErr", err, `
134
+Error reading YAML from client config file (%s):
135
+  %v
136
+This file may have been truncated or mis-edited.
137
+Please fix, remove, or obtain a new client config`, file.Name(), err)
138
+		} else {
139
+			r.Infof("discCCRead", "Successfully read a client config file at '%s'", path)
140
+			/* Note, we're not going to use this config file directly.
141
+			 * Instead, we'll defer to the openshift client code to assimilate
142
+			 * flags, env vars, and the potential hierarchy of config files
143
+			 * into an actual configuration that the client uses.
144
+			 * However, for diagnostic purposes, record the files we find.
145
+			 */
146
+			return true
147
+		}
148
+	}
149
+	return false
150
+}
0 151
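
The loop above implements a "first readable file wins" walk over an ordered candidate list: the value of the config flag, then any env-var paths, then the home-directory default. A minimal standalone sketch of that precedence follows; the candidate paths are illustrative, not the actual OpenShift loading rules:

    package main

    import (
        "fmt"
        "os"
        "path/filepath"
        "strings"
    )

    // firstReadable returns the first candidate path that can actually be
    // opened, preserving the precedence order of the list.
    func firstReadable(candidates []string) (string, bool) {
        for _, path := range candidates {
            if path == "" {
                continue // unset flag or env var
            }
            f, err := os.Open(path)
            if err != nil {
                continue // missing or unreadable; try the next candidate
            }
            f.Close()
            return path, true
        }
        return "", false
    }

    func main() {
        home, _ := os.UserHomeDir()
        // Illustrative precedence: a --config style flag value, then a
        // KUBECONFIG-style env var (possibly several paths), then a
        // home-directory default.
        candidates := []string{""} // flag value, empty when not given
        candidates = append(candidates,
            strings.Split(os.Getenv("KUBECONFIG"), string(filepath.ListSeparator))...)
        candidates = append(candidates, filepath.Join(home, ".kube", "config"))

        if path, ok := firstReadable(candidates); ok {
            fmt.Println("using client config at", path)
        } else {
            fmt.Println("no client config found")
        }
    }
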
deleted file mode 100644
... ...
@@ -1,100 +0,0 @@
1
-package client
2
-
3
-import (
4
-	"errors"
5
-	"fmt"
6
-
7
-	kapi "github.com/GoogleCloudPlatform/kubernetes/pkg/api"
8
-	kclient "github.com/GoogleCloudPlatform/kubernetes/pkg/client"
9
-
10
-	"github.com/GoogleCloudPlatform/kubernetes/pkg/fields"
11
-	"github.com/GoogleCloudPlatform/kubernetes/pkg/labels"
12
-	"github.com/openshift/origin/pkg/diagnostics/log"
13
-	"github.com/openshift/origin/pkg/diagnostics/types/diagnostic"
14
-)
15
-
16
-const (
17
-	clientErrorGettingNodes = `Client error while retrieving node records. Client retrieved records
18
-during discovery, so this is likely to be a transient error. Try running
19
-diagnostics again. If this message persists, there may be a permissions
20
-problem with getting node records. The error was:
21
-
22
-(%T) %[1]v`
23
-
24
-	nodeNotReady = `Node {{.node}} is defined but is not marked as ready.
25
-Ready status is {{.status}} because "{{.reason}}"
26
-If the node is not intentionally disabled, check that the master can
27
-reach the node hostname for a health check and the node is checking in
28
-to the master with the same hostname.
29
-
30
-While in this state, pods should not be scheduled to deploy on the node,
31
-and any existing scheduled pods will be considered failed and removed.
32
-`
33
-)
34
-
35
-// NodeDefinitions
36
-type NodeDefinition struct {
37
-	KubeClient *kclient.Client
38
-
39
-	Log *log.Logger
40
-}
41
-
42
-func (d NodeDefinition) Description() string {
43
-	return "Check node records on master"
44
-}
45
-func (d NodeDefinition) CanRun() (bool, error) {
46
-	if d.KubeClient == nil {
47
-		// TODO make prettier?
48
-		return false, errors.New("must have kube client")
49
-	}
50
-	if _, err := d.KubeClient.Nodes().List(labels.LabelSelector{}, fields.Everything()); err != nil {
51
-		// TODO check for 403 to return: "Client does not have cluster-admin access and cannot see node records"
52
-
53
-		return false, diagnostic.NewDiagnosticError("clGetNodesFailed", fmt.Sprintf(clientErrorGettingNodes, err), err)
54
-	}
55
-
56
-	return true, nil
57
-}
58
-func (d NodeDefinition) Check() (bool, []log.Message, []error, []error) {
59
-	if _, err := d.CanRun(); err != nil {
60
-		return false, nil, nil, []error{err}
61
-	}
62
-
63
-	nodes, err := d.KubeClient.Nodes().List(labels.LabelSelector{}, fields.Everything())
64
-	if err != nil {
65
-		return false, nil, nil, []error{
66
-			diagnostic.NewDiagnosticError("clGetNodesFailed", fmt.Sprintf(clientErrorGettingNodes, err), err),
67
-		}
68
-	}
69
-
70
-	for _, node := range nodes.Items {
71
-		var ready *kapi.NodeCondition
72
-		for i, condition := range node.Status.Conditions {
73
-			switch condition.Type {
74
-			// currently only one... used to be more, may be again
75
-			case kapi.NodeReady:
76
-				ready = &node.Status.Conditions[i]
77
-				// TODO comment needed to explain why we do last one wins.  should this break instead?
78
-			}
79
-		}
80
-
81
-		if ready == nil || ready.Status != kapi.ConditionTrue {
82
-			// instead of building this, simply use the node object directly
83
-			templateData := map[string]interface{}{}
84
-			templateData["node"] = node.Name
85
-			if ready == nil {
86
-				templateData["status"] = "None"
87
-				templateData["reason"] = "There is no readiness record."
88
-			} else {
89
-				templateData["status"] = ready.Status
90
-				templateData["reason"] = ready.Reason
91
-			}
92
-
93
-			return false, nil, []error{
94
-				diagnostic.NewDiagnosticErrorFromTemplate("clNodeBroken", nodeNotReady, templateData),
95
-			}, nil
96
-		}
97
-	}
98
-
99
-	return true, nil, nil, nil
100
-}
101 1
new file mode 100644
... ...
@@ -0,0 +1,116 @@
0
+package cluster
1
+
2
+// The purpose of this diagnostic is to detect nodes that are out of commission
3
+// (which may affect the ability to schedule pods) for user awareness.
4
+
5
+import (
6
+	"errors"
7
+	"fmt"
8
+
9
+	kapi "github.com/GoogleCloudPlatform/kubernetes/pkg/api"
10
+	kclient "github.com/GoogleCloudPlatform/kubernetes/pkg/client"
11
+
12
+	"github.com/GoogleCloudPlatform/kubernetes/pkg/fields"
13
+	"github.com/GoogleCloudPlatform/kubernetes/pkg/labels"
14
+	"github.com/openshift/origin/pkg/diagnostics/log"
15
+	"github.com/openshift/origin/pkg/diagnostics/types"
16
+)
17
+
18
+const (
19
+	clientErrorGettingNodes = `Client error while retrieving node records. Client retrieved records
20
+during discovery, so this is likely to be a transient error. Try running
21
+diagnostics again. If this message persists, there may be a permissions
22
+problem with getting node records. The error was:
23
+
24
+(%T) %[1]v`
25
+
26
+	nodeNotReady = `Node {{.node}} is defined but is not marked as ready.
27
+Ready status is {{.status}} because "{{.reason}}"
28
+If the node is not intentionally disabled, check that the master can
29
+reach the node hostname for a health check and the node is checking in
30
+to the master with the same hostname.
31
+
32
+While in this state, pods should not be scheduled to deploy on the node,
33
+and any existing scheduled pods will be considered failed and removed.
34
+`
35
+
36
+	nodeNotSched = `Node {{.node}} is ready but is marked Unschedulable.
37
+This is usually set manually for administrative reasons.
38
+An administrator can mark the node schedulable with:
39
+    oadm manage-node {{.node}} --schedulable=true
40
+
41
+While in this state, pods should not be scheduled to deploy on the node.
42
+Existing pods will continue to run until completed or evacuated (see
43
+other options for 'oadm manage-node').
44
+`
45
+)
46
+
47
+// NodeDefinitions
48
+type NodeDefinitions struct {
49
+	KubeClient *kclient.Client
50
+}
51
+
52
+func (d NodeDefinitions) Name() string {
53
+	return "NodeDefinitions"
54
+}
55
+
56
+func (d NodeDefinitions) Description() string {
57
+	return "Check node records on master"
58
+}
59
+
60
+func (d NodeDefinitions) CanRun() (bool, error) {
61
+	if d.KubeClient == nil {
62
+		return false, errors.New("must have kube client")
63
+	}
64
+	if _, err := d.KubeClient.Nodes().List(labels.LabelSelector{}, fields.Everything()); err != nil {
65
+		// TODO check for 403 to return: "Client does not have cluster-admin access and cannot see node records"
66
+
67
+		msg := log.Message{ID: "clGetNodesFailed", EvaluatedText: fmt.Sprintf(clientErrorGettingNodes, err)}
68
+		return false, types.DiagnosticError{msg.ID, &msg, err}
69
+	}
70
+
71
+	return true, nil
72
+}
73
+
74
+func (d NodeDefinitions) Check() *types.DiagnosticResult {
75
+	r := types.NewDiagnosticResult("NodeDefinitions")
76
+
77
+	nodes, err := d.KubeClient.Nodes().List(labels.LabelSelector{}, fields.Everything())
78
+	if err != nil {
79
+		r.Errorf("clGetNodesFailed", err, clientErrorGettingNodes, err)
80
+		return r
81
+	}
82
+
83
+	anyNodesAvail := false
84
+	for _, node := range nodes.Items {
85
+		var ready *kapi.NodeCondition
86
+		for i, condition := range node.Status.Conditions {
87
+			switch condition.Type {
88
+			// Each condition appears only once. Currently there's only one... used to be more
89
+			case kapi.NodeReady:
90
+				ready = &node.Status.Conditions[i]
91
+			}
92
+		}
93
+
94
+		if ready == nil || ready.Status != kapi.ConditionTrue {
95
+			templateData := log.Hash{"node": node.Name}
96
+			if ready == nil {
97
+				templateData["status"] = "None"
98
+				templateData["reason"] = "There is no readiness record."
99
+			} else {
100
+				templateData["status"] = ready.Status
101
+				templateData["reason"] = ready.Reason
102
+			}
103
+			r.Warnt("clNodeNotReady", nil, nodeNotReady, templateData)
104
+		} else if node.Spec.Unschedulable {
105
+			r.Warnt("clNodeNotSched", nil, nodeNotSched, log.Hash{"node": node.Name})
106
+		} else {
107
+			anyNodesAvail = true
108
+		}
109
+	}
110
+	if !anyNodesAvail {
111
+		r.Error("clNoAvailNodes", nil, "There were no nodes available for OpenShift to use.")
112
+	}
113
+
114
+	return r
115
+}
0 116
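
The readiness logic above reduces to: find the Ready condition, warn when it is absent or not True, warn when the node is marked unschedulable, and error when no usable node remains. A self-contained sketch with stand-in types (the real kapi.Node carries far more fields):

    package main

    import "fmt"

    // Stand-ins for the relevant slices of the node API.
    type condition struct {
        Type   string
        Status string
        Reason string
    }

    type node struct {
        Name          string
        Unschedulable bool
        Conditions    []condition
    }

    // checkNodes reports per-node problems and whether any node is usable.
    func checkNodes(nodes []node) (available bool) {
        for _, n := range nodes {
            var ready *condition
            for i := range n.Conditions {
                if n.Conditions[i].Type == "Ready" {
                    ready = &n.Conditions[i]
                }
            }
            switch {
            case ready == nil:
                fmt.Printf("WARN: node %s has no readiness record\n", n.Name)
            case ready.Status != "True":
                fmt.Printf("WARN: node %s not ready: %s\n", n.Name, ready.Reason)
            case n.Unschedulable:
                fmt.Printf("WARN: node %s is ready but marked unschedulable\n", n.Name)
            default:
                available = true
            }
        }
        return available
    }

    func main() {
        nodes := []node{
            {Name: "node1", Conditions: []condition{{Type: "Ready", Status: "True"}}},
            {Name: "node2", Unschedulable: true, Conditions: []condition{{Type: "Ready", Status: "True"}}},
        }
        if !checkNodes(nodes) {
            fmt.Println("ERROR: no nodes available")
        }
    }
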
deleted file mode 100644
... ...
@@ -1,104 +0,0 @@
1
-package discovery // client
2
-
3
-import (
4
-	"fmt"
5
-	"github.com/openshift/origin/pkg/diagnostics/log"
6
-	"github.com/openshift/origin/pkg/diagnostics/types"
7
-	"os"
8
-	"os/exec"
9
-	"path/filepath"
10
-	"runtime"
11
-	"strings"
12
-)
13
-
14
-// ----------------------------------------------------------
15
-// Look for 'osc' and 'openshift' executables
16
-func (env *Environment) DiscoverClient() error {
17
-	var err error
18
-	f := env.Options.ClientDiagOptions.Factory
19
-	if config, err := f.OpenShiftClientConfig.RawConfig(); err != nil {
20
-		env.Log.Errorf("discCCstart", "Could not read client config: (%T) %[1]v", err)
21
-	} else {
22
-		env.OsConfig = &config
23
-		env.FactoryForContext[config.CurrentContext] = f
24
-	}
25
-	env.Log.Debug("discSearchExec", "Searching for executables in path:\n  "+strings.Join(filepath.SplitList(os.Getenv("PATH")), "\n  ")) //TODO for non-Linux OS
26
-	env.OscPath = env.findExecAndLog("osc")
27
-	if env.OscPath != "" {
28
-		env.OscVersion, err = getExecVersion(env.OscPath, env.Log)
29
-	}
30
-	env.OpenshiftPath = env.findExecAndLog("openshift")
31
-	if env.OpenshiftPath != "" {
32
-		env.OpenshiftVersion, err = getExecVersion(env.OpenshiftPath, env.Log)
33
-	}
34
-	if env.OpenshiftVersion.NonZero() && env.OscVersion.NonZero() && !env.OpenshiftVersion.Eq(env.OscVersion) {
35
-		env.Log.Warnm("discVersionMM", log.Msg{"osV": env.OpenshiftVersion.GoString(), "oscV": env.OscVersion.GoString(),
36
-			"text": fmt.Sprintf("'openshift' version %#v does not match 'osc' version %#v; update or remove the lower version", env.OpenshiftVersion, env.OscVersion)})
37
-	}
38
-	return err
39
-}
40
-
41
-// ----------------------------------------------------------
42
-// Look for a specific executable and log what happens
43
-func (env *Environment) findExecAndLog(cmd string) string {
44
-	if path := findExecFor(cmd); path != "" {
45
-		env.Log.Infom("discExecFound", log.Msg{"command": cmd, "path": path, "tmpl": "Found '{{.command}}' at {{.path}}"})
46
-		return path
47
-	} else {
48
-		env.Log.Warnm("discExecNoPath", log.Msg{"command": cmd, "tmpl": "No '{{.command}}' executable was found in your path"})
49
-	}
50
-	return ""
51
-}
52
-
53
-// ----------------------------------------------------------
54
-// Look in the path for an executable
55
-func findExecFor(cmd string) string {
56
-	path, err := exec.LookPath(cmd)
57
-	if err == nil {
58
-		return path
59
-	}
60
-	if runtime.GOOS == "windows" {
61
-		path, err = exec.LookPath(cmd + ".exe")
62
-		if err == nil {
63
-			return path
64
-		}
65
-	}
66
-	return ""
67
-}
68
-
69
-// ----------------------------------------------------------
70
-// Invoke executable's "version" command to determine version
71
-func getExecVersion(path string, logger *log.Logger) (version types.Version, err error) {
72
-	cmd := exec.Command(path, "version")
73
-	var out []byte
74
-	out, err = cmd.CombinedOutput()
75
-	if err == nil {
76
-		var name string
77
-		var x, y, z int
78
-		if scanned, err := fmt.Sscanf(string(out), "%s v%d.%d.%d", &name, &x, &y, &z); scanned > 1 {
79
-			version = types.Version{x, y, z}
80
-			logger.Infom("discVersion", log.Msg{"tmpl": "version of {{.command}} is {{.version}}", "command": name, "version": version.GoString()})
81
-		} else {
82
-			logger.Errorf("discVersErr", `
83
-Expected version output from '%s version'
84
-Could not parse output received:
85
-%v
86
-Error was: %#v`, path, string(out), err)
87
-		}
88
-	} else {
89
-		switch err.(type) {
90
-		case *exec.Error:
91
-			logger.Errorf("discVersErr", "error in executing '%v version': %v", path, err)
92
-		case *exec.ExitError:
93
-			logger.Errorf("discVersErr", `
94
-Executed '%v version' which exited with an error code.
95
-This version is likely old or broken.
96
-Error was '%v';
97
-Output was:
98
-%v`, path, err.Error(), log.LimitLines(string(out), 5))
99
-		default:
100
-			logger.Errorf("discVersErr", "executed '%v version' but an error occurred:\n%v\nOutput was:\n%v", path, err, string(out))
101
-		}
102
-	}
103
-	return version, err
104
-}
105 1
deleted file mode 100644
... ...
@@ -1,378 +0,0 @@
1
-package discovery // config
2
-
3
-import (
4
-	"fmt"
5
-	kapi "github.com/GoogleCloudPlatform/kubernetes/pkg/api"
6
-	"github.com/GoogleCloudPlatform/kubernetes/pkg/client/clientcmd"
7
-	clientcmdapi "github.com/GoogleCloudPlatform/kubernetes/pkg/client/clientcmd/api"
8
-	"github.com/GoogleCloudPlatform/kubernetes/pkg/fields"
9
-	"github.com/GoogleCloudPlatform/kubernetes/pkg/labels"
10
-	"github.com/openshift/origin/pkg/cmd/cli/config"
11
-	"github.com/openshift/origin/pkg/cmd/experimental/diagnostics/options"
12
-	osclientcmd "github.com/openshift/origin/pkg/cmd/util/clientcmd"
13
-	"github.com/openshift/origin/pkg/diagnostics/log"
14
-	"io/ioutil"
15
-	"os"
16
-	"regexp"
17
-	"strings"
18
-)
19
-
20
-/* ----------------------------------------------------------
21
-Look for the client config and try to read it.
22
-
23
-We will look in the standard locations, alert the user to what we find
24
-as we go along, and try to be helpful.
25
-*/
26
-
27
-// -------------------------------------------------------------
28
-// Look for client config file in a number of possible locations
29
-func (env *Environment) ReadClientConfigFiles() {
30
-	confFlagName := options.FlagAllClientConfigName
31
-	confFlag := env.Options.ClientConfigPath // from openshift-diagnostics --client-config
32
-	if flags := env.Options.GlobalFlags; flags != nil {
33
-		name := config.OpenShiftConfigFlagName
34
-		if flag := env.Options.GlobalFlags.Lookup(name); flag != nil {
35
-			confFlag = flag.Value.String() // from openshift-diagnostics client --config
36
-			confFlagName = name
37
-		}
38
-	}
39
-	var found bool
40
-	rules := config.NewOpenShiftClientConfigLoadingRules()
41
-	paths := append([]string{confFlag}, rules.Precedence...)
42
-	for index, path := range paths {
43
-		errmsg := ""
44
-		switch index {
45
-		case 0:
46
-			errmsg = fmt.Sprintf("--"+confFlagName+" specified that client config should be at %s\n", path)
47
-		case len(paths) - 1:
48
-			// do nothing, the config wasn't found in ~
49
-		default:
50
-			if len(os.Getenv(config.OpenShiftConfigPathEnvVar)) != 0 {
51
-				errmsg = fmt.Sprintf("$OPENSHIFTCONFIG specified that client config should be at %s\n", path)
52
-			}
53
-		}
54
-
55
-		if rawConfig := openConfigFile(path, errmsg, env.Log); rawConfig != nil && !found {
56
-			found = true
57
-			env.ClientConfigPath = path
58
-			env.ClientConfigRaw = rawConfig
59
-		}
60
-	}
61
-	if found {
62
-		if confFlag != "" && confFlag != env.ClientConfigPath {
63
-			// found config but not where --config said, so don't continue discovery
64
-			env.Log.Errorf("discCCnotFlag", `
65
-The client configuration file was not found where the --%s flag indicated:
66
-  %s
67
-A config file was found at the following location:
68
-  %s
69
-If you wish to use this file for client configuration, you can specify it
70
-with the --%[1]s flag, or just not specify the flag.
71
-			`, confFlagName, confFlag, env.ClientConfigPath)
72
-		} else {
73
-			// happy path, client config found as expected
74
-			env.WillCheck[ClientTarget] = true
75
-		}
76
-	} else { // not found, decide what to do
77
-		if confFlag != "" { // user expected conf file at specific place
78
-			env.Log.Errorf("discNoCC", "The client configuration file was not found where --%s='%s' indicated.", confFlagName, confFlag)
79
-		} else if !env.Options.ClientDiagOptions.MustCheck {
80
-			env.Log.Notice("discSkipCLI", "No client config file found; client diagnostics will not be performed.")
81
-		} else {
82
-			// user specifically wants to troubleshoot client, but no conf file given
83
-			env.Log.Warn("discNoCCfile", "No client config file read; OpenShift client diagnostics will use flags and default configuration.")
84
-			env.WillCheck[ClientTarget] = true
85
-			adminPaths := []string{
86
-				"/etc/openshift/master/admin.kubeconfig",           // enterprise
87
-				"/openshift.local.config/master/admin.kubeconfig",  // origin systemd
88
-				"./openshift.local.config/master/admin.kubeconfig", // origin binary
89
-			}
90
-			adminWarningF := `
91
-No client config file was available; however, one exists at
92
-  %[1]s
93
-which is a standard location where the master generates it.
94
-If this is what you want to use, you should copy it to a standard location
95
-(~/.config/openshift/.config, or the current directory), or you can set the
96
-environment variable OPENSHIFTCONFIG in your ~/.bash_profile:
97
-  export OPENSHIFTCONFIG=%[1]s
98
-If this is not what you want, you should obtain a config file and
99
-place it in a standard location.
100
-`
101
-			// look for it in auto-generated locations when not found properly
102
-			for _, path := range adminPaths {
103
-				if conf := openConfigFile(path, "", env.Log); conf != nil {
104
-					env.Log.Warnf("discCCautoPath", adminWarningF, path)
105
-					break
106
-				}
107
-			}
108
-		}
109
-	}
110
-}
111
-
112
-// ----------------------------------------------------------
113
-// Attempt to open file at path as client config
114
-// If there is a problem and errmsg is set, log an error
115
-func openConfigFile(path string, errmsg string, logger *log.Logger) *clientcmdapi.Config {
116
-	var err error
117
-	var file *os.File
118
-	if path == "" { // empty param/envvar
119
-		return nil
120
-	} else if file, err = os.Open(path); err == nil {
121
-		logger.Debugm("discOpenCC", log.Msg{"tmpl": "Reading client config at {{.path}}", "path": path})
122
-	} else if errmsg == "" {
123
-		logger.Debugf("discOpenCCNo", "Could not read client config at %s:\n%#v", path, err)
124
-	} else if os.IsNotExist(err) {
125
-		logger.Error("discOpenCCNoExist", errmsg+"but that file does not exist.")
126
-	} else if os.IsPermission(err) {
127
-		logger.Error("discOpenCCNoPerm", errmsg+"but lack permission to read that file.")
128
-	} else {
129
-		logger.Errorf("discOpenCCErr", "%sbut there was an error opening it:\n%#v", errmsg, err)
130
-	}
131
-	if file != nil { // it is open for reading
132
-		defer file.Close()
133
-		if buffer, err := ioutil.ReadAll(file); err != nil {
134
-			logger.Errorf("discCCReadErr", "Unexpected error while reading client config file (%s): %v", path, err)
135
-		} else if conf, err := clientcmd.Load(buffer); err != nil {
136
-			logger.Errorf("discCCYamlErr", `
137
-Error reading YAML from client config file (%s):
138
-  %v
139
-This file may have been truncated or mis-edited.
140
-Please fix, remove, or obtain a new client config`, file.Name(), err)
141
-		} else {
142
-			logger.Infom("discCCRead", log.Msg{"tmpl": `Successfully read a client config file at '{{.path}}'`, "path": path})
143
-			/* Note, we're not going to use this config file directly.
144
-			 * Instead, we'll defer to the openshift client code to assimilate
145
-			 * flags, env vars, and the potential hierarchy of config files
146
-			 * into an actual configuration that the client uses.
147
-			 * However, for diagnostic purposes, record the first we find.
148
-			 */
149
-			return conf
150
-		}
151
-	}
152
-	return nil
153
-}
154
-
155
-/* The full client configuration may specify multiple contexts, each
156
- * of which could be a different server, a different user, a different
157
- * default project. We want to check which contexts have useful access,
158
- * and record those. At this point, we should already have the factory
159
- * for the current context. Factories embed config and a client cache,
160
- * and since we want to do discovery for every available context, we are
161
- * going to create a factory for each context. We will determine which
162
- * context actually has access to the default project, preferring the
163
- * current (default) context if it does. Connection errors should be
164
- * diagnosed along the way.
165
- */
166
-func (env *Environment) ConfigClient() {
167
-	if env.OsConfig != nil {
168
-		// TODO: run these in parallel, with a time limit so connection timeouts don't take forever
169
-		for cname, context := range env.OsConfig.Contexts {
170
-			// set context, create factory, see what's available
171
-			if env.FactoryForContext[cname] == nil {
172
-				//config := clientcmd.NewNonInteractiveClientConfig(env.Factory.OpenShiftClientConfig, cname, &clientcmd.ConfigOverrides{})
173
-				config := clientcmd.NewNonInteractiveClientConfig(*env.OsConfig, cname, &clientcmd.ConfigOverrides{})
174
-				f := osclientcmd.NewFactory(config)
175
-				//f.BindFlags(env.Flags.OpenshiftFlags)
176
-				env.FactoryForContext[cname] = f
177
-			}
178
-			if access := getContextAccess(env.FactoryForContext[cname], cname, context, env.Log); access != nil {
179
-				env.AccessForContext[cname] = access
180
-				if access.ClusterAdmin && (cname == env.OsConfig.CurrentContext || env.ClusterAdminFactory == nil) {
181
-					env.ClusterAdminFactory = env.FactoryForContext[cname]
182
-				}
183
-			}
184
-		}
185
-	}
186
-}
187
-
188
-// for now, only try to determine what namespaces a user can see
189
-func getContextAccess(factory *osclientcmd.Factory, ctxName string, ctx clientcmdapi.Context, logger *log.Logger) *ContextAccess {
190
-	// start by getting ready to log the result
191
-	msgText := "Testing client config context {{.context}}\nServer: {{.server}}\nUser: {{.user}}\n\n"
192
-	msg := log.Msg{"id": "discCCctx", "tmpl": msgText}
193
-	if config, err := factory.OpenShiftClientConfig.RawConfig(); err != nil {
194
-		logger.Errorf("discCCstart", "Could not read client config: (%T) %[1]v", err)
195
-		return nil
196
-	} else {
197
-		msg["context"] = ctxName
198
-		msg["server"] = config.Clusters[ctx.Cluster].Server
199
-		msg["user"] = ctx.AuthInfo
200
-	}
201
-	// actually go and request project list from the server
202
-	if osclient, _, err := factory.Clients(); err != nil {
203
-		logger.Errorf("discCCctxClients", "Failed to create client during discovery with error:\n(%T) %[1]v\nThis is probably an OpenShift bug.", err)
204
-		return nil
205
-	} else if projects, err := osclient.Projects().List(labels.Everything(), fields.Everything()); err == nil { // success!
206
-		list := projects.Items
207
-		if len(list) == 0 {
208
-			msg["tmpl"] = msgText + "Successfully requested project list, but it is empty, so user has no access to anything."
209
-			msg["projects"] = make([]string, 0)
210
-			logger.Infom("discCCctxSuccess", msg)
211
-			return nil
212
-		}
213
-		access := &ContextAccess{Projects: make([]string, len(list))}
214
-		for i, project := range list {
215
-			access.Projects[i] = project.Name
216
-			if project.Name == kapi.NamespaceDefault {
217
-				access.ClusterAdmin = true
218
-			}
219
-		}
220
-		if access.ClusterAdmin {
221
-			msg["tmpl"] = msgText + "Successfully requested project list; has access to default project, so assumed to be a cluster-admin"
222
-			logger.Infom("discCCctxSuccess", msg)
223
-		} else {
224
-			msg["tmpl"] = msgText + "Successfully requested project list; has access to project(s): {{.projectStr}}"
225
-			msg["projects"] = access.Projects
226
-			msg["projectStr"] = strings.Join(access.Projects, ", ")
227
-			logger.Infom("discCCctxSuccess", msg)
228
-		}
229
-		return access
230
-	} else { // something went wrong, so diagnose it
231
-		noResolveRx := regexp.MustCompile("dial tcp: lookup (\\S+): no such host")
232
-		unknownCaMsg := "x509: certificate signed by unknown authority"
233
-		unneededCaMsg := "specifying a root certificates file with the insecure flag is not allowed"
234
-		invalidCertNameRx := regexp.MustCompile("x509: certificate is valid for (\\S+, )+not (\\S+)")
235
-		connRefusedRx := regexp.MustCompile("dial tcp (\\S+): connection refused")
236
-		connTimeoutRx := regexp.MustCompile("dial tcp (\\S+): (?:connection timed out|i/o timeout)")
237
-		unauthenticatedMsg := `403 Forbidden: Forbidden: "/osapi/v1beta1/projects?namespace=" denied by default`
238
-		unauthorizedRx := regexp.MustCompile("401 Unauthorized: Unauthorized$")
239
-
240
-		malformedHTTPMsg := "malformed HTTP response"
241
-		malformedTLSMsg := "tls: oversized record received with length"
242
-
243
-		// interpret the error message for mere mortals
244
-		errm := err.Error()
245
-		var reason, errId string
246
-		switch {
247
-		case noResolveRx.MatchString(errm):
248
-			errId, reason = "clientNoResolve", `
249
-This usually means that the hostname does not resolve to an IP.
250
-Hostnames should usually be resolved via DNS or an /etc/hosts file.
251
-Ensure that the hostname resolves correctly from your host before proceeding.
252
-Of course, your config could also simply have the wrong hostname specified.
253
-`
254
-		case strings.Contains(errm, unknownCaMsg):
255
-			errId, reason = "clientUnknownCa", `
256
-This means that we cannot validate the certificate in use by the
257
-OpenShift API server, so we cannot securely communicate with it.
258
-Connections could be intercepted and your credentials stolen.
259
-
260
-Since the server certificate we see when connecting is not validated
261
-by public certificate authorities (CAs), you probably need to specify a
262
-certificate from a private CA to validate the connection.
263
-
264
-Your config may be specifying the wrong CA cert, or none, or there
265
-could actually be a man-in-the-middle attempting to intercept your
266
-connection.  If you are unconcerned about any of this, you can add the
---insecure-skip-tls-verify flag to bypass secure (TLS) verification,
267
-but this is risky and should not be necessary.
268
-** Connections could be intercepted and your credentials stolen. **
269
-`
270
-		case strings.Contains(errm, unneededCaMsg):
271
-			errId, reason = "clientUnneededCa", `
272
-This means that for client connections to the OpenShift API server, you
273
-(or your kubeconfig) specified both a validating certificate authority
274
-and that the client should bypass connection security validation.
275
-
276
-This is not allowed because it is likely to be a mistake.
277
-
278
-If you want to use --insecure-skip-tls-verify to bypass security (which
279
-is usually a bad idea anyway), then you need to also clear the CA cert
280
-from your command line options or kubeconfig file(s). Of course, it
281
-would be far better to obtain and use a correct CA cert.
282
-`
283
-		case invalidCertNameRx.MatchString(errm):
284
-			match := invalidCertNameRx.FindStringSubmatch(errm)
285
-			serverHost := match[len(match)-1]
286
-			errId, reason = "clientInvCertName", fmt.Sprintf(`
287
-This means that the certificate in use by the OpenShift API server
288
-(master) does not match the hostname by which you are addressing it:
289
-  %s
290
-so a secure connection is not allowed. In theory, this *could* mean that
291
-someone is intercepting your connection and presenting a certificate
292
-that is valid but for a different server, which is why secure validation
293
-fails in this case.
294
-
295
-However, the most likely explanation is that the server certificate
296
-needs to be updated to include the name you are using to reach it.
297
-
298
-If the OpenShift server is generating its own certificates (which
299
-is default), then the --public-master flag on the OpenShift master is
300
-usually the easiest way to do this. If you need something more complicated
301
-(for instance, multiple public addresses for the API, or your own CA),
302
-then you will need to custom-generate the server certificate with the
303
-right names yourself.
304
-
305
-If you are unconcerned about any of this, you can add the
---insecure-skip-tls-verify flag to bypass secure (TLS) verification,
306
-but this is risky and should not be necessary.
307
-** Connections could be intercepted and your credentials stolen. **
308
-`, serverHost)
309
-		case connRefusedRx.MatchString(errm):
310
-			errId, reason = "clientInvCertName", `
311
-This means that when we tried to connect to the OpenShift API
312
-server (master), we reached the host, but nothing accepted the port
313
-connection. This could mean that the OpenShift master is stopped, or
314
-that a firewall or security policy is blocking access at that port.
315
-
316
-You will not be able to connect or do anything at all with OpenShift
317
-until this server problem is resolved or you specify a corrected
318
-server address.`
319
-		case connTimeoutRx.MatchString(errm):
320
-			errId, reason = "clientConnTimeout", `
321
-This means that when we tried to connect to the OpenShift API server
322
-(master), we could not reach the host at all.
323
-* You may have specified the wrong host address.
324
-* This could mean the host is completely unavailable (down).
325
-* This could indicate a routing problem or a firewall that simply
326
-  drops requests rather than responding by reseting the connection.
327
-* It does not generally mean that DNS name resolution failed (which
328
-  would be a different error) though the problem could be that it
329
-  gave the wrong address.`
330
-		case strings.Contains(errm, malformedHTTPMsg):
331
-			errId, reason = "clientMalformedHTTP", `
332
-This means that when we tried to connect to the OpenShift API server
333
-(master) with a plain HTTP connection, the server did not speak
334
-HTTP back to us. The most common explanation is that a secure server
335
-is listening but you specified an http: connection instead of https:.
336
-There could also be another service listening at the intended port
337
-speaking some other protocol entirely.
338
-
339
-You will not be able to connect or do anything at all with OpenShift
340
-until this server problem is resolved or you specify a corrected
341
-server address.`
342
-		case strings.Contains(errm, malformedTLSMsg):
343
-			errId, reason = "clientMalformedTLS", `
344
-This means that when we tried to connect to the OpenShift API server
345
-(master) with a secure HTTPS connection, the server did not speak
346
-HTTPS back to us. The most common explanation is that the server
347
-listening at that port is not the secure server you expected - it
348
-may be a non-secure HTTP server or the wrong service may be
349
-listening there, or you may have specified an incorrect port.
350
-
351
-You will not be able to connect or do anything at all with OpenShift
352
-until this server problem is resolved or you specify a corrected
353
-server address.`
354
-		case strings.Contains(errm, unauthenticatedMsg):
355
-			errId, reason = "clientUnauthn", `
356
-This means that when we tried to make a request to the OpenShift API
357
-server, your kubeconfig did not present valid credentials to
358
-authenticate your client. Credentials generally consist of a client
359
-key/certificate or an access token. Your kubeconfig may not have
360
-presented any, or they may be invalid.`
361
-		case unauthorizedRx.MatchString(errm):
362
-			errId, reason = "clientUnauthz", `
363
-This means that when we tried to make a request to the OpenShift API
364
-server, the request required credentials that were not presented.
365
-This can happen when an authentication token expires. Try logging in
366
-with this user again.`
367
-		default:
368
-			errId, reason = "clientUnknownConnErr", `Diagnostics does not have an explanation for what this means. Please report this error so one can be added.`
369
-		}
370
-		errMsg := fmt.Sprintf("(%T) %[1]v", err)
371
-		msg["tmpl"] = msgText + errMsg + reason
372
-		msg["errMsg"] = errMsg
373
-		logger.Errorm(errId, msg)
374
-	}
375
-	return nil
376
-}
377 1
deleted file mode 100644
... ...
@@ -1,19 +0,0 @@
1
-package discovery
2
-
3
-import (
4
-	"os/exec"
5
-	"runtime"
6
-)
7
-
8
-// ----------------------------------------------------------
9
-// Determine what we need to about the OS
10
-func (env *Environment) DiscoverOperatingSystem() {
11
-	if runtime.GOOS == "linux" {
12
-		if _, err := exec.LookPath("systemctl"); err == nil {
13
-			env.HasSystemd = true
14
-		}
15
-		if _, err := exec.LookPath("/bin/bash"); err == nil {
16
-			env.HasBash = true
17
-		}
18
-	}
19
-}
20 1
new file mode 100644
... ...
@@ -0,0 +1,46 @@
0
+package host
1
+
2
+import (
3
+	"errors"
4
+
5
+	configapilatest "github.com/openshift/origin/pkg/cmd/server/api/latest"
6
+	configvalidation "github.com/openshift/origin/pkg/cmd/server/api/validation"
7
+	"github.com/openshift/origin/pkg/diagnostics/types"
8
+)
9
+
10
+// MasterConfigCheck
11
+type MasterConfigCheck struct {
12
+	MasterConfigFile string
13
+}
14
+
15
+func (d MasterConfigCheck) Name() string {
16
+	return "MasterConfigCheck"
17
+}
18
+
19
+func (d MasterConfigCheck) Description() string {
20
+	return "Check the master config file"
21
+}
22
+func (d MasterConfigCheck) CanRun() (bool, error) {
23
+	if len(d.MasterConfigFile) == 0 {
24
+		return false, errors.New("must have master config file")
25
+	}
26
+
27
+	return true, nil
28
+}
29
+func (d MasterConfigCheck) Check() *types.DiagnosticResult {
30
+	r := types.NewDiagnosticResult("MasterConfigCheck")
31
+
32
+	r.Debugf("discMCfile", "Looking for master config file at '%s'", d.MasterConfigFile)
33
+	masterConfig, err := configapilatest.ReadAndResolveMasterConfig(d.MasterConfigFile)
34
+	if err != nil {
35
+		r.Errorf("discMCfail", err, "Could not read master config file '%s':\n(%T) %[2]v", d.MasterConfigFile, err)
36
+		return r
37
+	}
38
+
39
+	r.Infof("discMCfound", "Found a master config file: %[1]s", d.MasterConfigFile)
40
+
41
+	for _, err := range configvalidation.ValidateMasterConfig(masterConfig).Errors {
42
+		r.Errorf("discMCinvalid", err, "Validation of master config file '%s' failed:\n(%T) %[2]v", d.MasterConfigFile, err)
43
+	}
44
+	return r
45
+}
0 46
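
MasterConfigCheck, and NodeConfigCheck just below, share one shape: read the file, return a single error result if it is unreadable, and otherwise run every validator, reporting each failure rather than stopping at the first. A minimal sketch; the validator and the path in main are hypothetical:

    package main

    import (
        "fmt"
        "os"
    )

    // A validator inspects raw config bytes and returns zero or more problems.
    type validator func(data []byte) []error

    // checkConfigFile reads a config file and accumulates validation errors
    // instead of stopping at the first one.
    func checkConfigFile(path string, validators []validator) []error {
        data, err := os.ReadFile(path)
        if err != nil {
            return []error{fmt.Errorf("could not read config file %q: (%T) %v", path, err, err)}
        }
        var problems []error
        for _, v := range validators {
            problems = append(problems, v(data)...)
        }
        return problems
    }

    func main() {
        notEmpty := func(data []byte) []error {
            if len(data) == 0 {
                return []error{fmt.Errorf("config file is empty")}
            }
            return nil
        }
        // Hypothetical path, for illustration only.
        for _, err := range checkConfigFile("/etc/openshift/master/master-config.yaml",
            []validator{notEmpty}) {
            fmt.Println("ERROR:", err)
        }
    }
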
new file mode 100644
... ...
@@ -0,0 +1,45 @@
0
+package host
1
+
2
+import (
3
+	"errors"
4
+
5
+	configapilatest "github.com/openshift/origin/pkg/cmd/server/api/latest"
6
+	configvalidation "github.com/openshift/origin/pkg/cmd/server/api/validation"
7
+	"github.com/openshift/origin/pkg/diagnostics/types"
8
+)
9
+
10
+// NodeConfigCheck
11
+type NodeConfigCheck struct {
12
+	NodeConfigFile string
13
+}
14
+
15
+func (d NodeConfigCheck) Name() string {
16
+	return "NodeConfigCheck"
17
+}
18
+
19
+func (d NodeConfigCheck) Description() string {
20
+	return "Check the node config file"
21
+}
22
+func (d NodeConfigCheck) CanRun() (bool, error) {
23
+	if len(d.NodeConfigFile) == 0 {
24
+		return false, errors.New("must have node config file")
25
+	}
26
+
27
+	return true, nil
28
+}
29
+func (d NodeConfigCheck) Check() *types.DiagnosticResult {
30
+	r := types.NewDiagnosticResult("NodeConfigCheck")
31
+	r.Debugf("discNCfile", "Looking for node config file at '%s'", d.NodeConfigFile)
32
+	nodeConfig, err := configapilatest.ReadAndResolveNodeConfig(d.NodeConfigFile)
33
+	if err != nil {
34
+		r.Errorf("discNCfail", err, "Could not read node config file '%s':\n(%T) %[2]v", d.NodeConfigFile, err)
35
+		return r
36
+	}
37
+
38
+	r.Infof("discNCfound", "Found a node config file: %[1]s", d.NodeConfigFile)
39
+
40
+	for _, err := range configvalidation.ValidateNodeConfig(nodeConfig) {
41
+		r.Errorf("discNCinvalid", err, "Validation of node config file '%s' failed:\n(%T) %[2]v", d.NodeConfigFile, err)
42
+	}
43
+	return r
44
+}
... ...
@@ -12,7 +12,7 @@ type jsonLogger struct {
12 12
 	logFinished bool
13 13
 }
14 14
 
15
-func (j *jsonLogger) Write(entry LogEntry) {
15
+func (j *jsonLogger) Write(entry Entry) {
16 16
 	if j.logStarted {
17 17
 		fmt.Fprintln(j.out, ",")
18 18
 	} else {
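
The logStarted bookkeeping exists because entries are streamed as elements of a single JSON array: the first Write opens the bracket, each later Write is preceded by a comma, and Finish closes the array. A compact standalone version of the same idea:

    package main

    import (
        "encoding/json"
        "fmt"
        "io"
        "os"
    )

    // arrayLogger streams values as elements of one JSON array, so entries
    // never need to be buffered in memory all at once.
    type arrayLogger struct {
        out     io.Writer
        started bool
    }

    func (l *arrayLogger) Write(v interface{}) error {
        if l.started {
            fmt.Fprintln(l.out, ",")
        } else {
            fmt.Fprintln(l.out, "[")
            l.started = true
        }
        b, err := json.Marshal(v)
        if err != nil {
            return err
        }
        _, err = l.out.Write(b)
        return err
    }

    func (l *arrayLogger) Finish() {
        if l.started {
            fmt.Fprintln(l.out, "\n]")
        }
    }

    func main() {
        l := &arrayLogger{out: os.Stdout}
        l.Write(map[string]string{"id": "sumWarn", "text": "Warnings seen: 2"})
        l.Write(map[string]string{"id": "sumErr", "text": "Errors seen: 1"})
        l.Finish() // the output is one valid JSON array
    }
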
... ...
@@ -7,8 +7,11 @@ import (
7 7
 	ct "github.com/daviddengcn/go-colortext"
8 8
 	"io"
9 9
 	"io/ioutil"
10
+	"runtime"
10 11
 	"strings"
11 12
 	"text/template"
13
+
14
+	"github.com/openshift/origin/pkg/version"
12 15
 )
13 16
 
14 17
 type LoggerOptions struct {
... ...
@@ -35,6 +38,14 @@ type Level struct {
35 35
 	Bright bool
36 36
 }
37 37
 
38
+func (l Level) MarshalJSON() ([]byte, error) {
39
+	return []byte(`"` + l.Name + `"`), nil
40
+}
41
+
42
+func (l Level) MarshalYAML() (interface{}, error) {
43
+	return l.Name, nil
44
+}
45
+
38 46
 type Logger struct {
39 47
 	loggerType
40 48
 	level        Level
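
These marshalers make a Level serialize as its bare name, so a JSON log entry reads "level":"warn" rather than a nested object. A runnable check of the JSON side follows; the color fields of the real Level are omitted, and the YAML method is assumed to follow go-yaml's Marshaler convention:

    package main

    import (
        "encoding/json"
        "fmt"
    )

    type Level struct {
        Level  int
        Name   string
        Prefix string
    }

    // MarshalJSON emits the level as a bare string, e.g. "warn", instead
    // of the default {"Level":3,"Name":"warn","Prefix":"WARN:  "} object.
    func (l Level) MarshalJSON() ([]byte, error) {
        return []byte(`"` + l.Name + `"`), nil
    }

    func main() {
        entry := struct {
            ID    string `json:"id"`
            Level Level  `json:"level"`
        }{ID: "sumWarn", Level: Level{3, "warn", "WARN:  "}}

        b, _ := json.Marshal(entry)
        fmt.Println(string(b)) // {"id":"sumWarn","level":"warn"}
    }
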
... ...
@@ -44,7 +55,7 @@ type Logger struct {
44 44
 
45 45
 // Internal type to deal with different log formats
46 46
 type loggerType interface {
47
-	Write(LogEntry)
47
+	Write(Entry)
48 48
 	Finish()
49 49
 }
50 50
 
... ...
@@ -85,18 +96,23 @@ func NewLogger(setLevel int, setFormat string, out io.Writer) (*Logger, error) {
85 85
 }
86 86
 
87 87
 type Message struct {
88
-	ID       string
89
-	Template string
90
-
88
+	// ID: an identifier unique to the message being logged, intended for json/yaml output
89
+	//     so that automation can recognize specific messages without trying to parse them.
90
+	ID string `json:"-" yaml:"-"`
91
+	// Template: a template string as understood by text/template that can use any of the
92
+	//           TemplateData entries in this Message as inputs.
93
+	Template string `json:"-" yaml:"-"`
91 94
 	// TemplateData is passed to template executor to complete the message
92
-	TemplateData interface{}
95
+	TemplateData interface{} `json:"data,omitempty" yaml:"data,omitempty"`
93 96
 
94
-	EvaluatedText string
97
+	EvaluatedText string `json:"text" yaml:"text"` // human-readable message text
95 98
 }
96 99
 
100
+type Hash map[string]interface{} // convenience/cosmetic type
101
+
97 102
 func (m Message) String() string {
98 103
 	if len(m.EvaluatedText) > 0 {
99
-		return fmt.Sprintf("%s: %s", m.EvaluatedText)
104
+		return m.EvaluatedText
100 105
 	}
101 106
 
102 107
 	if len(m.Template) == 0 {
... ...
@@ -105,7 +121,7 @@ func (m Message) String() string {
105 105
 
106 106
 	// if given a template, convert it to text
107 107
 	parsedTmpl, err := template.New(m.ID).Parse(m.Template)
108
-	if err != nil {
108
+	if err != nil { // unless the template is broken of course
109 109
 		return fmt.Sprintf("%s: %s %#v: %v", m.ID, m.Template, m.TemplateData, err)
110 110
 	}
111 111
 
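
The template handling above parses the message's Template and, on failure, falls back to a debug dump of ID, template, and data. The execute half is outside this hunk but follows the standard text/template pattern; here is a standalone sketch of the whole render path:

    package main

    import (
        "bytes"
        "fmt"
        "text/template"
    )

    type Hash map[string]interface{}

    // render evaluates a message template against its data, falling back
    // to a debug dump if the template cannot be parsed or executed.
    func render(id, tmpl string, data Hash) string {
        parsed, err := template.New(id).Parse(tmpl)
        if err != nil {
            return fmt.Sprintf("%s: %s %#v: %v", id, tmpl, data, err)
        }
        var buf bytes.Buffer
        if err := parsed.Execute(&buf, data); err != nil {
            return fmt.Sprintf("%s: %s %#v: %v", id, tmpl, data, err)
        }
        return buf.String()
    }

    func main() {
        fmt.Println(render("clNodeNotSched",
            "Node {{.node}} is ready but is marked Unschedulable.",
            Hash{"node": "node1"}))
        // Output: Node node1 is ready but is marked Unschedulable.
    }
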
... ...
@@ -118,23 +134,13 @@ func (m Message) String() string {
118 118
 	return buff.String()
119 119
 }
120 120
 
121
-type LogEntry struct {
122
-	Level Level
123
-	Message
121
+type Entry struct {
122
+	ID      string `json:"id"`
123
+	Origin  string `json:"origin"`
124
+	Level   Level  `json:"level"`
125
+	Message `yaml:"-,inline"`
124 126
 }
125 127
 
126
-/* a Msg can be expected to have the following entries:
127
- * "id": an identifier unique to the message being logged, intended for json/yaml output
128
- *       so that automation can recognize specific messages without trying to parse them.
129
- * "text": human-readable message text
130
- * "tmpl": a template string as understood by text/template that can use any of the other
131
- *         entries in this Msg as inputs. This is removed, evaluated, and the result is
132
- *         placed in "text". If there is an error during evaluation, the error is placed
133
- *         in "templateErr", the original id of the message is stored in "templateId",
134
- *         and the Msg id is changed to "tmplErr". Of course, this should never happen
135
- *         if there are no mistakes in the calling code.
136
- */
137
-
138 128
 var (
139 129
 	ErrorLevel  = Level{4, "error", "ERROR: ", ct.Red, true}   // Something is definitely wrong
140 130
 	WarnLevel   = Level{3, "warn", "WARN:  ", ct.Yellow, true} // Likely to be an issue but maybe not
... ...
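Given the struct tags above and Level's MarshalJSON, an Entry flattens cleanly for machine consumption: the embedded Message contributes only "text" (plus "data" when template data is present), and the level serializes as its name. A sketch of the resulting JSON, assuming encoding/json (field values illustrative):

    entry := log.Entry{
    	ID:      "sdUnitInactive",
    	Origin:  "diagnostic UnitStatus",
    	Level:   log.WarnLevel,
    	Message: log.Message{EvaluatedText: "unit is enabled but not active"},
    }
    b, _ := json.Marshal(entry)
    fmt.Println(string(b))
    // {"id":"sdUnitInactive","origin":"diagnostic UnitStatus","level":"warn","text":"unit is enabled but not active"}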
@@ -144,136 +150,126 @@ var (
144 144
 )
145 145
 
146 146
 // Provide a summary at the end
147
-func (l *Logger) Summary() {
148
-	l.Notice("summary", "\nSummary of diagnostics execution:\n")
149
-	if l.warningsSeen > 0 {
150
-		l.Noticef("sumWarn", "Warnings seen: %d", l.warningsSeen)
147
+func (l *Logger) Summary(warningsSeen int, errorsSeen int) {
148
+	l.Noticef("summary", "\nSummary of diagnostics execution (version %v):\n", version.Get())
149
+	if warningsSeen > 0 {
150
+		l.Noticet("sumWarn", "Warnings seen: {{.warnings}}", Hash{"warnings": warningsSeen})
151 151
 	}
152
-	if l.errorsSeen > 0 {
153
-		l.Noticef("sumErr", "Errors seen: %d", l.errorsSeen)
152
+	if errorsSeen > 0 {
153
+		l.Noticet("sumErr", "Errors seen: {{.errors}}", Hash{"errors": errorsSeen})
154 154
 	}
155
-	if l.warningsSeen == 0 && l.errorsSeen == 0 {
155
+	if warningsSeen == 0 && errorsSeen == 0 {
156 156
 		l.Notice("sumNone", "Completed with no errors or warnings seen.")
157 157
 	}
158 158
 }
159 159
 
160
-func (l *Logger) LogMessage(level Level, message Message) {
161
-	// if there's no logger, return silently
162
-	if l == nil {
160
+func (l *Logger) LogEntry(entry Entry) {
161
+	if l == nil { // if there's no logger, return silently
163 162
 		return
164 163
 	}
165
-
166
-	// track how many of every type we've seen (probably unnecessary)
167
-	if level.Level == ErrorLevel.Level {
168
-		l.errorsSeen += 1
169
-	} else if level.Level == WarnLevel.Level {
170
-		l.warningsSeen += 1
171
-	}
172
-
173
-	if level.Level < l.level.Level {
174
-		return
175
-	}
176
-
177
-	if len(message.Template) == 0 {
178
-		l.Write(LogEntry{level, message})
164
+	if entry.Level.Level < l.level.Level { // logging level says skip this entry
179 165
 		return
180 166
 	}
181 167
 
182
-	// if given a template, convert it to text
183
-	parsedTmpl, err := template.New(message.ID).Parse(message.Template)
184
-	if err != nil {
185
-		templateErrorMessage := Message{
186
-			ID: "templateParseErr",
187
-			TemplateData: map[string]interface{}{
188
-				"error":           err.Error(),
189
-				"originalMessage": message,
190
-			},
168
+	if msg := &entry.Message; msg.EvaluatedText == "" && msg.Template != "" {
169
+		// if given a template instead of text, convert it to text
170
+		parsedTmpl, err := template.New(msg.ID).Parse(msg.Template)
171
+		if err != nil {
172
+			entry.Message = Message{
173
+				ID: "templateParseErr",
174
+				TemplateData: Hash{
175
+					"error":           err.Error(),
176
+					"originalMessage": msg,
177
+				},
178
+				EvaluatedText: fmt.Sprintf("Error parsing template for %s:\n%s=== Error was:\n%v\nOriginal message:\n%#v", msg.ID, msg.Template, err, msg),
179
+			}
180
+			entry.ID = entry.Message.ID
181
+			l.Write(entry)
182
+			return
191 183
 		}
192
-		l.LogMessage(level, templateErrorMessage)
193
-		return
194
-	}
195 184
 
196
-	var buff bytes.Buffer
197
-	err = parsedTmpl.Execute(&buff, message.TemplateData)
198
-	if err != nil {
199
-		templateErrorMessage := Message{
200
-			ID: "templateParseErr",
201
-			TemplateData: map[string]interface{}{
202
-				"error":           err.Error(),
203
-				"originalMessage": message,
204
-			},
185
+		var buff bytes.Buffer
186
+		err = parsedTmpl.Execute(&buff, msg.TemplateData)
187
+		if err != nil {
188
+			entry.Message = Message{
189
+				ID: "templateExecErr",
190
+				TemplateData: Hash{
191
+					"error":           err.Error(),
192
+					"originalMessage": msg,
193
+				},
194
+				EvaluatedText: fmt.Sprintf("Error executing template for %s:\n%s=== Error was:\n%v\nOriginal message:\n%#v", msg.ID, msg.Template, err, msg),
195
+			}
196
+			entry.ID = entry.Message.ID
197
+			l.Write(entry)
198
+			return
205 199
 		}
206
-		l.LogMessage(level, templateErrorMessage)
207
-		return
208 200
 
201
+		msg.EvaluatedText = buff.String()
209 202
 	}
210 203
 
211
-	message.EvaluatedText = buff.String()
212
-	l.Write(LogEntry{level, message})
204
+	l.Write(entry)
213 205
 }
214 206
 
215 207
 // Convenience functions
216 208
 func (l *Logger) Error(id string, text string) {
217
-	l.Logp(ErrorLevel, id, text)
209
+	l.logp(ErrorLevel, id, text)
218 210
 }
219 211
 func (l *Logger) Errorf(id string, msg string, a ...interface{}) {
220
-	l.Logpf(ErrorLevel, id, msg, a...)
212
+	l.logf(ErrorLevel, id, msg, a...)
221 213
 }
222
-func (l *Logger) Errorm(message Message) {
223
-	l.LogMessage(ErrorLevel, message)
214
+func (l *Logger) Errort(id string, template string, data interface{}) {
215
+	l.logt(ErrorLevel, id, template, data)
224 216
 }
225 217
 func (l *Logger) Warn(id string, text string) {
226
-	l.Logp(WarnLevel, id, text)
218
+	l.logp(WarnLevel, id, text)
227 219
 }
228 220
 func (l *Logger) Warnf(id string, msg string, a ...interface{}) {
229
-	l.Logpf(WarnLevel, id, msg, a...)
230
-}
231
-func (l *Logger) Warnm(message Message) {
232
-	l.LogMessage(WarnLevel, message)
221
+	l.logf(WarnLevel, id, msg, a...)
233 222
 }
234 223
 func (l *Logger) Info(id string, text string) {
235
-	l.Logp(InfoLevel, id, text)
224
+	l.logp(InfoLevel, id, text)
236 225
 }
237 226
 func (l *Logger) Infof(id string, msg string, a ...interface{}) {
238
-	l.Logpf(InfoLevel, id, msg, a...)
239
-}
240
-func (l *Logger) Infom(message Message) {
241
-	l.LogMessage(InfoLevel, message)
227
+	l.logf(InfoLevel, id, msg, a...)
242 228
 }
243 229
 func (l *Logger) Notice(id string, text string) {
244
-	l.Logp(NoticeLevel, id, text)
230
+	l.logp(NoticeLevel, id, text)
245 231
 }
246 232
 func (l *Logger) Noticef(id string, msg string, a ...interface{}) {
247
-	l.Logpf(NoticeLevel, id, msg, a...)
233
+	l.logf(NoticeLevel, id, msg, a...)
248 234
 }
249
-func (l *Logger) Noticem(message Message) {
250
-	l.LogMessage(NoticeLevel, message)
235
+func (l *Logger) Noticet(id string, template string, data interface{}) {
236
+	l.logt(NoticeLevel, id, template, data)
251 237
 }
252 238
 func (l *Logger) Debug(id string, text string) {
253
-	l.Logp(DebugLevel, id, text)
239
+	l.logp(DebugLevel, id, text)
254 240
 }
255 241
 func (l *Logger) Debugf(id string, msg string, a ...interface{}) {
256
-	l.Logpf(DebugLevel, id, msg, a...)
257
-}
258
-func (l *Logger) Debugm(message Message) {
259
-	l.LogMessage(DebugLevel, message)
242
+	l.logf(DebugLevel, id, msg, a...)
260 243
 }
261 244
 
262
-func (l *Logger) Logp(level Level, id string, text string) {
263
-	l.LogMessage(level, Message{ID: id, EvaluatedText: text})
245
+func origin(skip int) string {
246
+	if _, file, _, ok := runtime.Caller(skip + 1); ok {
247
+		paths := strings.SplitAfter(file, "github.com/")
248
+		return "controller " + paths[len(paths)-1]
249
+	} else {
250
+		return "unknown"
251
+	}
252
+}
253
+func (l *Logger) logp(level Level, id string, text string) {
254
+	l.LogEntry(Entry{id, origin(1), level, Message{ID: id, EvaluatedText: text}})
264 255
 }
265
-func (l *Logger) Logpf(level Level, id string, msg string, a ...interface{}) {
266
-	l.Logp(level, id, fmt.Sprintf(msg, a...))
256
+func (l *Logger) logf(level Level, id string, msg string, a ...interface{}) {
257
+	l.LogEntry(Entry{id, origin(1), level, Message{ID: id, EvaluatedText: fmt.Sprintf(msg, a...)}})
258
+}
259
+func (l *Logger) logt(level Level, id string, template string, data interface{}) {
260
+	l.LogEntry(Entry{id, origin(1), level, Message{ID: id, Template: template, TemplateData: data}})
267 261
 }
268 262
 
269 263
 func (l *Logger) Finish() {
270 264
 	l.loggerType.Finish()
271 265
 }
272 266
 
273
-func (l *Logger) ErrorsSeen() bool {
274
-	return l.errorsSeen > 0
275
-}
276
-
277 267
 // turn excess lines into [...]
278 268
 func LimitLines(msg string, n int) string {
279 269
 	lines := strings.SplitN(msg, "\n", n+1)
... ...
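After the refactor each level keeps up to three entry points: plain text, Printf-style ("f" suffix), and template-style ("t" suffix, defined only for the levels that currently use templates), and each stamps the entry with the caller's location via origin(). A usage sketch (IDs illustrative):

    logger.Notice("diagPlain", "pre-evaluated text")
    logger.Noticef("diagFmt", "formatted: %d warnings", 2)
    logger.Noticet("diagTmpl", "templated: {{.warnings}} warnings", log.Hash{"warnings": 2})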
@@ -31,11 +31,14 @@ func IsTerminal(w io.Writer) bool {
31 31
 	return ok && term.IsTerminal(file.Fd())
32 32
 }
33 33
 
34
-func (t *textLogger) Write(entry LogEntry) {
34
+func (t *textLogger) Write(entry Entry) {
35 35
 	if t.ttyOutput {
36 36
 		ct.ChangeColor(entry.Level.Color, entry.Level.Bright, ct.None, false)
37 37
 	}
38
-	text := strings.TrimSpace(entry.EvaluatedText)
38
+	text := strings.TrimSpace(entry.Message.EvaluatedText)
39
+	if entry.Level.Level >= WarnLevel.Level {
40
+		text = fmt.Sprintf("[ID \"%s\" from %s]\n", entry.ID, entry.Origin) + text
41
+	}
39 42
 	if strings.Contains(text, "\n") { // separate multiline comments with newlines
40 43
 		if !t.lastNewline {
41 44
 			fmt.Fprintln(t.out) // separate from previous one-line log msg
... ...
@@ -11,7 +11,7 @@ type yamlLogger struct {
11 11
 	logStarted bool
12 12
 }
13 13
 
14
-func (y *yamlLogger) Write(entry LogEntry) {
14
+func (y *yamlLogger) Write(entry Entry) {
15 15
 	b, _ := yaml.Marshal(&entry)
16 16
 	fmt.Fprintln(y.out, "---\n"+string(b))
17 17
 }
18 18
deleted file mode 100644
... ...
@@ -1,48 +0,0 @@
1
-package master
2
-
3
-import (
4
-	"errors"
5
-
6
-	configapilatest "github.com/openshift/origin/pkg/cmd/server/api/latest"
7
-	configvalidation "github.com/openshift/origin/pkg/cmd/server/api/validation"
8
-	"github.com/openshift/origin/pkg/diagnostics/log"
9
-)
10
-
11
-// MasterConfigCheck
12
-type MasterConfigCheck struct {
13
-	MasterConfigFile string
14
-
15
-	Log *log.Logger
16
-}
17
-
18
-func (d MasterConfigCheck) Description() string {
19
-	return "Check the master config file"
20
-}
21
-func (d MasterConfigCheck) CanRun() (bool, error) {
22
-	if len(d.MasterConfigFile) == 0 {
23
-		return false, errors.New("must have master config file")
24
-	}
25
-
26
-	return true, nil
27
-}
28
-func (d MasterConfigCheck) Check() (bool, []log.Message, []error, []error) {
29
-	if _, err := d.CanRun(); err != nil {
30
-		return false, nil, nil, []error{err}
31
-	}
32
-
33
-	d.Log.Debugf("discMCfile", "Looking for master config file at '%s'", d.MasterConfigFile)
34
-	masterConfig, err := configapilatest.ReadAndResolveMasterConfig(d.MasterConfigFile)
35
-	if err != nil {
36
-		d.Log.Errorf("discMCfail", "Could not read master config file '%s':\n(%T) %[2]v", d.MasterConfigFile, err)
37
-
38
-		return false, nil, nil, []error{err}
39
-	}
40
-
41
-	d.Log.Infof("discMCfound", "Found a master config file:\n%[1]s", d.MasterConfigFile)
42
-
43
-	if validationResults := configvalidation.ValidateMasterConfig(masterConfig); len(validationResults.Errors) > 0 {
44
-		return false, nil, nil, validationResults.Errors
45
-	}
46
-
47
-	return true, nil, nil, nil
48
-}
49 1
deleted file mode 100644
... ...
@@ -1,48 +0,0 @@
1
-package node
2
-
3
-import (
4
-	"errors"
5
-
6
-	configapilatest "github.com/openshift/origin/pkg/cmd/server/api/latest"
7
-	configvalidation "github.com/openshift/origin/pkg/cmd/server/api/validation"
8
-	"github.com/openshift/origin/pkg/diagnostics/log"
9
-)
10
-
11
-// NodeConfigCheck
12
-type NodeConfigCheck struct {
13
-	NodeConfigFile string
14
-
15
-	Log *log.Logger
16
-}
17
-
18
-func (d NodeConfigCheck) Description() string {
19
-	return "Check the node config file"
20
-}
21
-func (d NodeConfigCheck) CanRun() (bool, error) {
22
-	if len(d.NodeConfigFile) == 0 {
23
-		return false, errors.New("must have node config file")
24
-	}
25
-
26
-	return true, nil
27
-}
28
-func (d NodeConfigCheck) Check() (bool, []log.Message, []error, []error) {
29
-	if _, err := d.CanRun(); err != nil {
30
-		return false, nil, nil, []error{err}
31
-	}
32
-
33
-	d.Log.Debugf("discNCfile", "Looking for node config file at '%s'", d.NodeConfigFile)
34
-	nodeConfig, err := configapilatest.ReadAndResolveNodeConfig(d.NodeConfigFile)
35
-	if err != nil {
36
-		d.Log.Errorf("discNCfail", "Could not read node config file '%s':\n(%T) %[2]v", d.NodeConfigFile, err)
37
-
38
-		return false, nil, nil, []error{err}
39
-	}
40
-
41
-	d.Log.Infof("discNCfound", "Found a node config file:\n%[1]s", d.NodeConfigFile)
42
-
43
-	if validationErrors := configvalidation.ValidateNodeConfig(nodeConfig); len(validationErrors) > 0 {
44
-		return false, nil, nil, validationErrors
45
-	}
46
-
47
-	return true, nil, nil, nil
48
-}
... ...
@@ -3,38 +3,44 @@ package systemd
3 3
 import (
4 4
 	"bufio"
5 5
 	"encoding/json"
6
-	"fmt"
7 6
 	"io"
8 7
 	"os/exec"
8
+	"strconv"
9
+	"time"
9 10
 
10 11
 	"github.com/openshift/origin/pkg/diagnostics/log"
11 12
 	"github.com/openshift/origin/pkg/diagnostics/types"
12
-	"github.com/openshift/origin/pkg/diagnostics/types/diagnostic"
13
+)
14
+
15
+const (
16
+	sdLogReadErr = `Diagnostics failed to query journalctl for the '%s' unit logs.
17
+This should be very unusual, so please report this error:
18
+%s`
13 19
 )
14 20
 
15 21
 // AnalyzeLogs
16 22
 type AnalyzeLogs struct {
17 23
 	SystemdUnits map[string]types.SystemdUnit
24
+}
18 25
 
19
-	Log *log.Logger
26
+func (d AnalyzeLogs) Name() string {
27
+	return "AnalyzeLogs"
20 28
 }
21 29
 
22 30
 func (d AnalyzeLogs) Description() string {
23
-	return "Check for problems in systemd service logs since each service last started"
31
+	return "Check for recent problems in systemd service logs"
24 32
 }
33
+
25 34
 func (d AnalyzeLogs) CanRun() (bool, error) {
26 35
 	return true, nil
27 36
 }
28
-func (d AnalyzeLogs) Check() (bool, []log.Message, []error, []error) {
29
-	infos := []log.Message{}
30
-	warnings := []error{}
31
-	errors := []error{}
37
+
38
+func (d AnalyzeLogs) Check() *types.DiagnosticResult {
39
+	r := types.NewDiagnosticResult("AnalyzeLogs")
32 40
 
33 41
 	for _, unit := range unitLogSpecs {
34 42
 		if svc := d.SystemdUnits[unit.Name]; svc.Enabled || svc.Active {
35
-			checkMessage := log.Message{ID: "sdCheckLogs", EvaluatedText: fmt.Sprintf("Checking journalctl logs for '%s' service", unit.Name)}
36
-			d.Log.LogMessage(log.InfoLevel, checkMessage)
37
-			infos = append(infos, checkMessage)
43
+			r.Infof("sdCheckLogs", "Checking journalctl logs for '%s' service", unit.Name)
38 44
 
39 45
 			cmd := exec.Command("journalctl", "-ru", unit.Name, "--output=json")
40 46
 			// JSON comes out of journalctl one line per record
... ...
@@ -50,60 +56,54 @@ func (d AnalyzeLogs) Check() (bool, []log.Message, []error, []error) {
50 50
 			}(cmd)
51 51
 
52 52
 			if err != nil {
53
-				diagnosticError := diagnostic.NewDiagnosticError("sdLogReadErr", fmt.Sprintf(sdLogReadErr, unit.Name, errStr(err)), err)
54
-				d.Log.Error(diagnosticError.ID, diagnosticError.Explanation)
55
-				errors = append(errors, diagnosticError)
56
-
57
-				return false, infos, warnings, errors
53
+				r.Errorf("sdLogReadErr", err, sdLogReadErr, unit.Name, errStr(err))
54
+				return r
58 55
 			}
59 56
 			defer func() { // close out pipe once done reading
60 57
 				reader.Close()
61 58
 				cmd.Wait()
62 59
 			}()
63
-			entryTemplate := logEntry{Message: `json:"MESSAGE"`}
60
+			timeLimit := time.Now().Add(-time.Hour)                     // entries older than an hour are probably not relevant
64 61
 			matchCopy := append([]logMatcher(nil), unit.LogMatchers...) // make a copy, will remove matchers after they match something
65
-			for lineReader.Scan() {                                     // each log entry is a line
62
+			lineCount := 0                                              // journalctl emits one log entry per line
63
+			for lineReader.Scan() {
64
+				lineCount += 1
66 65
 				if len(matchCopy) == 0 { // if no rules remain to match
67 66
 					break // don't waste time reading more log entries
68 67
 				}
69
-				bytes, entry := lineReader.Bytes(), entryTemplate
68
+				bytes, entry := lineReader.Bytes(), logEntry{}
70 69
 				if err := json.Unmarshal(bytes, &entry); err != nil {
71
-					badJSONMessage := log.Message{ID: "sdLogBadJSON", EvaluatedText: fmt.Sprintf("Couldn't read the JSON for this log message:\n%s\nGot error %s", string(bytes), errStr(err))}
72
-					d.Log.LogMessage(log.DebugLevel, badJSONMessage)
73
-
70
+					r.Debugf("sdLogBadJSON", "Couldn't read the JSON for this log message:\n%s\nGot error %s", string(bytes), errStr(err))
74 71
 				} else {
72
+					if lineCount > 500 && stampTooOld(entry.TimeStamp, timeLimit) {
73
+						r.Debugf("sdLogTrunc", "Stopped reading %s log: timestamp %s too old", unit.Name, entry.TimeStamp)
74
+						break // if we've analyzed at least 500 entries, stop when age limit reached (don't scan days of logs)
75
+					}
75 76
 					if unit.StartMatch.MatchString(entry.Message) {
76
-						break // saw the log message where the unit started; done looking.
77
+						break // saw log message for unit startup; don't analyze previous logs
77 78
 					}
78 79
 					for index, match := range matchCopy { // match log message against provided matchers
79 80
 						if strings := match.Regexp.FindStringSubmatch(entry.Message); strings != nil {
80 81
 							// if matches: print interpretation, remove from matchCopy, and go on to next log entry
81
-							keep := match.KeepAfterMatch
82
-							if match.Interpret != nil {
83
-								currKeep, currInfos, currWarnings, currErrors := match.Interpret(d.Log, &entry, strings)
82
+							keep := match.KeepAfterMatch // generic keep logic
83
+							if match.Interpret != nil {  // apply custom match logic
84
+								currKeep, result := match.Interpret(&entry, strings)
84 85
 								keep = currKeep
85
-								infos = append(infos, currInfos...)
86
-								warnings = append(warnings, currWarnings...)
87
-								errors = append(errors, currErrors...)
88
-
89
-							} else {
90
-								text := fmt.Sprintf("Found '%s' journald log message:\n  %s\n", unit.Name, entry.Message) + match.Interpretation
91
-								message := log.Message{ID: match.Id, EvaluatedText: text, TemplateData: map[string]string{"unit": unit.Name, "logMsg": entry.Message}}
92
-								d.Log.LogMessage(match.Level, message)
93
-								diagnosticError := diagnostic.NewDiagnosticError(match.Id, text, nil)
86
+								r.Append(result)
87
+							} else { // apply generic match processing
88
+								template := "Found '{{.unit}}' journald log message:\n  {{.logMsg}}\n{{.interpretation}}"
89
+								templateData := log.Hash{"unit": unit.Name, "logMsg": entry.Message, "interpretation": match.Interpretation}
94 90
 
95 91
 								switch match.Level {
96
-								case log.InfoLevel, log.NoticeLevel:
97
-									infos = append(infos, message)
98
-
92
+								case log.DebugLevel:
93
+									r.Debugt(match.Id, template, templateData)
94
+								case log.InfoLevel:
95
+									r.Infot(match.Id, template, templateData)
99 96
 								case log.WarnLevel:
100
-									warnings = append(warnings, diagnosticError)
101
-
97
+									r.Warnt(match.Id, nil, template, templateData)
102 98
 								case log.ErrorLevel:
103
-									errors = append(errors, diagnosticError)
104
-
99
+									r.Errort(match.Id, nil, template, templateData)
105 100
 								}
106
-
107 101
 							}
108 102
 
109 103
 							if !keep { // remove matcher once seen
... ...
@@ -118,11 +118,12 @@ func (d AnalyzeLogs) Check() (bool, []log.Message, []error, []error) {
118 118
 		}
119 119
 	}
120 120
 
121
-	return (len(errors) == 0), infos, warnings, errors
121
+	return r
122 122
 }
123 123
 
124
-const (
125
-	sdLogReadErr = `Diagnostics failed to query journalctl for the '%s' unit logs.
126
-This should be very unusual, so please report this error:
127
-%s`
128
-)
124
+func stampTooOld(stamp string, timeLimit time.Time) bool {
125
+	if epochus, err := strconv.ParseInt(stamp, 10, 64); err == nil {
126
+		return time.Unix(epochus/1000000, 0).Before(timeLimit)
127
+	}
128
+	return true // something went wrong, stop looking...
129
+}
... ...
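journald reports __REALTIME_TIMESTAMP in microseconds since the epoch, hence the division by 1e6 before time.Unix. A quick in-package sanity check of the cutoff logic (values synthesized for illustration):

    limit := time.Now().Add(-time.Hour)
    stamp := strconv.FormatInt(time.Now().Add(-2*time.Hour).UnixNano()/1000, 10) // microseconds, two hours old
    fmt.Println(stampTooOld(stamp, limit)) // true: older than the one-hour window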
@@ -12,7 +12,7 @@ import (
12 12
 func GetSystemdUnits(logger *log.Logger) map[string]types.SystemdUnit {
13 13
 	systemdUnits := map[string]types.SystemdUnit{}
14 14
 
15
-	logger.Notice("discBegin", "Beginning systemd discovery")
15
+	logger.Notice("discBeginSysd", "Performing systemd discovery")
16 16
 	for _, name := range []string{"openshift", "openshift-master", "openshift-node", "openshift-sdn-master", "openshift-sdn-node", "docker", "openvswitch", "iptables", "etcd", "kubernetes"} {
17 17
 		systemdUnits[name] = discoverSystemdUnit(logger, name)
18 18
 
... ...
@@ -5,11 +5,12 @@ import (
5 5
 
6 6
 	"fmt"
7 7
 	"github.com/openshift/origin/pkg/diagnostics/log"
8
-	"github.com/openshift/origin/pkg/diagnostics/types/diagnostic"
8
+	"github.com/openshift/origin/pkg/diagnostics/types"
9 9
 )
10 10
 
11 11
 type logEntry struct {
12
-	Message string // I feel certain we will want more fields at some point
12
+	Message   string `json:"MESSAGE"`
13
+	TimeStamp string `json:"__REALTIME_TIMESTAMP"` // microseconds since the epoch
13 14
 }
14 15
 
15 16
 type logMatcher struct { // regex for scanning log messages and interpreting them when found
... ...
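journalctl --output=json emits one JSON object per line; only the two fields tagged above are decoded, and any other fields in the record are ignored. For example, from inside this package (record contents illustrative):

    line := []byte(`{"MESSAGE":"Starting an OpenShift node","__REALTIME_TIMESTAMP":"1437409508000000","_SYSTEMD_UNIT":"openshift-node.service"}`)
    var entry logEntry
    if err := json.Unmarshal(line, &entry); err == nil {
    	fmt.Println(entry.Message, entry.TimeStamp) // Starting an OpenShift node 1437409508000000
    }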
@@ -19,10 +20,9 @@ type logMatcher struct { // regex for scanning log messages and interpreting the
19 19
 	Interpretation string // log with above level+id if it's simple
20 20
 	KeepAfterMatch bool   // usually note only first matched entry, ignore rest
21 21
 	Interpret      func(  // run this for custom logic on match
22
-		logger *log.Logger,
23 22
 		entry *logEntry,
24 23
 		matches []string,
25
-	) (bool, []log.Message, []error, []error) // KeepAfterMatch?
24
+	) (bool /* KeepAfterMatch? */, *types.DiagnosticResult)
26 25
 }
27 26
 
28 27
 type unitSpec struct {
... ...
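Under the new signature a custom Interpret builds and returns its own DiagnosticResult instead of writing to a shared logger, and the boolean return decides whether the matcher stays active. A minimal in-package sketch (regex, ID, and message are illustrative, not from this commit):

    var exampleMatcher = logMatcher{
    	Regexp: regexp.MustCompile(`level=error msg="(.*)"`),
    	Level:  log.WarnLevel,
    	Interpret: func(entry *logEntry, matches []string) (bool, *types.DiagnosticResult) {
    		r := types.NewDiagnosticResult("example.journald")
    		r.Warnf("sdLogExample", nil, "daemon reported an error: %s", matches[1])
    		return false, r // false: remove this matcher after its first hit
    	},
    }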
@@ -32,8 +32,8 @@ type unitSpec struct {
32 32
 }
33 33
 
34 34
 //
35
-// -------- Things that feed into the diagnostics definitions -----------
36
-// Search for Diagnostics for the actual diagnostics.
35
+// -------- These are things that feed into the diagnostics definitions -----------
36
+//
37 37
 
38 38
 // Reusable log matchers:
39 39
 var badImageTemplate = logMatcher{
... ...
@@ -81,15 +81,15 @@ logs after the node is actually available.`,
81 81
 				// TODO: don't rely on ipv4 format, should be ipv6 "soon"
82 82
 				Regexp: regexp.MustCompile("http: TLS handshake error from ([\\d.]+):\\d+: remote error: bad certificate"),
83 83
 				Level:  log.WarnLevel,
84
-				Interpret: func(logger *log.Logger, entry *logEntry, matches []string) (bool, []log.Message, []error, []error) {
85
-					warnings := []error{}
84
+				Interpret: func(entry *logEntry, matches []string) (bool, *types.DiagnosticResult) {
85
+					r := types.NewDiagnosticResult("openshift-master.journald")
86 86
 
87 87
 					client := matches[1]
88 88
 					prelude := fmt.Sprintf("Found 'openshift-master' journald log message:\n  %s\n", entry.Message)
89 89
 					if tlsClientErrorSeen == nil { // first time this message was seen
90 90
 						tlsClientErrorSeen = map[string]bool{client: true}
91 91
 						// TODO: too generic, adjust message depending on subnet of the "from" address
92
-						diagnosticError := diagnostic.NewDiagnosticError("sdLogOMreBadCert", prelude+`
92
+						r.Warn("sdLogOMreBadCert", nil, prelude+`
93 93
 This error indicates that a client attempted to connect to the master
94 94
 HTTPS API server but broke off the connection because the master's
95 95
 certificate is not validated by a cerificate authority (CA) acceptable
... ...
@@ -127,21 +127,13 @@ log message:
127 127
   (so this message may simply indicate that the master generated a new
128 128
   server certificate, e.g. to add a different --public-master, and a
129 129
   browser hasn't accepted it yet and is still attempting API calls;
130
-  try logging out of the console and back in again).`, nil)
131
-
132
-						message := log.Message{ID: diagnosticError.ID, EvaluatedText: diagnosticError.Explanation, TemplateData: map[string]string{"client": client}}
133
-						logger.LogMessage(log.WarnLevel, message)
134
-						warnings = append(warnings, diagnosticError)
130
+  try logging out of the console and back in again).`)
135 131
 
136 132
 					} else if !tlsClientErrorSeen[client] {
137 133
 						tlsClientErrorSeen[client] = true
138
-						diagnosticError := diagnostic.NewDiagnosticError("sdLogOMreBadCert", prelude+`This message was diagnosed above, but for a different client address.`, nil)
139
-						message := log.Message{ID: diagnosticError.ID, EvaluatedText: diagnosticError.Explanation, TemplateData: map[string]string{"client": client}}
140
-						logger.LogMessage(log.WarnLevel, message)
141
-						warnings = append(warnings, diagnosticError)
142
-
134
+						r.Warn("sdLogOMreBadCert", nil, prelude+`This message was diagnosed above, but for a different client address.`)
143 135
 					} // else, it's a repeat, don't mention it
144
-					return true, nil, warnings, nil // show once for every client failing to connect, not just the first
136
+					return true /* show once for every client failing to connect, not just the first */, r
145 137
 				},
146 138
 			},
147 139
 			{
... ...
@@ -167,11 +159,6 @@ message for any node with this problem.
167 167
 		},
168 168
 	},
169 169
 	{
170
-		Name:        "openshift-sdn-master",
171
-		StartMatch:  regexp.MustCompile("Starting OpenShift SDN Master"),
172
-		LogMatchers: []logMatcher{},
173
-	},
174
-	{
175 170
 		Name:       "openshift-node",
176 171
 		StartMatch: regexp.MustCompile("Starting an OpenShift node"),
177 172
 		LogMatchers: []logMatcher{
... ...
@@ -236,25 +223,19 @@ to the .kubeconfig specified in /etc/sysconfig/openshift-node
236 236
 This host will not function as a node until this is resolved. Pods
237 237
 scheduled for this node will remain in pending or unknown state forever.`,
238 238
 			},
239
-		},
240
-	},
241
-	{
242
-		Name:       "openshift-sdn-node",
243
-		StartMatch: regexp.MustCompile("Starting OpenShift SDN node"),
244
-		LogMatchers: []logMatcher{
245 239
 			{
246 240
 				Regexp: regexp.MustCompile("Could not find an allocated subnet for this minion.*Waiting.."),
247 241
 				Level:  log.WarnLevel,
248 242
 				Id:     "sdLogOSNnoSubnet",
249 243
 				Interpretation: `
250
-This warning occurs when openshift-sdn-node is trying to request the
244
+This warning occurs when openshift-node is trying to request the
251 245
 SDN subnet it should be configured with according to openshift-sdn-master,
252 246
 but either can't connect to it ("All the given peers are not reachable")
253 247
 or has not yet been assigned a subnet ("Key not found").
254 248
 
255 249
 This can just be a matter of waiting for the master to become fully
256 250
 available and define a record for the node (aka "minion") to use,
257
-and openshift-sdn-node will wait until that occurs, so the presence
251
+and openshift-node will wait until that occurs, so the presence
258 252
 of this message in the node log isn't necessarily a problem as
259 253
 long as the SDN is actually working, but this message may help indicate
260 254
 the problem if it is not working.
... ...
@@ -262,8 +243,8 @@ the problem if it is not working.
262 262
 If the master is available and this node's record is defined and this
263 263
 message persists, then it may be a sign of a different misconfiguration.
264 264
 Unfortunately the message is not specific about why the connection failed.
265
-Check MASTER_URL in /etc/sysconfig/openshift-sdn-node:
266
- * Is the protocol https? It should be http.
265
+Check the master's URL in the node configuration.
266
+ * Is the protocol http? It should be https.
267 267
  * Can you reach the address and port from the node using curl?
268 268
    ("404 page not found" is correct response)`,
269 269
 			},
... ...
@@ -8,14 +8,15 @@ import (
8 8
 
9 9
 	"github.com/openshift/origin/pkg/diagnostics/log"
10 10
 	"github.com/openshift/origin/pkg/diagnostics/types"
11
-	"github.com/openshift/origin/pkg/diagnostics/types/diagnostic"
12 11
 )
13 12
 
14 13
 // UnitStatus
15 14
 type UnitStatus struct {
16 15
 	SystemdUnits map[string]types.SystemdUnit
16
+}
17 17
 
18
-	Log *log.Logger
18
+func (d UnitStatus) Name() string {
19
+	return "UnitStatus"
19 20
 }
20 21
 
21 22
 func (d UnitStatus) Description() string {
... ...
@@ -30,67 +31,33 @@ func (d UnitStatus) CanRun() (bool, error) {
30 30
 
31 31
 	return false, errors.New("systemd is not present on this host")
32 32
 }
33
-func (d UnitStatus) Check() (bool, []log.Message, []error, []error) {
34
-	if _, err := d.CanRun(); err != nil {
35
-		return false, nil, nil, []error{err}
36
-	}
37
-
38
-	warnings := []error{}
39
-	errors := []error{}
40
-
41
-	unitWarnings, unitErrors := unitRequiresUnit(d.Log, d.SystemdUnits["openshift-node"], d.SystemdUnits["iptables"], nodeRequiresIPTables)
42
-	warnings = append(warnings, unitWarnings...)
43
-	errors = append(errors, unitErrors...)
33
+func (d UnitStatus) Check() *types.DiagnosticResult {
34
+	r := types.NewDiagnosticResult("UnitStatus")
44 35
 
45
-	unitWarnings, unitErrors = unitRequiresUnit(d.Log, d.SystemdUnits["openshift-node"], d.SystemdUnits["docker"], `OpenShift nodes use Docker to run containers.`)
46
-	warnings = append(warnings, unitWarnings...)
47
-	errors = append(errors, unitErrors...)
48
-
49
-	unitWarnings, unitErrors = unitRequiresUnit(d.Log, d.SystemdUnits["openshift"], d.SystemdUnits["docker"], `OpenShift nodes use Docker to run containers.`)
50
-	warnings = append(warnings, unitWarnings...)
51
-	errors = append(errors, unitErrors...)
52
-
53
-	// node's dependency on openvswitch is a special case.
54
-	// We do not need to enable ovs because openshift-node starts it for us.
55
-	if d.SystemdUnits["openshift-node"].Active && !d.SystemdUnits["openvswitch"].Active {
56
-		diagnosticError := diagnostic.NewDiagnosticError("sdUnitSDNreqOVS", sdUnitSDNreqOVS, nil)
57
-		d.Log.Error(diagnosticError.ID, diagnosticError.Explanation)
58
-		errors = append(errors, diagnosticError)
59
-	}
36
+	unitRequiresUnit(r, d.SystemdUnits["openshift-node"], d.SystemdUnits["iptables"], nodeRequiresIPTables)
37
+	unitRequiresUnit(r, d.SystemdUnits["openshift-node"], d.SystemdUnits["docker"], `OpenShift nodes use Docker to run containers.`)
38
+	unitRequiresUnit(r, d.SystemdUnits["openshift-node"], d.SystemdUnits["openvswitch"], sdUnitSDNreqOVS)
39
+	unitRequiresUnit(r, d.SystemdUnits["openshift-master"], d.SystemdUnits["openvswitch"], `OpenShift masters use openvswitch for access to cluster SDN networking`)
40
+	// all-in-one networking *could* be simpler, so fewer checks
41
+	unitRequiresUnit(r, d.SystemdUnits["openshift"], d.SystemdUnits["docker"], `OpenShift nodes use Docker to run containers.`)
60 42
 
61 43
 	// Anything that is enabled but not running deserves notice
62 44
 	for name, unit := range d.SystemdUnits {
63 45
 		if unit.Enabled && !unit.Active {
64
-			diagnosticError := diagnostic.NewDiagnosticErrorFromTemplate("sdUnitInactive", sdUnitInactive, map[string]string{"unit": name})
65
-			d.Log.LogMessage(log.ErrorLevel, *diagnosticError.LogMessage)
66
-			errors = append(errors, diagnosticError)
46
+			r.Errort("sdUnitInactive", nil, sdUnitInactive, log.Hash{"unit": name})
67 47
 		}
68 48
 	}
69
-
70
-	return (len(errors) == 0), nil, warnings, errors
49
+	return r
71 50
 }
72 51
 
73
-func unitRequiresUnit(logger *log.Logger, unit types.SystemdUnit, requires types.SystemdUnit, reason string) ([]error, []error) {
74
-	templateData := map[string]string{"unit": unit.Name, "required": requires.Name, "reason": reason}
52
+func unitRequiresUnit(r *types.DiagnosticResult, unit types.SystemdUnit, requires types.SystemdUnit, reason string) {
53
+	templateData := log.Hash{"unit": unit.Name, "required": requires.Name, "reason": reason}
75 54
 
76 55
 	if (unit.Active || unit.Enabled) && !requires.Exists {
77
-		diagnosticError := diagnostic.NewDiagnosticErrorFromTemplate("sdUnitReqLoaded", sdUnitReqLoaded, templateData)
78
-		logger.LogMessage(log.ErrorLevel, *diagnosticError.LogMessage)
79
-		return nil, []error{diagnosticError}
80
-
56
+		r.Errort("sdUnitReqLoaded", nil, sdUnitReqLoaded, templateData)
81 57
 	} else if unit.Active && !requires.Active {
82
-		diagnosticError := diagnostic.NewDiagnosticErrorFromTemplate("sdUnitReqActive", sdUnitReqActive, templateData)
83
-		logger.LogMessage(log.ErrorLevel, *diagnosticError.LogMessage)
84
-		return nil, []error{diagnosticError}
85
-
86
-	} else if unit.Enabled && !requires.Enabled {
87
-		diagnosticError := diagnostic.NewDiagnosticErrorFromTemplate("sdUnitReqEnabled", sdUnitReqEnabled, templateData)
88
-		logger.LogMessage(log.WarnLevel, *diagnosticError.LogMessage)
89
-		return []error{diagnosticError}, nil
90
-
58
+		r.Errort("sdUnitReqActive", nil, sdUnitReqActive, templateData)
91 59
 	}
92
-
93
-	return nil, nil
94 60
 }
95 61
 
96 62
 func errStr(err error) string {
... ...
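With Name/Description/CanRun/Check in place, UnitStatus and AnalyzeLogs both satisfy the types.Diagnostic interface, so a host diagnostic builder can assemble them uniformly. A sketch of the wiring (assumes a configured *log.Logger; running and draining results is sketched with the DiagnosticResult type further below):

    units := systemd.GetSystemdUnits(logger)
    diagnostics := []types.Diagnostic{
    	systemd.UnitStatus{SystemdUnits: units},
    	systemd.AnalyzeLogs{SystemdUnits: units},
    }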
@@ -156,12 +123,4 @@ To ensure it is not failing to run, check the status and logs with:
156 156
   # systemctl status {{.required}}
157 157
   # journalctl -ru {{.required}}
158 158
   `
159
-
160
-	sdUnitReqEnabled = `
161
-systemd unit {{.unit}} is enabled to run automatically at boot, but {{.required}} is not.
162
-{{.reason}}
163
-An administrator can enable the {{.required}} unit with:
164
-
165
-  # systemctl enable {{.required}}
166
-  `
167 159
 )
168 160
new file mode 100644
... ...
@@ -0,0 +1,175 @@
0
+package types
1
+
2
+import (
3
+	"fmt"
4
+	"github.com/golang/glog"
5
+	"runtime"
6
+	"strings"
7
+
8
+	"github.com/openshift/origin/pkg/diagnostics/log"
9
+)
10
+
11
+type Diagnostic interface {
12
+	Name() string
13
+	Description() string
14
+	CanRun() (canRun bool, reason error)
15
+	Check() *DiagnosticResult
16
+}
17
+
18
+type DiagnosticResult struct {
19
+	failure  bool
20
+	origin   string // name of diagnostic; automatically inserted into log Entries
21
+	logs     []log.Entry
22
+	warnings []DiagnosticError
23
+	errors   []DiagnosticError
24
+}
25
+
26
+func NewDiagnosticResult(origin string) *DiagnosticResult {
27
+	return &DiagnosticResult{origin: origin}
28
+}
29
+
30
+func (r *DiagnosticResult) Complete() *DiagnosticResult {
31
+	if r.errors == nil {
32
+		r.errors = make([]DiagnosticError, 0)
33
+	}
34
+	if r.warnings == nil {
35
+		r.warnings = make([]DiagnosticError, 0)
36
+	}
37
+	if r.logs == nil {
38
+		r.logs = make([]log.Entry, 0)
39
+	}
40
+	return r
41
+}
42
+
43
+func (r *DiagnosticResult) appendLogs(stackDepth int, entry ...log.Entry) {
44
+	if r.logs == nil {
45
+		r.logs = make([]log.Entry, 0)
46
+	}
47
+	r.logs = append(r.logs, entry...)
48
+	// glog immediately for debugging when a diagnostic silently chokes
49
+	for _, entry := range entry {
50
+		if glog.V(glog.Level(6 - entry.Level.Level)) {
51
+			glog.InfoDepth(stackDepth, entry.Message.String())
52
+		}
53
+	}
54
+}
55
+
56
+func (r *DiagnosticResult) Failure() bool {
57
+	return r.failure
58
+}
59
+
60
+func (r *DiagnosticResult) Logs() []log.Entry {
61
+	if r.logs == nil {
62
+		return make([]log.Entry, 0)
63
+	}
64
+	return r.logs
65
+}
66
+
67
+func (r *DiagnosticResult) appendWarnings(warn ...DiagnosticError) {
68
+	if r.warnings == nil {
69
+		r.warnings = make([]DiagnosticError, 0)
70
+	}
71
+	r.warnings = append(r.warnings, warn...)
72
+}
73
+
74
+func (r *DiagnosticResult) Warnings() []DiagnosticError {
75
+	if r.warnings == nil {
76
+		return make([]DiagnosticError, 0)
77
+	}
78
+	return r.warnings
79
+}
80
+
81
+func (r *DiagnosticResult) appendErrors(err ...DiagnosticError) {
82
+	if r.errors == nil {
83
+		r.errors = make([]DiagnosticError, 0)
84
+	}
85
+	r.failure = true
86
+	r.errors = append(r.errors, err...)
87
+}
88
+
89
+func (r *DiagnosticResult) Errors() []DiagnosticError {
90
+	if r.errors == nil {
91
+		return make([]DiagnosticError, 0)
92
+	}
93
+	return r.errors
94
+}
95
+
96
+func (r *DiagnosticResult) Append(r2 *DiagnosticResult) {
97
+	r.Complete()
98
+	r2.Complete()
99
+	r.logs = append(r.logs, r2.logs...)
100
+	r.warnings = append(r.warnings, r2.warnings...)
101
+	r.errors = append(r.errors, r2.errors...)
102
+	r.failure = r.failure || r2.failure
103
+}
104
+
105
+// basic ingress functions (private)
106
+func (r *DiagnosticResult) caller(depth int) string {
107
+	if _, file, line, ok := runtime.Caller(depth + 1); ok {
108
+		paths := strings.SplitAfter(file, "github.com/")
109
+		return fmt.Sprintf("diagnostic %s@%s:%d", r.origin, paths[len(paths)-1], line)
110
+	}
111
+	return "diagnostic " + r.origin
112
+}
113
+func (r *DiagnosticResult) logError(id string, err error, msg *log.Message) {
114
+	r.appendLogs(2, log.Entry{id, r.caller(2), log.ErrorLevel, *msg})
115
+	if de, ok := err.(DiagnosticError); ok {
116
+		r.appendErrors(de)
117
+	} else {
118
+		r.appendErrors(DiagnosticError{id, msg, err})
119
+	}
120
+}
121
+func (r *DiagnosticResult) logWarning(id string, err error, msg *log.Message) {
122
+	r.appendLogs(2, log.Entry{id, r.caller(2), log.WarnLevel, *msg})
123
+	if de, ok := err.(DiagnosticError); ok {
124
+		r.appendWarnings(de)
125
+	} else {
126
+		r.appendWarnings(DiagnosticError{id, msg, err})
127
+	}
128
+}
129
+func (r *DiagnosticResult) logMessage(id string, level log.Level, msg *log.Message) {
130
+	r.appendLogs(2, log.Entry{id, r.caller(2), level, *msg})
131
+}
132
+
133
+// Public ingress functions
134
+// Errors are recorded as errors and also logged
135
+func (r *DiagnosticResult) Error(id string, err error, text string) {
136
+	r.logError(id, err, &log.Message{id, "", nil, text})
137
+}
138
+func (r *DiagnosticResult) Errorf(id string, err error, format string, a ...interface{}) {
139
+	r.logError(id, err, &log.Message{id, "", nil, fmt.Sprintf(format, a...)})
140
+}
141
+func (r *DiagnosticResult) Errort(id string, err error, template string, data interface{} /* log.Hash */) {
142
+	r.logError(id, err, &log.Message{id, template, data, ""})
143
+}
144
+
145
+// Warnings are recorded as warnings and also logged
146
+func (r *DiagnosticResult) Warn(id string, err error, text string) {
147
+	r.logWarning(id, err, &log.Message{id, "", nil, text})
148
+}
149
+func (r *DiagnosticResult) Warnf(id string, err error, format string, a ...interface{}) {
150
+	r.logWarning(id, err, &log.Message{id, "", nil, fmt.Sprintf(format, a...)})
151
+}
152
+func (r *DiagnosticResult) Warnt(id string, err error, template string, data interface{} /* log.Hash */) {
153
+	r.logWarning(id, err, &log.Message{id, template, data, ""})
154
+}
155
+
156
+// Info/Debug are just logged.
157
+func (r *DiagnosticResult) Info(id string, text string) {
158
+	r.logMessage(id, log.InfoLevel, &log.Message{id, "", nil, text})
159
+}
160
+func (r *DiagnosticResult) Infof(id string, format string, a ...interface{}) {
161
+	r.logMessage(id, log.InfoLevel, &log.Message{id, "", nil, fmt.Sprintf(format, a...)})
162
+}
163
+func (r *DiagnosticResult) Infot(id string, template string, data interface{} /* log.Hash */) {
164
+	r.logMessage(id, log.InfoLevel, &log.Message{id, template, data, ""})
165
+}
166
+func (r *DiagnosticResult) Debug(id string, text string) {
167
+	r.logMessage(id, log.DebugLevel, &log.Message{id, "", nil, text})
168
+}
169
+func (r *DiagnosticResult) Debugf(id string, format string, a ...interface{}) {
170
+	r.logMessage(id, log.DebugLevel, &log.Message{id, "", nil, fmt.Sprintf(format, a...)})
171
+}
172
+func (r *DiagnosticResult) Debugt(id string, template string, data interface{} /* log.Hash */) {
173
+	r.logMessage(id, log.DebugLevel, &log.Message{id, template, data, ""})
174
+}
0 175
deleted file mode 100644
... ...
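With every Check accumulating into its own result, a runner can execute diagnostics independently (eventually in parallel) and drain logs and counts afterward; the new Summary(warnings, errors) signature fits that flow. A minimal sketch (the RunDiagnostics helper is illustrative, not part of this commit):

    func RunDiagnostics(logger *log.Logger, diagnostics []Diagnostic) {
    	warnings, errors := 0, 0
    	for _, d := range diagnostics {
    		if ok, reason := d.CanRun(); !ok {
    			logger.Noticef("diagSkip", "Skipping %s: %v", d.Name(), reason)
    			continue
    		}
    		r := d.Check()
    		for _, entry := range r.Logs() { // replay the diagnostic's entries through the logger
    			logger.LogEntry(entry)
    		}
    		warnings += len(r.Warnings())
    		errors += len(r.Errors())
    	}
    	logger.Summary(warnings, errors)
    }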
@@ -1,55 +0,0 @@
1
-package diagnostic
2
-
3
-// This needed to be separate from other types to avoid import cycle
4
-// diagnostic -> discovery -> types
5
-
6
-import (
7
-	"fmt"
8
-
9
-	"github.com/openshift/origin/pkg/diagnostics/log"
10
-)
11
-
12
-type Diagnostic interface {
13
-	Description() string
14
-	CanRun() (canRun bool, reason error)
15
-	Check() (success bool, info []log.Message, warnings []error, errors []error)
16
-}
17
-
18
-type DiagnosticError struct {
19
-	ID          string
20
-	Explanation string
21
-	Cause       error
22
-
23
-	LogMessage *log.Message
24
-}
25
-
26
-func NewDiagnosticError(id, explanation string, cause error) DiagnosticError {
27
-	return DiagnosticError{id, explanation, cause, nil}
28
-}
29
-
30
-func NewDiagnosticErrorFromTemplate(id, template string, templateData interface{}) DiagnosticError {
31
-	return DiagnosticError{id, "", nil,
32
-		&log.Message{
33
-			ID:           id,
34
-			Template:     template,
35
-			TemplateData: templateData,
36
-		},
37
-	}
38
-}
39
-
40
-func (e DiagnosticError) Error() string {
41
-	if e.Cause != nil {
42
-		return e.Cause.Error()
43
-	}
44
-
45
-	if e.LogMessage != nil {
46
-		return fmt.Sprintf("%v", e.LogMessage)
47
-	}
48
-
49
-	return e.Explanation
50
-}
51
-
52
-func IsDiagnosticError(e error) bool {
53
-	_, ok := e.(DiagnosticError)
54
-	return ok
55
-}
56 1
new file mode 100644
... ...
@@ -0,0 +1,36 @@
0
+package types
1
+
2
+import (
3
+	"fmt"
4
+
5
+	"github.com/openshift/origin/pkg/diagnostics/log"
6
+)
7
+
8
+type DiagnosticError struct {
9
+	ID         string
10
+	LogMessage *log.Message
11
+	Cause      error
12
+}
13
+
14
+func (e DiagnosticError) Error() string {
15
+	if e.LogMessage != nil {
16
+		return fmt.Sprintf("%v", e.LogMessage)
17
+	}
18
+	if e.Cause != nil {
19
+		return e.Cause.Error()
20
+	}
21
+	return e.ID
22
+}
23
+
24
+func IsDiagnosticError(e error) bool {
25
+	_, ok := e.(DiagnosticError)
26
+	return ok
27
+}
28
+
29
+// is the error a diagnostics error that matches the given ID?
30
+func MatchesDiagError(err error, id string) bool {
31
+	if derr, ok := err.(DiagnosticError); ok && derr.ID == id {
32
+		return true
33
+	}
34
+	return false
35
+}
0 36
deleted file mode 100644
... ...
@@ -1,38 +0,0 @@
1
-package types
2
-
3
-import "fmt"
4
-
5
-type Version struct {
6
-	X, Y, Z int
7
-}
8
-
9
-func (a Version) Eq(b Version) bool {
10
-	return a.X == b.X && a.Y == b.Y && a.Z == b.Z
11
-}
12
-
13
-func (a Version) Gt(b Version) bool {
14
-	if a.X > b.X {
15
-		return true
16
-	}
17
-	if a.X < b.X {
18
-		return false
19
-	} // so, Xs are equal
20
-	if a.Y > b.Y {
21
-		return true
22
-	}
23
-	if a.Y < b.Y {
24
-		return false
25
-	} // so, Ys are equal
26
-	if a.Z > b.Z {
27
-		return true
28
-	}
29
-	return false
30
-}
31
-
32
-func (v Version) GoString() string {
33
-	return fmt.Sprintf("%d.%d.%d", v.X, v.Y, v.Z)
34
-}
35
-
36
-func (v Version) NonZero() bool {
37
-	return !v.Eq(Version{0, 0, 0})
38
-}
... ...
@@ -4392,6 +4392,36 @@ _openshift_ex_build-chain()
4392 4392
     must_have_one_noun=()
4393 4393
 }
4394 4394
 
4395
+_openshift_ex_diagnostics()
4396
+{
4397
+    last_command="openshift_ex_diagnostics"
4398
+    commands=()
4399
+
4400
+    flags=()
4401
+    two_word_flags=()
4402
+    flags_with_completion=()
4403
+    flags_completion=()
4404
+
4405
+    flags+=("--cluster-context=")
4406
+    flags+=("--config=")
4407
+    flags+=("--context=")
4408
+    flags+=("--diaglevel=")
4409
+    two_word_flags+=("-l")
4410
+    flags+=("--diagnostics=")
4411
+    two_word_flags+=("-d")
4412
+    flags+=("--help")
4413
+    flags+=("-h")
4414
+    flags+=("--host")
4415
+    flags+=("--loglevel=")
4416
+    flags+=("--master-config=")
4417
+    flags+=("--node-config=")
4418
+    flags+=("--output=")
4419
+    two_word_flags+=("-o")
4420
+
4421
+    must_have_one_flag=()
4422
+    must_have_one_noun=()
4423
+}
4424
+
4395 4425
 _openshift_ex_options()
4396 4426
 {
4397 4427
     last_command="openshift_ex_options"
... ...
@@ -4416,6 +4446,7 @@ _openshift_ex()
4416 4416
     commands+=("tokens")
4417 4417
     commands+=("ipfailover")
4418 4418
     commands+=("build-chain")
4419
+    commands+=("diagnostics")
4419 4420
     commands+=("options")
4420 4421
 
4421 4422
     flags=()
4422 4423
new file mode 100644
... ...
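The completion above reflects the unified command this refactor introduces; a typical invocation might be "openshift ex diagnostics --diaglevel=1 --diagnostics=AnalyzeLogs,UnitStatus --output=json" (flag values are illustrative).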
@@ -0,0 +1,73 @@
0
+// +build integration,!no-etcd
1
+
2
+package integration
3
+
4
+import (
5
+	"testing"
6
+
7
+	kapi "github.com/GoogleCloudPlatform/kubernetes/pkg/api"
8
+
9
+	clusterdiags "github.com/openshift/origin/pkg/diagnostics/cluster"
10
+	diagtype "github.com/openshift/origin/pkg/diagnostics/types"
11
+	testutil "github.com/openshift/origin/test/util"
12
+)
13
+
14
+func TestDiagNodeConditions(t *testing.T) {
15
+	//masterConfig, clientFile, err := testutil.StartTestAllInOne()
16
+	_, clientFile, err := testutil.StartTestMaster()
17
+	if err != nil {
18
+		t.Fatalf("unexpected error: %v", err)
19
+	}
20
+	client, err := testutil.GetClusterAdminKubeClient(clientFile)
21
+	if err != nil {
22
+		t.Fatalf("unexpected error: %v", err)
23
+	}
24
+
25
+	nodeDiag := clusterdiags.NodeDefinitions{KubeClient: client}
26
+	// First check with no nodes defined; should get an error about that.
27
+	// Check() now returns a result object rather than (ok, logs, warnings, errors).
28
+	if errors := nodeDiag.Check().Errors(); len(errors) != 1 ||
29
+		!diagtype.MatchesDiagError(errors[0], "clNoAvailNodes") {
30
+		t.Errorf("expected 1 error about not having nodes, not: %#v", errors)
31
+	}
32
+
33
+	// Next create a node and leave it in NotReady state. Should get a warning
34
+	// about that, plus the previous error as there are still no nodes available.
35
+	node, err := client.Nodes().Create(&kapi.Node{ObjectMeta: kapi.ObjectMeta{Name: "test-node"}})
36
+	if err != nil {
37
+		t.Fatalf("expected no errors creating a node: %#v", err)
38
+	}
39
+	result := nodeDiag.Check()
40
+	if errors := result.Errors(); len(errors) != 1 ||
41
+		!diagtype.MatchesDiagError(errors[0], "clNoAvailNodes") {
42
+		t.Fatalf("expected 1 error about not having nodes, not: %#v", errors)
43
+	} else if warnings := result.Warnings(); len(warnings) < 1 || !diagtype.MatchesDiagError(warnings[0], "clNodeNotReady") {
44
+		t.Fatalf("expected a warning about test-node not being ready, not: %#v", warnings)
45
+	}
46
+
47
+	_ = node
48
+	/*
49
+		// Put the new node in Ready state and verify the diagnostic is clean
50
+		if _, err := client.Nodes().UpdateStatus(node); err != nil {
51
+			t.Fatalf("expected no errors updating node status, but: %#v", err)
52
+		}
53
+		result = nodeDiag.Check()
54
+		if warnings := result.Warnings(); len(warnings) > 0 {
55
+			t.Fatalf("expected no warning with one node ready, but: %#v", warnings)
56
+		} else if errors := result.Errors(); len(errors) > 0 {
57
+			t.Fatalf("expected no errors with one node ready, but: %#v", errors)
58
+		}
59
+
60
+		// Make the node unschedulable and verify diagnostics notices
61
+		node.Spec.Unschedulable = true
62
+		if _, err := client.Nodes().Update(node); err != nil {
63
+			t.Fatalf("expected no errors making node unschedulable, but: %#v", err)
64
+		}
65
+		if errors := result.Errors(); len(errors) != 1 ||
66
+			!diagtype.MatchesDiagError(errors[0], "clNoAvailNodes") {
67
+			t.Fatalf("expected 1 error about not having nodes, but: %#v", errors)
68
+		} else if warnings := result.Warnings(); len(warnings) < 1 || !diagtype.MatchesDiagError(warnings[0], "clNodeNotSched") {
69
+			t.Fatalf("expected a warning about test-node not being schedulable, but: %#v", warnings)
70
+		}
71
+	*/
72
+}