Merge branch '19818-api-pydoc'

[arvados.git] / tools / crunchstat-summary / crunchstat_summary / summarizer.py
diff --git a/tools/crunchstat-summary/crunchstat_summary/summarizer.py b/tools/crunchstat-summary/crunchstat_summary/summarizer.py

index d99d3c1cf8324c4dd33f9bcdd72a15fa4f015d7c..2bd329719bec70300d268b06bb6abe8e3abf245c 100644 (file)
--- a/tools/crunchstat-summary/crunchstat_summary/summarizer.py
+++ b/tools/crunchstat-summary/crunchstat_summary/summarizer.py
@@ -15,7 +15,6 @@ import sys
  import threading
  import _strptime
  
-from arvados.api import OrderedJsonModel
  from crunchstat_summary import logger
  
  # Recommend memory constraints that are this multiple of an integral
@@ -105,7 +104,7 @@ class Summarizer(object):
                                         self.label, uuid)
                          continue
                      logger.debug('%s: follow %s', self.label, uuid)
-                    child_summarizer = ProcessSummarizer(uuid)
+                    child_summarizer = NewSummarizer(uuid)
                      child_summarizer.stats_max = self.stats_max
                      child_summarizer.task_stats = self.task_stats
                      child_summarizer.tasks = self.tasks
@@ -245,6 +244,27 @@ class Summarizer(object):
                      self.job_tot[category][stat] += val
          logger.debug('%s: done totals', self.label)
  
+        # Warn once for each expected stat category that no task reported.
+        # A key ending in ':' is matched as a category prefix, others exactly.
+        missing_category = {
+            'cpu': 'CPU',
+            'mem': 'memory',
+            'net:': 'network I/O',
+            'statfs': 'storage space',
+        }
+        seen = set()
+        for task_stat in self.task_stats.values():
+            seen.update(task_stat.keys())
+        for checkcat, catlabel in missing_category.items():
+            if checkcat.endswith(':'):
+                found = any(cat.startswith(checkcat) for cat in seen)
+            else:
+                found = checkcat in seen
+            if not found:
+                logger.warning(
+                    '%s: %s stats are missing -- possible cluster configuration issue',
+                    self.label, catlabel)
+
      def long_label(self):
          label = self.label
          if hasattr(self, 'process') and self.process['uuid'] not in label:
@@ -364,7 +384,7 @@ class Summarizer(object):
                  constraint_key,
                  int(used_cores))
  
-    # FIXME: This needs to be updated to account for current nodemanager algorithms
+    # FIXME: This needs to be updated to account for current arvados-dispatch-cloud (a-d-c) algorithms
      def _recommend_ram(self):
          """Recommend an economical RAM constraint for this job.
  
@@ -497,7 +517,7 @@ def NewSummarizer(process_or_uuid, **kwargs):
      else:
          uuid = process_or_uuid
          process = None
-        arv = arvados.api('v1', model=OrderedJsonModel())
+        arv = arvados.api('v1')
  
      if '-dz642-' in uuid:
          if process is None:
@@ -526,7 +546,7 @@ def NewSummarizer(process_or_uuid, **kwargs):
  
  
  class ProcessSummarizer(Summarizer):
-    """Process is a job, pipeline, container, or container request."""
+    """Process is a job, pipeline, or container request."""
  
      def __init__(self, process, label=None, **kwargs):
          rdr = None
@@ -535,17 +555,16 @@ class ProcessSummarizer(Summarizer):
              label = self.process.get('name', self.process['uuid'])
          # Pre-Arvados v1.4 everything is in 'log'
          # For 1.4+ containers have no logs and container_requests have them in 'log_uuid', not 'log'
-        log_collection = self.process.get('log')
-        if not log_collection:
-            log_collection = self.process.get('log_uuid')
-        if log_collection:
+        log_collection = self.process.get('log') or self.process.get('log_uuid')  # 'log' may be present but empty
+        if log_collection and self.process.get('state') != 'Uncommitted': # arvados.util.CR_UNCOMMITTED:
              try:
                  rdr = crunchstat_summary.reader.CollectionReader(log_collection)
              except arvados.errors.NotFoundError as e:
                  logger.warning("Trying event logs after failing to read "
-                                "log collection %s: %s", self.process['log'], e)
+                                "log collection %s: %s", log_collection, e)
          if rdr is None:
-            rdr = crunchstat_summary.reader.LiveLogReader(self.process['uuid'])
+            uuid = self.process.get('container_uuid') or self.process.get('uuid')  # container_uuid may be null
+            rdr = crunchstat_summary.reader.LiveLogReader(uuid)
              label = label + ' (partial)'
          super(ProcessSummarizer, self).__init__(rdr, label=label, **kwargs)
          self.existing_constraints = self.process.get('runtime_constraints', {})
@@ -619,7 +638,7 @@ class MultiSummarizer(object):
  class JobTreeSummarizer(MultiSummarizer):
      """Summarizes a job and all children listed in its components field."""
      def __init__(self, job, label=None, **kwargs):
-        arv = arvados.api('v1', model=OrderedJsonModel())
+        arv = arvados.api('v1')
          label = label or job.get('name', job['uuid'])
          children = collections.OrderedDict()
          children[job['uuid']] = JobSummarizer(job, label=label, **kwargs)
@@ -663,7 +682,7 @@ class PipelineSummarizer(MultiSummarizer):
  
  class ContainerRequestTreeSummarizer(MultiSummarizer):
      def __init__(self, root, skip_child_jobs=False, **kwargs):
-        arv = arvados.api('v1', model=OrderedJsonModel())
+        arv = arvados.api('v1')
  
          label = kwargs.pop('label', None) or root.get('name') or root['uuid']
          root['name'] = label