Merge branch '19818-api-pydoc'

[arvados.git] / tools / crunchstat-summary / crunchstat_summary / summarizer.py
diff --git a/tools/crunchstat-summary/crunchstat_summary/summarizer.py b/tools/crunchstat-summary/crunchstat_summary/summarizer.py

index 3780ef783d45b10aab9d24f77dba2cd40cb53ec6..2bd329719bec70300d268b06bb6abe8e3abf245c 100644 (file)
--- a/tools/crunchstat-summary/crunchstat_summary/summarizer.py
+++ b/tools/crunchstat-summary/crunchstat_summary/summarizer.py
@@ -4,7 +4,6 @@
  
  import arvados
  import collections
-import arvados.util
  import crunchstat_summary.dygraphs
  import crunchstat_summary.reader
  import datetime
@@ -16,7 +15,6 @@ import sys
  import threading
  import _strptime
  
-from arvados.api import OrderedJsonModel
  from crunchstat_summary import logger
  
  # Recommend memory constraints that are this multiple of an integral
@@ -246,6 +244,27 @@ class Summarizer(object):
                      self.job_tot[category][stat] += val
          logger.debug('%s: done totals', self.label)
  
+        missing_category = {
+            'cpu': 'CPU',
+            'mem': 'memory',
+            'net:': 'network I/O',
+            'statfs': 'storage space',
+        }
+        for task_stat in self.task_stats.values():
+            for category in task_stat.keys():
+                for checkcat in missing_category:
+                    if checkcat.endswith(':'):
+                        if category.startswith(checkcat):
+                            missing_category.pop(checkcat)
+                            break
+                    else:
+                        if category == checkcat:
+                            missing_category.pop(checkcat)
+                            break
+        for catlabel in missing_category.values():
+            logger.warning('%s: %s stats are missing -- possible cluster configuration issue',
+                        self.label, catlabel)
+
      def long_label(self):
          label = self.label
          if hasattr(self, 'process') and self.process['uuid'] not in label:
@@ -365,7 +384,7 @@ class Summarizer(object):
                  constraint_key,
                  int(used_cores))
  
-    # FIXME: This needs to be updated to account for current nodemanager algorithms
+    # FIXME: This needs to be updated to account for current a-d-c algorithms
      def _recommend_ram(self):
          """Recommend an economical RAM constraint for this job.
  
@@ -498,7 +517,7 @@ def NewSummarizer(process_or_uuid, **kwargs):
      else:
          uuid = process_or_uuid
          process = None
-        arv = arvados.api('v1', model=OrderedJsonModel())
+        arv = arvados.api('v1')
  
      if '-dz642-' in uuid:
          if process is None:
@@ -537,7 +556,7 @@ class ProcessSummarizer(Summarizer):
          # Pre-Arvados v1.4 everything is in 'log'
          # For 1.4+ containers have no logs and container_requests have them in 'log_uuid', not 'log'
          log_collection = self.process.get('log', self.process.get('log_uuid'))
-        if log_collection and self.process.get('state') != arvados.util.CR_UNCOMMITTED:
+        if log_collection and self.process.get('state') != 'Uncommitted': # arvados.util.CR_UNCOMMITTED:
              try:
                  rdr = crunchstat_summary.reader.CollectionReader(log_collection)
              except arvados.errors.NotFoundError as e:
@@ -619,7 +638,7 @@ class MultiSummarizer(object):
  class JobTreeSummarizer(MultiSummarizer):
      """Summarizes a job and all children listed in its components field."""
      def __init__(self, job, label=None, **kwargs):
-        arv = arvados.api('v1', model=OrderedJsonModel())
+        arv = arvados.api('v1')
          label = label or job.get('name', job['uuid'])
          children = collections.OrderedDict()
          children[job['uuid']] = JobSummarizer(job, label=label, **kwargs)
@@ -663,7 +682,7 @@ class PipelineSummarizer(MultiSummarizer):
  
  class ContainerRequestTreeSummarizer(MultiSummarizer):
      def __init__(self, root, skip_child_jobs=False, **kwargs):
-        arv = arvados.api('v1', model=OrderedJsonModel())
+        arv = arvados.api('v1')
  
          label = kwargs.pop('label', None) or root.get('name') or root['uuid']
          root['name'] = label