1 from __future__ import print_function
2 from __future__ import absolute_import
3 from future import standard_library
4 standard_library.install_aliases()
5 from builtins import object
25 if sys.version_info >= (3, 0):
26 from collections import UserDict
28 from UserDict import UserDict
30 from .api import api, api_from_config, http_cache
31 from .collection import CollectionReader, CollectionWriter, ResumableCollectionWriter
32 from arvados.keep import *
33 from arvados.stream import *
34 from .arvfile import StreamFileReader
35 from .retry import RetryLoop
36 import arvados.errors as errors
37 import arvados.util as util
39 # Set up Arvados logging based on the user's configuration.
40 # All Arvados code should log under the arvados hierarchy.
41 log_handler = logging.StreamHandler()
42 log_handler.setFormatter(logging.Formatter(
43 '%(asctime)s %(name)s[%(process)d] %(levelname)s: %(message)s',
45 logger = logging.getLogger('arvados')
46 logger.addHandler(log_handler)
47 logger.setLevel(logging.DEBUG if config.get('ARVADOS_DEBUG')
50 def task_set_output(self, s, num_retries=5):
51 for tries_left in RetryLoop(num_retries=num_retries, backoff_start=0):
53 return api('v1').job_tasks().update(
60 except errors.ApiError as error:
61 if retry.check_http_response_success(error.resp.status) is None and tries_left > 0:
62 logger.debug("task_set_output: job_tasks().update() raised {}, retrying with {} tries left".format(repr(error),tries_left))
67 def current_task(num_retries=5):
72 for tries_left in RetryLoop(num_retries=num_retries, backoff_start=2):
74 task = api('v1').job_tasks().get(uuid=os.environ['TASK_UUID']).execute()
76 task.set_output = types.MethodType(task_set_output, task)
77 task.tmpdir = os.environ['TASK_WORK']
80 except errors.ApiError as error:
81 if retry.check_http_response_success(error.resp.status) is None and tries_left > 0:
82 logger.debug("current_task: job_tasks().get() raised {}, retrying with {} tries left".format(repr(error),tries_left))
87 def current_job(num_retries=5):
92 for tries_left in RetryLoop(num_retries=num_retries, backoff_start=2):
94 job = api('v1').jobs().get(uuid=os.environ['JOB_UUID']).execute()
96 job.tmpdir = os.environ['JOB_WORK']
99 except errors.ApiError as error:
100 if retry.check_http_response_success(error.resp.status) is None and tries_left > 0:
101 logger.debug("current_job: jobs().get() raised {}, retrying with {} tries left".format(repr(error),tries_left))
def getjobparam(*args):
    """Look up a value in the current job's ``script_parameters``.

    All positional arguments are forwarded unchanged to the ``get``
    method of ``current_job()['script_parameters']`` (presumably a
    mapping, so ``key`` and an optional default -- confirm against the
    API response type).
    """
    script_parameters = current_job()['script_parameters']
    return script_parameters.get(*args)
def get_job_param_mount(*args):
    """Return a job script parameter joined onto the task's Keep mount.

    The ``TASK_KEEPMOUNT`` environment variable supplies the base path
    (``KeyError`` if it is unset).  The positional arguments are passed
    straight to ``current_job()['script_parameters'].get`` and the
    result is appended with ``os.path.join``.
    """
    # Read the environment first, then the job record, matching the
    # evaluation order of the single-expression form.
    keep_mount = os.environ['TASK_KEEPMOUNT']
    param_value = current_job()['script_parameters'].get(*args)
    return os.path.join(keep_mount, param_value)
def get_task_param_mount(*args):
    """Return a task parameter joined onto the task's Keep mount.

    The ``TASK_KEEPMOUNT`` environment variable supplies the base path
    (``KeyError`` if it is unset).  The positional arguments are passed
    straight to ``current_task()['parameters'].get`` and the result is
    appended with ``os.path.join``.
    """
    # Read the environment first, then the task record, matching the
    # evaluation order of the single-expression form.
    keep_mount = os.environ['TASK_KEEPMOUNT']
    param_value = current_task()['parameters'].get(*args)
    return os.path.join(keep_mount, param_value)
class JobTask(object):
    """Task object whose constructor only reports the arguments it was given."""

    def __init__(self, parameters=None, runtime_constraints=None):
        """Print the parameters and runtime constraints for this task.

        Args:
            parameters: value to report; an empty dict is used when the
                argument is omitted or None.
            runtime_constraints: value to report; an empty dict is used
                when the argument is omitted or None.
        """
        # Build the empty defaults per call.  Default values in the
        # signature are evaluated once at definition time, so a dict
        # there would be one shared instance across every call.
        if parameters is None:
            parameters = {}
        if runtime_constraints is None:
            runtime_constraints = {}
        print("init jobtask %s %s" % (parameters, runtime_constraints))
118 class job_setup(object):
120 def one_task_per_input_file(if_sequence=0, and_end_task=True, input_as_path=False, api_client=None):
121 if if_sequence != current_task()['sequence']:
125 api_client = api('v1')
127 job_input = current_job()['script_parameters']['input']
128 cr = CollectionReader(job_input, api_client=api_client)
130 for s in cr.all_streams():
131 for f in s.all_files():
133 task_input = os.path.join(job_input, s.name(), f.name())
135 task_input = f.as_manifest()
137 'job_uuid': current_job()['uuid'],
138 'created_by_job_task_uuid': current_task()['uuid'],
139 'sequence': if_sequence + 1,
144 api_client.job_tasks().create(body=new_task_attrs).execute()
146 api_client.job_tasks().update(uuid=current_task()['uuid'],
147 body={'success':True}
152 def one_task_per_input_stream(if_sequence=0, and_end_task=True):
153 if if_sequence != current_task()['sequence']:
155 job_input = current_job()['script_parameters']['input']
156 cr = CollectionReader(job_input)
157 for s in cr.all_streams():
158 task_input = s.tokens()
160 'job_uuid': current_job()['uuid'],
161 'created_by_job_task_uuid': current_task()['uuid'],
162 'sequence': if_sequence + 1,
167 api('v1').job_tasks().create(body=new_task_attrs).execute()
169 api('v1').job_tasks().update(uuid=current_task()['uuid'],
170 body={'success':True}