X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/013efe3cfb6e53b372be1f785646e76a7965a948..d843787b4ece9952597d7814cbf10fb383c72625:/sdk/python/arvados/__init__.py diff --git a/sdk/python/arvados/__init__.py b/sdk/python/arvados/__init__.py index b165412d46..1df64703a9 100644 --- a/sdk/python/arvados/__init__.py +++ b/sdk/python/arvados/__init__.py @@ -18,13 +18,25 @@ import fcntl import time import threading -from api import * -from collection import * +from .api import api, http_cache +from collection import CollectionReader, CollectionWriter, ResumableCollectionWriter from keep import * from stream import * +from arvfile import StreamFileReader import errors import util +# Set up Arvados logging based on the user's configuration. +# All Arvados code should log under the arvados hierarchy. +log_handler = logging.StreamHandler() +log_handler.setFormatter(logging.Formatter( + '%(asctime)s %(name)s[%(process)d] %(levelname)s: %(message)s', + '%Y-%m-%d %H:%M:%S')) +logger = logging.getLogger('arvados') +logger.addHandler(log_handler) +logger.setLevel(logging.DEBUG if config.get('ARVADOS_DEBUG') + else logging.WARNING) + def task_set_output(self,s): api('v1').job_tasks().update(uuid=self['uuid'], body={ @@ -59,20 +71,34 @@ def current_job(): def getjobparam(*args): return current_job()['script_parameters'].get(*args) +def get_job_param_mount(*args): + return os.path.join(os.environ['TASK_KEEPMOUNT'], current_job()['script_parameters'].get(*args)) + +def get_task_param_mount(*args): + return os.path.join(os.environ['TASK_KEEPMOUNT'], current_task()['parameters'].get(*args)) + class JobTask(object): def __init__(self, parameters=dict(), runtime_constraints=dict()): print "init jobtask %s %s" % (parameters, runtime_constraints) class job_setup: @staticmethod - def one_task_per_input_file(if_sequence=0, and_end_task=True): + def one_task_per_input_file(if_sequence=0, and_end_task=True, input_as_path=False, api_client=None): if if_sequence != current_task()['sequence']: return + + if not api_client: + api_client = api('v1') + job_input = current_job()['script_parameters']['input'] - cr = CollectionReader(job_input) + cr = CollectionReader(job_input, api_client=api_client) + cr.normalize() for s in cr.all_streams(): for f in s.all_files(): - task_input = f.as_manifest() + if input_as_path: + task_input = os.path.join(job_input, s.name(), f.name()) + else: + task_input = f.as_manifest() new_task_attrs = { 'job_uuid': current_job()['uuid'], 'created_by_job_task_uuid': current_task()['uuid'], @@ -81,9 +107,9 @@ class job_setup: 'input':task_input } } - api('v1').job_tasks().create(body=new_task_attrs).execute() + api_client.job_tasks().create(body=new_task_attrs).execute() if and_end_task: - api('v1').job_tasks().update(uuid=current_task()['uuid'], + api_client.job_tasks().update(uuid=current_task()['uuid'], body={'success':True} ).execute() exit(0) @@ -110,5 +136,3 @@ class job_setup: body={'success':True} ).execute() exit(0) - -