#!/usr/bin/env python3 {% comment %} Copyright (C) The Arvados Authors. All rights reserved. SPDX-License-Identifier: CC-BY-SA-3.0 {% endcomment %} import arvados # Automatically parallelize this job by running one task per file. arvados.job_setup.one_task_per_input_file(if_sequence=0, and_end_task=True, input_as_path=True) # Get the input file for the task input_file = arvados.get_task_param_mount('input') # Run the external 'md5sum' program on the input file stdoutdata, stderrdata = arvados.util.run_command(['md5sum', input_file]) # Save the standard output (stdoutdata) to "md5sum.txt" in the output collection out = arvados.CollectionWriter() with out.open('md5sum.txt') as out_file: out_file.write(stdoutdata) arvados.current_task().set_output(out.finish())