#!/usr/bin/env python
-import hashlib # Import the hashlib module to compute md5.
+import hashlib # Import the hashlib module to compute MD5.
import arvados # Import the Arvados SDK module.
# Automatically parallelize this job by running one task per file.
arvados.job_setup.one_task_per_input_file(if_sequence=0, and_end_task=True,
input_as_path=True)
-# Create the object that will actually compute the md5 hash
+# Create the message digest object that will compute the MD5 hash
digestor = hashlib.new('md5')
-# Get the input file for the task and open it for reading
-with open(arvados.get_task_param_mount('input')) as f:
+# Get the input file for the task
+input_file = arvados.get_task_param_mount('input')
+
+# Open the input file for reading
+with open(input_file) as f:
while True:
buf = f.read(2**20) # read a 1 megabyte block from the file
if len(buf) == 0: # break when there is no more data left
break
- digestor.update(buf) # update the md5 hash object
+ digestor.update(buf) # update the MD5 hash object
# Get object representing the current task
this_task = arvados.current_task()
# Set output file within the collection
out.set_current_file_name("md5sum.txt")
-# Write an output line with the md5 value and input
+# Write an output line with the MD5 value and input
out.write("%s %s\n" % (digestor.hexdigest(), this_task['parameters']['input']))
# Commit the output to Keep. This returns a Keep ID.