[ARVADOS] created: 1.1.4-431-g02763280f

Git user git at public.curoverse.com
Thu Jun 21 09:51:25 EDT 2018


        at  02763280f54fd0c2a499285f8ce6afcbd8b9e082 (commit)


commit 02763280f54fd0c2a499285f8ce6afcbd8b9e082
Author: Fuad Muhic <fmuhic at capeannenterprises.com>
Date:   Mon Jun 18 16:37:42 2018 +0200

    Update intermediate collection name, properties and trash_at atrribute
    
    Arvados-DCO-1.1-Signed-off-by: Fuad Muhic <fmuhic at capeannenterprises.com>

diff --git a/sdk/cwl/arvados_cwl/arvcontainer.py b/sdk/cwl/arvados_cwl/arvcontainer.py
index 0bec69264..1ad276e67 100644
--- a/sdk/cwl/arvados_cwl/arvcontainer.py
+++ b/sdk/cwl/arvados_cwl/arvcontainer.py
@@ -20,6 +20,7 @@ from cwltool.utils import aslist
 
 import arvados.collection
 
+from arvados.errors import ApiError
 from .arvdocker import arv_docker_get_image
 from . import done
 from .runner import Runner, arvados_jobs_image, packed_workflow, trim_anonymous_location, remove_redundant_fields
@@ -156,8 +157,26 @@ class ArvadosContainer(object):
 
                 keepemptydirs(vwd)
 
+                trash_time = None 
+                if self.arvrunner.intermediate_output_ttl > 0: 
+                    trash_time = datetime.datetime.now() + datetime.timedelta(seconds=self.arvrunner.intermediate_output_ttl) 
+ 
+                current_container_uuid = None 
+                try: 
+                    current_container = self.arvrunner.api.containers().current().execute(num_retries=self.arvrunner.num_retries) 
+                    current_container_uuid = current_container['uuid'] 
+                except ApiError as e: 
+                    # Status code 404 just means we're not running in a container. 
+                    if e.resp.status != 404: 
+                        logger.info("Getting current container: %s", e) 
+                props = {"type": "Intermediate", 
+                         "container": current_container_uuid}
+
                 with Perf(metrics, "generatefiles.save_new %s" % self.name):
-                    vwd.save_new()
+                    vwd.save_new(name="Intermediate collection", 
+                                 ensure_unique_name=True, 
+                                 trash_at=trash_time, 
+                                 properties=props)
 
                 prev = None
                 for f, p in sorteditems:
diff --git a/sdk/cwl/arvados_cwl/arvjob.py b/sdk/cwl/arvados_cwl/arvjob.py
index 04256c68f..2d98a53b3 100644
--- a/sdk/cwl/arvados_cwl/arvjob.py
+++ b/sdk/cwl/arvados_cwl/arvjob.py
@@ -6,6 +6,7 @@ import logging
 import re
 import copy
 import json
+import datetime
 import time
 
 from cwltool.process import get_feature, shortname, UnsupportedRequirement
@@ -66,8 +67,26 @@ class ArvadosJob(object):
                                 n.write(p.resolved.encode("utf-8"))
 
                 if vwd:
+                    trash_time = None 
+                    if self.arvrunner.intermediate_output_ttl > 0: 
+                        trash_time = datetime.datetime.now() + datetime.timedelta(seconds=self.arvrunner.intermediate_output_ttl) 
+ 
+                    current_container_uuid = None 
+                    try: 
+                        current_container = self.arvrunner.api.containers().current().execute(num_retries=self.arvrunner.num_retries) 
+                        current_container_uuid = current_container['uuid'] 
+                    except ApiError as e: 
+                        # Status code 404 just means we're not running in a container. 
+                        if e.resp.status != 404: 
+                            logger.info("Getting current container: %s", e) 
+ 
+                    props = {"type": "Intermediate", 
+                             "container": current_container_uuid}
                     with Perf(metrics, "generatefiles.save_new %s" % self.name):
-                        vwd.save_new()
+                        vwd.save_new(name="Intermediate collection", 
+                                     ensure_unique_name=True, 
+                                     trash_at=trash_time, 
+                                     properties=props)
 
                 for f, p in generatemapper.items():
                     if p.type == "File":
diff --git a/sdk/cwl/arvados_cwl/pathmapper.py b/sdk/cwl/arvados_cwl/pathmapper.py
index 27e48f1f4..a749b5162 100644
--- a/sdk/cwl/arvados_cwl/pathmapper.py
+++ b/sdk/cwl/arvados_cwl/pathmapper.py
@@ -7,12 +7,14 @@ import logging
 import uuid
 import os
 import urllib
+import datetime
 
 import arvados.commands.run
 import arvados.collection
 
 from schema_salad.sourceline import SourceLine
 
+from arvados.errors import ApiError
 from cwltool.pathmapper import PathMapper, MapperEnt, abspath, adjustFileObjs, adjustDirObjs
 from cwltool.workflow import WorkflowException
 
@@ -153,9 +155,13 @@ class ArvPathMapper(PathMapper):
                 for l in srcobj.get("listing", []):
                     self.addentry(l, c, ".", remap)
 
-                check = self.arvrunner.api.collections().list(filters=[["portable_data_hash", "=", c.portable_data_hash()]], limit=1).execute(num_retries=self.arvrunner.num_retries)
-                if not check["items"]:
-                    c.save_new(owner_uuid=self.arvrunner.project_uuid)
+                trash_time, props = self.__get_collection_attributes()
+
+                c.save_new(name="Intermediate collection", 
+                           owner_uuid=self.arvrunner.project_uuid, 
+                           ensure_unique_name=True, 
+                           trash_at=trash_time, 
+                           properties=props)
 
                 ab = self.collection_pattern % c.portable_data_hash()
                 self._pathmap[srcobj["location"]] = MapperEnt("keep:"+c.portable_data_hash(), ab, "Directory", True)
@@ -167,9 +173,13 @@ class ArvPathMapper(PathMapper):
                                                   num_retries=self.arvrunner.num_retries                                                  )
                 self.addentry(srcobj, c, ".", remap)
 
-                check = self.arvrunner.api.collections().list(filters=[["portable_data_hash", "=", c.portable_data_hash()]], limit=1).execute(num_retries=self.arvrunner.num_retries)
-                if not check["items"]:
-                    c.save_new(owner_uuid=self.arvrunner.project_uuid)
+                trash_time, props = self.__get_collection_attributes()
+
+                c.save_new(name="Intermediate collection", 
+                           owner_uuid=self.arvrunner.project_uuid, 
+                           ensure_unique_name=True, 
+                           trash_at=trash_time, 
+                           properties=props)
 
                 ab = self.file_pattern % (c.portable_data_hash(), srcobj["basename"])
                 self._pathmap[srcobj["location"]] = MapperEnt("keep:%s/%s" % (c.portable_data_hash(), srcobj["basename"]),
@@ -202,6 +212,25 @@ class ArvPathMapper(PathMapper):
         else:
             return None
 
+    def __get_collection_attributes(self):
+            trash_time = None 
+            if self.arvrunner.intermediate_output_ttl > 0: 
+                trash_time = datetime.datetime.now() + datetime.timedelta(seconds=self.arvrunner.intermediate_output_ttl) 
+
+            current_container_uuid = None 
+            try: 
+                current_container = self.arvrunner.api.containers().current().execute(num_retries=self.arvrunner.num_retries) 
+                current_container_uuid = current_container['uuid'] 
+            except ApiError as e: 
+                # Status code 404 just means we're not running in a container. 
+                if e.resp.status != 404: 
+                    logger.info("Getting current container: %s", e)
+            properties = {"type": "Intermediate", 
+                          "container": current_container_uuid}
+
+            return (trash_time, properties)
+
+
 class StagingPathMapper(PathMapper):
     _follow_dirs = True
 

commit 988c59f51aa579ce8bf0eab1cc729e05a5ee5631
Merge: 94f2b4397 92ac046a8
Author: Fuad Muhic <fmuhic at capeannenterprises.com>
Date:   Mon Jun 18 14:20:21 2018 +0200

    Merge branch '13330-intermediates-test' of git.curoverse.com:arvados into 13330-cwl-intermediate-collections-cleanup
    
    Arvados-DCO-1.1-Signed-off-by: Fuad Muhic <fmuhic at capeannenterprises.com>


-----------------------------------------------------------------------


hooks/post-receive
-- 




More information about the arvados-commits mailing list