diff --git a/README.md b/README.md
index 2f6f441c..b8101a06 100644
--- a/README.md
+++ b/README.md
@@ -67,7 +67,31 @@ Instrumenting these components is the **ClearML-server**, see [Self-Hosting](htt
---
-
+
+
+
+
+ | Experiment Management |
+ Datasets |
+
+
+  |
+  |
+
+
+ |
+
+
+ | Orchestration |
+ Pipelines |
+
+
+  |
+  |
+
+
+
+
## ClearML Experiment Manager
diff --git a/clearml/automation/controller.py b/clearml/automation/controller.py
index b470f546..253d3c73 100644
--- a/clearml/automation/controller.py
+++ b/clearml/automation/controller.py
@@ -1469,6 +1469,7 @@ class PipelineController(object):
pipeline_object._task = pipeline_task
pipeline_object._nodes = {}
pipeline_object._running_nodes = []
+ pipeline_object._version = pipeline_task._get_runtime_properties().get("version")
try:
pipeline_object._deserialize(pipeline_task._get_configuration_dict(cls._config_section), force=True)
except Exception:
@@ -1485,6 +1486,11 @@ class PipelineController(object):
# type: () -> List[str]
return self._task.get_tags() or []
+ @property
+ def version(self):
+ # type: () -> str
+ return self._version
+
def add_tags(self, tags):
# type: (Union[Sequence[str], str]) -> None
"""
@@ -4075,6 +4081,13 @@ class PipelineDecorator(PipelineController):
):
_node.name = "{}_{}".format(_node_name, counter)
counter += 1
+ # Copy callbacks to the replicated node
+ if cls._singleton._pre_step_callbacks.get(_node_name):
+ cls._singleton._pre_step_callbacks[_node.name] = cls._singleton._pre_step_callbacks[_node_name]
+ if cls._singleton._post_step_callbacks.get(_node_name):
+ cls._singleton._post_step_callbacks[_node.name] = cls._singleton._post_step_callbacks[_node_name]
+ if cls._singleton._status_change_callbacks.get(_node_name):
+ cls._singleton._status_change_callbacks[_node.name] = cls._singleton._status_change_callbacks[_node_name]
_node_name = _node.name
if _node.name not in cls._singleton._nodes:
cls._singleton._nodes[_node.name] = _node
diff --git a/clearml/automation/optimization.py b/clearml/automation/optimization.py
index c8ec47e8..08fa2c7c 100644
--- a/clearml/automation/optimization.py
+++ b/clearml/automation/optimization.py
@@ -1947,7 +1947,7 @@ class HyperParameterOptimizer(object):
objective if objective is not None else (
[-1] * self._objective_metric.len
),
- iteration_value if iteration_value is not None else (
+ [iteration_value] * self._objective_metric.len if iteration_value is not None else (
[-1] * self._objective_metric.len
),
params
diff --git a/clearml/automation/scheduler.py b/clearml/automation/scheduler.py
index d09e52ee..545c92b7 100644
--- a/clearml/automation/scheduler.py
+++ b/clearml/automation/scheduler.py
@@ -8,8 +8,8 @@ from typing import List, Union, Optional, Callable, Sequence, Dict
from attr import attrs, attrib
from dateutil.relativedelta import relativedelta
-from .job import ClearmlJob
from .controller import PipelineController
+from .job import ClearmlJob
from ..backend_interface.util import datetime_from_isoformat, datetime_to_isoformat, mutually_exclusive
from ..task import Task
@@ -28,12 +28,11 @@ class BaseScheduleJob(object):
_executed_instances = attrib(type=list, default=None)
def to_dict(self, full=False):
- return {k: v for k, v in self.__dict__.items()
- if not callable(v) and (full or not str(k).startswith('_'))}
+ return {k: v for k, v in self.__dict__.items() if not callable(v) and (full or not str(k).startswith("_"))}
def update(self, a_job):
# type: (Union[Dict, BaseScheduleJob]) -> BaseScheduleJob
- converters = {a.name: a.converter for a in getattr(self, '__attrs_attrs__', [])}
+ converters = {a.name: a.converter for a in getattr(self, "__attrs_attrs__", [])}
for k, v in (a_job.to_dict(full=True) if not isinstance(a_job, dict) else a_job).items():
if v is not None and not callable(getattr(self, k, v)):
setattr(self, k, converters[k](v) if converters.get(k) else v)
@@ -80,7 +79,7 @@ class BaseScheduleJob(object):
@attrs
class ScheduleJob(BaseScheduleJob):
- _weekdays_ind = ('monday', 'tuesday', 'wednesday', 'thursday', 'friday', 'saturday', 'sunday')
+ _weekdays_ind = ("monday", "tuesday", "wednesday", "thursday", "friday", "saturday", "sunday")
execution_limit_hours = attrib(type=float, default=None)
recurring = attrib(type=bool, default=True)
@@ -100,8 +99,7 @@ class ScheduleJob(BaseScheduleJob):
# type: () -> None
def check_integer(value):
try:
- return False if not isinstance(value, (int, float)) or \
- int(value) != float(value) else True
+ return False if not isinstance(value, (int, float)) or int(value) != float(value) else True
except (TypeError, ValueError):
return False
@@ -155,7 +153,7 @@ class ScheduleJob(BaseScheduleJob):
month=int(self.month or 1),
day=int(self.day or 1),
hour=int(self.hour or 0),
- minute=int(self.minute or 0)
+ minute=int(self.minute or 0),
)
if self.weekdays:
self._next_run += relativedelta(weekday=self.get_weekday_ord(self.weekdays[0]))
@@ -172,7 +170,7 @@ class ScheduleJob(BaseScheduleJob):
except ValueError:
# in case previous execution was not in the weekday (for example executed immediately at scheduling)
prev_weekday_ind = -1
- weekday = _weekdays[(prev_weekday_ind+1) % len(_weekdays)]
+ weekday = _weekdays[(prev_weekday_ind + 1) % len(_weekdays)]
prev_timestamp = self._last_executed or self.starting_time
# fix first scheduled job should be as close as possible to starting time
@@ -184,8 +182,8 @@ class ScheduleJob(BaseScheduleJob):
# if this is a daily schedule and we can still run it today, then we should
run0 = self._calc_next_run(self.starting_time, weekday)
run1 = self._calc_next_run(run0, weekday)
- delta = run1-run0
- optional_first_timestamp = self._calc_next_run(prev_timestamp-delta, weekday)
+ delta = run1 - run0
+ optional_first_timestamp = self._calc_next_run(prev_timestamp - delta, weekday)
if optional_first_timestamp > prev_timestamp:
# this is us, we can still run it
self._next_run = optional_first_timestamp
@@ -236,7 +234,7 @@ class ScheduleJob(BaseScheduleJob):
months=0 if self.year else (self.month or 0),
hours=self.hour or 0,
minutes=self.minute or 0,
- weekday=weekday
+ weekday=weekday,
)
return next_timestamp
@@ -283,7 +281,7 @@ class ScheduleJob(BaseScheduleJob):
if self.execution_limit_hours and task_id:
self._execution_timeout = self._last_executed + relativedelta(
hours=int(self.execution_limit_hours),
- minutes=int((self.execution_limit_hours - int(self.execution_limit_hours)) * 60)
+ minutes=int((self.execution_limit_hours - int(self.execution_limit_hours)) * 60),
)
else:
self._execution_timeout = None
@@ -306,16 +304,16 @@ class ExecutedJob(object):
thread_id = attrib(type=str, default=None)
def to_dict(self, full=False):
- return {k: v for k, v in self.__dict__.items() if full or not str(k).startswith('_')}
+ return {k: v for k, v in self.__dict__.items() if full or not str(k).startswith("_")}
class BaseScheduler(object):
def __init__(
- self,
- sync_frequency_minutes=15,
- force_create_task_name=None,
- force_create_task_project=None,
- pooling_frequency_minutes=None
+ self,
+ sync_frequency_minutes=15,
+ force_create_task_name=None,
+ force_create_task_project=None,
+ pooling_frequency_minutes=None
):
# type: (float, Optional[str], Optional[str], Optional[float]) -> None
"""
@@ -333,8 +331,8 @@ class BaseScheduler(object):
self._sync_frequency_minutes = sync_frequency_minutes
if force_create_task_name or not Task.current_task():
self._task = Task.init(
- project_name=force_create_task_project or 'DevOps',
- task_name=force_create_task_name or 'Scheduler',
+ project_name=force_create_task_project or "DevOps",
+ task_name=force_create_task_name or "Scheduler",
task_type=Task.TaskTypes.service,
auto_resource_monitoring=False,
)
@@ -356,12 +354,12 @@ class BaseScheduler(object):
while True:
# sync with backend
try:
- if time() - self._last_sync > 60. * self._sync_frequency_minutes:
+ if time() - self._last_sync > 60.0 * self._sync_frequency_minutes:
self._last_sync = time()
self._deserialize()
self._update_execution_plots()
except Exception as ex:
- self._log('Warning: Exception caught during deserialization: {}'.format(ex))
+ self._log("Warning: Exception caught during deserialization: {}".format(ex))
self._last_sync = time()
try:
@@ -369,16 +367,16 @@ class BaseScheduler(object):
self._serialize_state()
self._update_execution_plots()
except Exception as ex:
- self._log('Warning: Exception caught during scheduling step: {}'.format(ex))
+ self._log("Warning: Exception caught during scheduling step: {}".format(ex))
# rate control
sleep(15)
# sleep until the next pool (default None)
if self._pooling_frequency_minutes:
self._log("Sleeping until the next pool in {} minutes".format(self._pooling_frequency_minutes))
- sleep(self._pooling_frequency_minutes*60.)
+ sleep(self._pooling_frequency_minutes * 60.0)
- def start_remotely(self, queue='services'):
+ def start_remotely(self, queue="services"):
# type: (str) -> None
"""
Start the Task TaskScheduler loop (notice this function does not return)
@@ -456,11 +454,8 @@ class BaseScheduler(object):
# check if this is a single instance, then we need to abort the Task
if job.single_instance and job.get_last_executed_task_id():
t = Task.get_task(task_id=job.get_last_executed_task_id())
- if t.status in ('in_progress', 'queued'):
- self._log(
- 'Skipping Task {} scheduling, previous Task instance {} still running'.format(
- job.name, t.id
- ))
+ if t.status in ("in_progress", "queued"):
+ self._log("Skipping Task {} scheduling, previous Task instance {} still running".format(job.name, t.id))
job.run(None)
return None
@@ -474,8 +469,7 @@ class BaseScheduler(object):
target_project=job.get_resolved_target_project(),
tags=[add_tags] if add_tags and isinstance(add_tags, str) else add_tags,
)
- self._log('Scheduling Job {}, Task {} on queue {}.'.format(
- job.name, task_job.task_id(), job.queue))
+ self._log("Scheduling Job {}, Task {} on queue {}.".format(job.name, task_job.task_id(), job.queue))
if task_job.launch(queue_name=job.queue):
# mark as run
job.run(task_job.task_id())
@@ -501,12 +495,12 @@ class BaseScheduler(object):
self._log(
"Skipping Task '{}' scheduling, previous Thread instance '{}' still running".format(
job.name, a_thread.ident
- ))
+ )
+ )
job.run(None)
return None
- self._log("Scheduling Job '{}', Task '{}' on background thread".format(
- job.name, job.base_function))
+ self._log("Scheduling Job '{}', Task '{}' on background thread".format(job.name, job.base_function))
t = Thread(target=job.base_function, args=func_args or ())
t.start()
# mark as run
@@ -520,9 +514,9 @@ class BaseScheduler(object):
return
t = Task.get_task(task_id=task_id)
status = t.status
- if status in ('in_progress',):
+ if status in ("in_progress",):
t.stopped(force=True)
- elif status in ('queued',):
+ elif status in ("queued",):
Task.dequeue(t)
@@ -531,7 +525,8 @@ class TaskScheduler(BaseScheduler):
Task Scheduling controller.
Notice time-zone is ALWAYS UTC
"""
- _configuration_section = 'schedule'
+
+ _configuration_section = "schedule"
def __init__(self, sync_frequency_minutes=15, force_create_task_name=None, force_create_task_project=None):
# type: (float, Optional[str], Optional[str]) -> None
@@ -548,32 +543,32 @@ class TaskScheduler(BaseScheduler):
super(TaskScheduler, self).__init__(
sync_frequency_minutes=sync_frequency_minutes,
force_create_task_name=force_create_task_name,
- force_create_task_project=force_create_task_project
+ force_create_task_project=force_create_task_project,
)
self._schedule_jobs = [] # List[ScheduleJob]
self._timeout_jobs = {} # Dict[datetime, str]
self._executed_jobs = [] # List[ExecutedJob]
def add_task(
- self,
- schedule_task_id=None, # type: Union[str, Task]
- schedule_function=None, # type: Callable
- queue=None, # type: str
- name=None, # type: Optional[str]
- target_project=None, # type: Optional[str]
- minute=None, # type: Optional[int]
- hour=None, # type: Optional[int]
- day=None, # type: Optional[int]
- weekdays=None, # type: Optional[List[str]]
- month=None, # type: Optional[int]
- year=None, # type: Optional[int]
- limit_execution_time=None, # type: Optional[float]
- single_instance=False, # type: bool
- recurring=True, # type: bool
- execute_immediately=False, # type: bool
- reuse_task=False, # type: bool
- task_parameters=None, # type: Optional[dict]
- task_overrides=None, # type: Optional[dict]
+ self,
+ schedule_task_id=None, # type: Union[str, Task]
+ schedule_function=None, # type: Callable
+ queue=None, # type: str
+ name=None, # type: Optional[str]
+ target_project=None, # type: Optional[str]
+ minute=None, # type: Optional[int]
+ hour=None, # type: Optional[int]
+ day=None, # type: Optional[int]
+ weekdays=None, # type: Optional[List[str]]
+ month=None, # type: Optional[int]
+ year=None, # type: Optional[int]
+ limit_execution_time=None, # type: Optional[float]
+ single_instance=False, # type: bool
+ recurring=True, # type: bool
+ execute_immediately=False, # type: bool
+ reuse_task=False, # type: bool
+ task_parameters=None, # type: Optional[dict]
+ task_overrides=None, # type: Optional[dict]
):
# type: (...) -> bool
"""
@@ -640,7 +635,7 @@ class TaskScheduler(BaseScheduler):
:return: True if job is successfully added to the scheduling list
"""
mutually_exclusive(schedule_function=schedule_function, schedule_task_id=schedule_task_id)
- task_id = schedule_task_id.id if isinstance(schedule_task_id, Task) else str(schedule_task_id or '')
+ task_id = schedule_task_id.id if isinstance(schedule_task_id, Task) else str(schedule_task_id or "")
# noinspection PyProtectedMember
job = ScheduleJob(
@@ -715,46 +710,46 @@ class TaskScheduler(BaseScheduler):
# get idle timeout (aka sleeping)
scheduled_jobs = sorted(
- [j for j in self._schedule_jobs if j.next_run() is not None],
- key=lambda x: x.next_run()
+ [j for j in self._schedule_jobs if j.next_run() is not None], key=lambda x: x.next_run()
)
# sort by key
timeout_job_datetime = min(self._timeout_jobs, key=self._timeout_jobs.get) if self._timeout_jobs else None
if not scheduled_jobs and timeout_job_datetime is None:
# sleep and retry
- seconds = 60. * self._sync_frequency_minutes
- self._log('Nothing to do, sleeping for {:.2f} minutes.'.format(seconds / 60.))
+ seconds = 60.0 * self._sync_frequency_minutes
+ self._log("Nothing to do, sleeping for {:.2f} minutes.".format(seconds / 60.0))
sleep(seconds)
return False
next_time_stamp = scheduled_jobs[0].next_run() if scheduled_jobs else None
if timeout_job_datetime is not None:
- next_time_stamp = (
- min(next_time_stamp, timeout_job_datetime) if next_time_stamp else timeout_job_datetime
- )
+ next_time_stamp = min(next_time_stamp, timeout_job_datetime) if next_time_stamp else timeout_job_datetime
sleep_time = (next_time_stamp - datetime.utcnow()).total_seconds()
if sleep_time > 0:
# sleep until we need to run a job or maximum sleep time
- seconds = min(sleep_time, 60. * self._sync_frequency_minutes)
- self._log('Waiting for next run [UTC {}], sleeping for {:.2f} minutes, until next sync.'.format(
- next_time_stamp, seconds / 60.))
+ seconds = min(sleep_time, 60.0 * self._sync_frequency_minutes)
+ self._log(
+ "Waiting for next run [UTC {}], sleeping for {:.2f} minutes, until next sync.".format(
+ next_time_stamp, seconds / 60.0
+ )
+ )
sleep(seconds)
return False
# check if this is a Task timeout check
if timeout_job_datetime is not None and next_time_stamp == timeout_job_datetime:
task_id = self._timeout_jobs[timeout_job_datetime]
- self._log('Aborting job due to timeout: {}'.format(task_id))
+ self._log("Aborting job due to timeout: {}".format(task_id))
self._cancel_task(task_id=task_id)
self._timeout_jobs.pop(timeout_job_datetime, None)
else:
- self._log('Launching job: {}'.format(scheduled_jobs[0]))
+ self._log("Launching job: {}".format(scheduled_jobs[0]))
self._launch_job(scheduled_jobs[0])
return True
- def start_remotely(self, queue='services'):
+ def start_remotely(self, queue="services"):
# type: (str) -> None
"""
Start the Task TaskScheduler loop (notice this function does not return)
@@ -770,8 +765,8 @@ class TaskScheduler(BaseScheduler):
"""
# noinspection PyProtectedMember
self._task._set_configuration(
- config_type='json',
- description='schedule tasks configuration',
+ config_type="json",
+ description="schedule tasks configuration",
config_text=self._serialize_schedule_into_string(),
name=self._configuration_section,
)
@@ -785,9 +780,9 @@ class TaskScheduler(BaseScheduler):
dict(
scheduled_jobs=[j.to_dict(full=True) for j in self._schedule_jobs],
timeout_jobs={datetime_to_isoformat(k): v for k, v in self._timeout_jobs.items()},
- executed_jobs=[j.to_dict(full=True) for j in self._executed_jobs]
+ executed_jobs=[j.to_dict(full=True) for j in self._executed_jobs],
),
- default=datetime_to_isoformat
+ default=datetime_to_isoformat,
)
self._task.upload_artifact(name="state", artifact_object=json_str, preview="scheduler internal state")
@@ -798,34 +793,32 @@ class TaskScheduler(BaseScheduler):
"""
# get artifact
self._task.reload()
- artifact_object = self._task.artifacts.get('state')
+ artifact_object = self._task.artifacts.get("state")
if artifact_object is not None:
state_json_str = artifact_object.get(force_download=True)
if state_json_str is not None:
state_dict = json.loads(state_json_str)
self._schedule_jobs = self.__deserialize_scheduled_jobs(
- serialized_jobs_dicts=state_dict.get('scheduled_jobs', []),
- current_jobs=self._schedule_jobs
+ serialized_jobs_dicts=state_dict.get("scheduled_jobs", []), current_jobs=self._schedule_jobs
)
- self._timeout_jobs = {datetime_from_isoformat(k): v for k, v in (state_dict.get('timeout_jobs') or {})}
- self._executed_jobs = [ExecutedJob(**j) for j in state_dict.get('executed_jobs', [])]
+ self._timeout_jobs = {datetime_from_isoformat(k): v for k, v in (state_dict.get("timeout_jobs") or {})}
+ self._executed_jobs = [ExecutedJob(**j) for j in state_dict.get("executed_jobs", [])]
def _deserialize(self):
# type: () -> None
"""
Deserialize Task scheduling configuration only
"""
- self._log('Syncing scheduler')
+ self._log("Syncing scheduler")
self._task.reload()
# noinspection PyProtectedMember
json_str = self._task._get_configuration_text(name=self._configuration_section)
try:
self._schedule_jobs = self.__deserialize_scheduled_jobs(
- serialized_jobs_dicts=json.loads(json_str),
- current_jobs=self._schedule_jobs
+ serialized_jobs_dicts=json.loads(json_str), current_jobs=self._schedule_jobs
)
except Exception as ex:
- self._log('Failed deserializing configuration: {}'.format(ex), level=logging.WARN)
+ self._log("Failed deserializing configuration: {}".format(ex), level=logging.WARN)
return
@staticmethod
@@ -858,45 +851,61 @@ class TaskScheduler(BaseScheduler):
if not self._task:
return
- task_link_template = self._task.get_output_log_web_page() \
- .replace('/{}/'.format(self._task.project), '/{project}/') \
- .replace('/{}/'.format(self._task.id), '/{task}/')
+ task_link_template = (
+ self._task.get_output_log_web_page()
+ .replace("/{}/".format(self._task.project), "/{project}/")
+ .replace("/{}/".format(self._task.id), "/{task}/")
+ )
# plot the schedule definition
columns = [
- 'name', 'base_task_id', 'base_function', 'next_run', 'target_project', 'queue',
- 'minute', 'hour', 'day', 'month', 'year',
- 'starting_time', 'execution_limit_hours', 'recurring',
- 'single_instance', 'task_parameters', 'task_overrides', 'clone_task',
+ "name",
+ "base_task_id",
+ "base_function",
+ "next_run",
+ "target_project",
+ "queue",
+ "minute",
+ "hour",
+ "day",
+ "month",
+ "year",
+ "starting_time",
+ "execution_limit_hours",
+ "recurring",
+ "single_instance",
+ "task_parameters",
+ "task_overrides",
+ "clone_task",
]
scheduler_table = [columns]
for j in self._schedule_jobs:
j_dict = j.to_dict()
- j_dict['next_run'] = j.next()
- j_dict['base_function'] = "{}.{}".format(
- getattr(j.base_function, '__module__', ''),
- getattr(j.base_function, '__name__', '')
- ) if j.base_function else ''
+ j_dict["next_run"] = j.next()
+ j_dict["base_function"] = (
+ "{}.{}".format(getattr(j.base_function, "__module__", ""), getattr(j.base_function, "__name__", ""))
+ if j.base_function
+ else ""
+ )
- if not j_dict.get('base_task_id'):
- j_dict['clone_task'] = ''
+ if not j_dict.get("base_task_id"):
+ j_dict["clone_task"] = ""
row = [
- str(j_dict.get(c)).split('.', 1)[0] if isinstance(j_dict.get(c), datetime) else str(j_dict.get(c) or '')
+ str(j_dict.get(c)).split(".", 1)[0] if isinstance(j_dict.get(c), datetime) else str(j_dict.get(c) or "")
for c in columns
]
if row[1]:
- row[1] = '{}'.format(
- task_link_template.format(project='*', task=row[1]), row[1])
+ row[1] = '{}'.format(task_link_template.format(project="*", task=row[1]), row[1])
scheduler_table += [row]
# plot the already executed Tasks
- executed_table = [['name', 'task id', 'started', 'finished']]
+ executed_table = [["name", "task id", "started", "finished"]]
for executed_job in sorted(self._executed_jobs, key=lambda x: x.started, reverse=True):
if not executed_job.finished:
if executed_job.task_id:
t = Task.get_task(task_id=executed_job.task_id)
- if t.status not in ('in_progress', 'queued'):
+ if t.status not in ("in_progress", "queued"):
executed_job.finished = t.data.completed or datetime.utcnow()
elif executed_job.thread_id:
# noinspection PyBroadException
@@ -908,30 +917,31 @@ class TaskScheduler(BaseScheduler):
pass
executed_table += [
- [executed_job.name,
- '{}'.format(task_link_template.format(
- project='*', task=executed_job.task_id), executed_job.task_id)
- if executed_job.task_id else 'function',
- str(executed_job.started).split('.', 1)[0], str(executed_job.finished).split('.', 1)[0]
- ]
+ [
+ executed_job.name,
+ '{}'.format(
+ task_link_template.format(project="*", task=executed_job.task_id), executed_job.task_id
+ )
+ if executed_job.task_id
+ else "function",
+ str(executed_job.started).split(".", 1)[0],
+ str(executed_job.finished).split(".", 1)[0],
+ ]
]
self._task.get_logger().report_table(
- title='Schedule Tasks', series=' ', iteration=0,
- table_plot=scheduler_table
- )
- self._task.get_logger().report_table(
- title='Executed Tasks', series=' ', iteration=0,
- table_plot=executed_table
+ title="Schedule Tasks", series=" ", iteration=0, table_plot=scheduler_table
)
+ self._task.get_logger().report_table(title="Executed Tasks", series=" ", iteration=0, table_plot=executed_table)
def _launch_job_task(self, job, task_parameters=None, add_tags=None):
# type: (ScheduleJob, Optional[dict], Optional[List[str]]) -> Optional[ClearmlJob]
task_job = super(TaskScheduler, self)._launch_job_task(job, task_parameters=task_parameters, add_tags=add_tags)
# make sure this is not a function job
if task_job:
- self._executed_jobs.append(ExecutedJob(
- name=job.name, task_id=task_job.task_id(), started=datetime.utcnow()))
+ self._executed_jobs.append(
+ ExecutedJob(name=job.name, task_id=task_job.task_id(), started=datetime.utcnow())
+ )
# add timeout check
if job.get_execution_timeout():
# we should probably make sure we are not overwriting a Task
@@ -943,8 +953,9 @@ class TaskScheduler(BaseScheduler):
thread_job = super(TaskScheduler, self)._launch_job_function(job, func_args=func_args)
# make sure this is not a function job
if thread_job:
- self._executed_jobs.append(ExecutedJob(
- name=job.name, thread_id=str(thread_job.ident), started=datetime.utcnow()))
+ self._executed_jobs.append(
+ ExecutedJob(name=job.name, thread_id=str(thread_job.ident), started=datetime.utcnow())
+ )
# execution timeout is not supported with function callbacks.
return thread_job
diff --git a/clearml/backend_api/session/defs.py b/clearml/backend_api/session/defs.py
index a477ebd9..46ad41f3 100644
--- a/clearml/backend_api/session/defs.py
+++ b/clearml/backend_api/session/defs.py
@@ -11,8 +11,7 @@ ENV_AUTH_TOKEN = EnvEntry("CLEARML_AUTH_TOKEN")
ENV_VERBOSE = EnvEntry(
"CLEARML_API_VERBOSE", "TRAINS_API_VERBOSE", converter=safe_text_to_bool, type=bool, default=False
)
-ENV_HOST_VERIFY_CERT = EnvEntry("CLEARML_API_HOST_VERIFY_CERT", "TRAINS_API_HOST_VERIFY_CERT",
- type=bool, default=True)
+ENV_HOST_VERIFY_CERT = EnvEntry("CLEARML_API_HOST_VERIFY_CERT", "TRAINS_API_HOST_VERIFY_CERT", default=True)
ENV_OFFLINE_MODE = EnvEntry("CLEARML_OFFLINE_MODE", "TRAINS_OFFLINE_MODE", type=bool, converter=safe_text_to_bool)
ENV_CLEARML_NO_DEFAULT_SERVER = EnvEntry(
"CLEARML_NO_DEFAULT_SERVER", "TRAINS_NO_DEFAULT_SERVER", converter=safe_text_to_bool, type=bool, default=True
diff --git a/clearml/backend_api/utils.py b/clearml/backend_api/utils.py
index 0b34c28b..8738910d 100644
--- a/clearml/backend_api/utils.py
+++ b/clearml/backend_api/utils.py
@@ -9,6 +9,7 @@ from urllib3 import PoolManager
import six
from .session.defs import ENV_HOST_VERIFY_CERT
+from ..backend_config.converters import strtobool
if six.PY3:
from functools import lru_cache
@@ -141,8 +142,14 @@ def get_http_session_with_retry(
adapter = TLSv1HTTPAdapter(max_retries=retry, pool_connections=pool_connections, pool_maxsize=pool_maxsize)
session.mount('http://', adapter)
session.mount('https://', adapter)
+
# update verify host certificate
- session.verify = ENV_HOST_VERIFY_CERT.get(default=config.get('api.verify_certificate', True))
+ verify = ENV_HOST_VERIFY_CERT.get(default=config.get('api.verify_certificate', True))
+ try:
+ session.verify = bool(strtobool(verify) if isinstance(verify, str) else verify)
+ except (ValueError, AttributeError):
+ session.verify = verify
+
if not session.verify and __disable_certificate_verification_warning < 2:
# show warning
__disable_certificate_verification_warning += 1
diff --git a/clearml/backend_config/bucket_config.py b/clearml/backend_config/bucket_config.py
index 0bc5ac8e..9b6228b5 100644
--- a/clearml/backend_config/bucket_config.py
+++ b/clearml/backend_config/bucket_config.py
@@ -34,9 +34,19 @@ class S3BucketConfig(object):
verify = attrib(type=bool, default=None)
use_credentials_chain = attrib(type=bool, default=False)
extra_args = attrib(type=dict, default=None)
+ profile = attrib(type=str, default="")
def update(
- self, key, secret, multipart=True, region=None, use_credentials_chain=False, token="", extra_args=None
+ self,
+ key="",
+ secret="",
+ multipart=True,
+ region=None,
+ use_credentials_chain=False,
+ token="",
+ extra_args=None,
+ secure=True,
+ profile=""
):
self.key = key
self.secret = secret
@@ -45,6 +55,8 @@ class S3BucketConfig(object):
self.region = region
self.use_credentials_chain = use_credentials_chain
self.extra_args = extra_args
+ self.secure = secure
+ self.profile = profile
def is_valid(self):
return (self.key and self.secret) or self.use_credentials_chain
@@ -107,6 +119,8 @@ class S3BucketConfigurations(BaseBucketConfigurations):
default_token="",
default_extra_args=None,
default_verify=None,
+ default_profile="",
+ default_secure=True
):
super(S3BucketConfigurations, self).__init__()
self._buckets = buckets if buckets else list()
@@ -118,12 +132,12 @@ class S3BucketConfigurations(BaseBucketConfigurations):
self._default_use_credentials_chain = default_use_credentials_chain
self._default_extra_args = default_extra_args
self._default_verify = default_verify
+ self._default_profile = default_profile
+ self._default_secure = default_secure
@classmethod
def from_config(cls, s3_configuration):
- config_list = S3BucketConfig.from_list(
- s3_configuration.get("credentials", [])
- )
+ config_list = S3BucketConfig.from_list(s3_configuration.get("credentials", []))
default_key = s3_configuration.get("key", "") or getenv("AWS_ACCESS_KEY_ID", "")
default_secret = s3_configuration.get("secret", "") or getenv("AWS_SECRET_ACCESS_KEY", "")
@@ -132,11 +146,14 @@ class S3BucketConfigurations(BaseBucketConfigurations):
default_use_credentials_chain = s3_configuration.get("use_credentials_chain") or False
default_extra_args = s3_configuration.get("extra_args")
default_verify = s3_configuration.get("verify", None)
+ default_profile = s3_configuration.get("profile", "") or getenv("AWS_PROFILE", "")
+ default_secure = s3_configuration.get("secure", True)
- default_key = _none_to_empty_string(default_key)
- default_secret = _none_to_empty_string(default_secret)
- default_token = _none_to_empty_string(default_token)
- default_region = _none_to_empty_string(default_region)
+ default_key = _none_to_empty_string(default_key).strip()
+ default_secret = _none_to_empty_string(default_secret).strip()
+ default_token = _none_to_empty_string(default_token).strip()
+ default_region = _none_to_empty_string(default_region).strip()
+ default_profile = _none_to_empty_string(default_profile).strip()
return cls(
config_list,
@@ -147,6 +164,8 @@ class S3BucketConfigurations(BaseBucketConfigurations):
default_token,
default_extra_args,
default_verify,
+ default_profile,
+ default_secure
)
def add_config(self, bucket_config):
@@ -178,6 +197,8 @@ class S3BucketConfigurations(BaseBucketConfigurations):
use_credentials_chain=self._default_use_credentials_chain,
token=self._default_token,
extra_args=self._default_extra_args,
+ profile=self._default_profile,
+ secure=self._default_secure
)
def _get_prefix_from_bucket_config(self, config):
@@ -204,7 +225,6 @@ class S3BucketConfigurations(BaseBucketConfigurations):
:param uri: URI of bucket, directory or file
:return: S3BucketConfig: bucket config
"""
-
def find_match(uri):
self._update_prefixes(refresh=False)
uri = uri.lower()
@@ -244,6 +264,8 @@ class S3BucketConfigurations(BaseBucketConfigurations):
host=host,
token=self._default_token,
extra_args=self._default_extra_args,
+ profile=self._default_profile,
+ secure=self._default_secure
)
diff --git a/clearml/backend_interface/setupuploadmixin.py b/clearml/backend_interface/setupuploadmixin.py
index 00072bca..db767d9c 100644
--- a/clearml/backend_interface/setupuploadmixin.py
+++ b/clearml/backend_interface/setupuploadmixin.py
@@ -67,6 +67,7 @@ class SetupUploadMixin(object):
multipart=True, # bool
secure=True, # bool
verify=True, # bool
+ profile=None # Optional[str]
):
# type: (...) -> None
"""
@@ -85,6 +86,7 @@ class SetupUploadMixin(object):
multipart.
:param secure: Server supports HTTPS. Only required when using a Non-AWS S3 solution that only supports HTTPS.
:param verify: Whether or not to verify SSL certificates.
+ :param profile: The name of the AWS profile to use for this connection (optional).
Only required when using a Non-AWS S3 solution that only supports HTTPS with self-signed certificate.
"""
self._bucket_config = S3BucketConfig( # noqa
@@ -98,6 +100,7 @@ class SetupUploadMixin(object):
multipart=multipart,
secure=secure,
verify=verify,
+ profile=profile
)
StorageHelper.add_aws_configuration(self._bucket_config, log=self.log)
self.storage_uri = StorageHelper.get_aws_storage_uri_from_config(self._bucket_config)
diff --git a/clearml/backend_interface/task/populate.py b/clearml/backend_interface/task/populate.py
index e20be854..30181e15 100644
--- a/clearml/backend_interface/task/populate.py
+++ b/clearml/backend_interface/task/populate.py
@@ -92,7 +92,6 @@ class CreateAndPopulate(object):
repo = None
else:
folder = None
-
if raise_on_missing_entries and not base_task_id:
if not script:
raise ValueError("Entry point script not provided")
@@ -168,7 +167,6 @@ class CreateAndPopulate(object):
and not self.repo and (
not repo_info or not repo_info.script or not repo_info.script.get('repository')):
raise ValueError("Standalone script detected \'{}\', but no requirements provided".format(self.script))
-
if dry_run:
task = None
task_state = dict(
@@ -204,7 +202,6 @@ class CreateAndPopulate(object):
# clear the script section
task_state['script'] = {}
-
if repo_info:
task_state['script']['repository'] = repo_info.script['repository']
task_state['script']['version_num'] = repo_info.script['version_num']
@@ -216,15 +213,19 @@ class CreateAndPopulate(object):
task_state['script']['requirements'] = repo_info.script.get('requirements') or {}
if self.cwd:
self.cwd = self.cwd
- cwd = self.cwd if Path(self.cwd).is_dir() else (
- Path(repo_info.script['repo_root']) / self.cwd).as_posix()
+ # cwd should be relative to the repo_root, but we need the full path
+ # (repo_root + cwd) in order to resolve the entry point
+ cwd = (Path(repo_info.script['repo_root']) / self.cwd).as_posix()
+
if not Path(cwd).is_dir():
raise ValueError("Working directory \'{}\' could not be found".format(cwd))
- cwd = Path(cwd).relative_to(repo_info.script['repo_root']).as_posix()
entry_point = \
Path(repo_info.script['repo_root']) / repo_info.script['working_dir'] / repo_info.script[
'entry_point']
+ # resolve entry_point relative to the current working directory
entry_point = entry_point.relative_to(cwd).as_posix()
+ # restore cwd - make it relative to the repo_root again
+ cwd = Path(cwd).relative_to(repo_info.script['repo_root']).as_posix()
task_state['script']['entry_point'] = entry_point or ""
task_state['script']['working_dir'] = cwd or "."
elif self.repo:
@@ -260,7 +261,6 @@ class CreateAndPopulate(object):
# standalone task
task_state['script']['entry_point'] = self.script or ""
task_state['script']['working_dir'] = '.'
-
# update requirements
reqs = []
if self.requirements_file:
@@ -345,7 +345,6 @@ class CreateAndPopulate(object):
if task_state['script']['diff'] and not task_state['script']['diff'].endswith('\n'):
task_state['script']['diff'] += '\n'
task_state['script']['diff'] += task_init_patch
-
# set base docker image if provided
if self.docker:
if dry_run:
diff --git a/clearml/binding/artifacts.py b/clearml/binding/artifacts.py
index 5577bf24..99d02668 100644
--- a/clearml/binding/artifacts.py
+++ b/clearml/binding/artifacts.py
@@ -203,6 +203,10 @@ class Artifact(object):
with open(local_file, "rt") as f:
self._object = f.read()
elif self.type == "pickle":
+ if self.hash:
+ file_hash, _ = sha256sum(local_file, block_size=Artifacts._hash_block_size)
+ if self.hash != file_hash:
+ raise Exception("incorrect pickle file hash, artifact file might be corrupted")
with open(local_file, "rb") as f:
self._object = pickle.load(f)
except Exception as e:
diff --git a/clearml/datasets/dataset.py b/clearml/datasets/dataset.py
index d57b158e..ef6759dd 100644
--- a/clearml/datasets/dataset.py
+++ b/clearml/datasets/dataset.py
@@ -29,6 +29,7 @@ from ..storage.util import sha256sum, is_windows, md5text, format_size
from ..utilities.matching import matches_any_wildcard
from ..utilities.parallel import ParallelZipper
from ..utilities.version import Version
+from ..utilities.files import is_path_traversal
try:
from pathlib import Path as _Path # noqa
@@ -1856,6 +1857,12 @@ class Dataset(object):
for ds in datasets:
base_folder = Path(ds._get_dataset_files())
files = [f.relative_path for f in ds.file_entries if f.parent_dataset_id == ds.id]
+ files = [
+ os.path.basename(file)
+ if is_path_traversal(base_folder, file) or is_path_traversal(temp_folder, file)
+ else file
+ for file in files
+ ]
pool.map(
lambda x:
(temp_folder / x).parent.mkdir(parents=True, exist_ok=True) or
@@ -2326,12 +2333,24 @@ class Dataset(object):
link.size = Path(target_path).stat().st_size
if not max_workers:
for relative_path, link in links.items():
- target_path = os.path.join(target_folder, relative_path)
+ if not is_path_traversal(target_folder, relative_path):
+ target_path = os.path.join(target_folder, relative_path)
+ else:
+ LoggerRoot.get_base_logger().warning(
+ "Ignoring relative path `{}`: it must not traverse directories".format(relative_path)
+ )
+ target_path = os.path.join(target_folder, os.path.basename(relative_path))
_download_link(link, target_path)
else:
with ThreadPoolExecutor(max_workers=max_workers) as pool:
for relative_path, link in links.items():
- target_path = os.path.join(target_folder, relative_path)
+ if not is_path_traversal(target_folder, relative_path):
+ target_path = os.path.join(target_folder, relative_path)
+ else:
+ LoggerRoot.get_base_logger().warning(
+ "Ignoring relative path `{}`: it must not traverse directories".format(relative_path)
+ )
+ target_path = os.path.join(target_folder, os.path.basename(relative_path))
pool.submit(_download_link, link, target_path)
def _extract_dataset_archive(
diff --git a/clearml/errors.py b/clearml/errors.py
index 76516e27..a240708e 100644
--- a/clearml/errors.py
+++ b/clearml/errors.py
@@ -1,5 +1,6 @@
class UsageError(RuntimeError):
- """ An exception raised for illegal usage of clearml objects"""
+ """An exception raised for illegal usage of clearml objects"""
+
pass
@@ -12,5 +13,5 @@ class ArtifactUriDeleteError(ValueError):
@property
def remaining_uris(self):
- """ Remaining URIs to delete. Deletion of these URIs was aborted due to the error. """
+ """Remaining URIs to delete. Deletion of these URIs was aborted due to the error."""
return self._remaining_uris
diff --git a/clearml/model.py b/clearml/model.py
index b7ccc4bd..6288795a 100644
--- a/clearml/model.py
+++ b/clearml/model.py
@@ -1932,8 +1932,8 @@ class InputModel(Model):
# type: () -> str
return self._base_model_id
- def connect(self, task, name=None):
- # type: (Task, Optional[str]) -> None
+ def connect(self, task, name=None, ignore_remote_overrides=False):
+ # type: (Task, Optional[str], bool) -> None
"""
Connect the current model to a Task object, if the model is preexisting. Preexisting models include:
@@ -1943,24 +1943,31 @@ class InputModel(Model):
- Models whose origin is not ClearML that are used to create an InputModel object. For example,
models created using TensorFlow models.
- When the experiment is executed remotely in a worker, the input model already specified in the experiment is
- used.
+ When the experiment is executed remotely in a worker, the input model specified in the experiment UI/backend
+ is used, unless `ignore_remote_overrides` is set to True.
.. note::
The **ClearML Web-App** allows you to switch one input model for another and then enqueue the experiment
to execute in a worker.
:param object task: A Task object.
+ :param ignore_remote_overrides: If True, changing the model in the UI/backend will have no
+ effect when running remotely.
+ Default is False, meaning that any changes made in the UI/backend will be applied in remote execution.
:param str name: The model name to be stored on the Task
- (default to filename of the model weights, without the file extension, or to `Input Model` if that is not found)
+ (default to filename of the model weights, without the file extension, or to `Input Model`
+ if that is not found)
"""
self._set_task(task)
name = name or InputModel._get_connect_name(self)
InputModel._warn_on_same_name_connect(name)
+ ignore_remote_overrides = task._handle_ignore_remote_overrides(
+ name + "/_ignore_remote_overrides_input_model_", ignore_remote_overrides
+ )
model_id = None
# noinspection PyProtectedMember
- if running_remotely() and (task.is_main_task() or task._is_remote_main_task()):
+ if running_remotely() and (task.is_main_task() or task._is_remote_main_task()) and not ignore_remote_overrides:
input_models = task.input_models_id
# noinspection PyBroadException
try:
@@ -2245,7 +2252,7 @@ class OutputModel(BaseModel):
pass
self.connect(task, name=name)
- def connect(self, task, name=None):
+ def connect(self, task, name=None, **kwargs):
# type: (Task, Optional[str]) -> None
"""
Connect the current model to a Task object, if the model is a preexisting model. Preexisting models include:
diff --git a/clearml/storage/cache.py b/clearml/storage/cache.py
index e8c0bbb3..ec5f319d 100644
--- a/clearml/storage/cache.py
+++ b/clearml/storage/cache.py
@@ -208,11 +208,21 @@ class CacheManager(object):
new_file.touch(exist_ok=True)
except Exception:
pass
+ # if file doesn't exist, return file size None
+ # noinspection PyBroadException
+ try:
+ new_file_size = new_file.stat().st_size if new_file_exists else None
+ except Exception:
+ new_file_size = None
+
+ folder_files = list(folder.iterdir())
+ if len(folder_files) <= self._file_limit:
+ return new_file.as_posix(), new_file_size
# first exclude lock files
lock_files = dict()
files = []
- for f in sorted(folder.iterdir(), reverse=True, key=sort_max_access_time):
+ for f in sorted(folder_files, reverse=True, key=sort_max_access_time):
if f.name.startswith(CacheManager._lockfile_prefix) and f.name.endswith(
CacheManager._lockfile_suffix
):
@@ -233,10 +243,7 @@ class CacheManager(object):
# delete old files
files = files[self._file_limit:]
- for i, f in enumerate(files):
- if i < self._file_limit:
- continue
-
+ for f in files:
# check if the file is in the lock folder list:
folder_lock = self._folder_locks.get(f.absolute().as_posix())
if folder_lock:
@@ -285,14 +292,7 @@ class CacheManager(object):
except BaseException:
pass
- # if file doesn't exist, return file size None
- # noinspection PyBroadException
- try:
- size = new_file.stat().st_size if new_file_exists else None
- except Exception:
- size = None
-
- return new_file.as_posix(), size
+ return new_file.as_posix(), new_file_size
def lock_cache_folder(self, local_path):
# type: (Union[str, Path]) -> ()
diff --git a/clearml/storage/helper.py b/clearml/storage/helper.py
index 5da873db..c7c75a98 100644
--- a/clearml/storage/helper.py
+++ b/clearml/storage/helper.py
@@ -17,7 +17,7 @@ from concurrent.futures import ThreadPoolExecutor
from copy import copy
from datetime import datetime
from multiprocessing.pool import ThreadPool
-from tempfile import mktemp
+from tempfile import mkstemp
from time import time
from types import GeneratorType
@@ -461,15 +461,15 @@ class _Boto3Driver(_Driver):
)
}
if not cfg.use_credentials_chain:
- boto_kwargs["aws_access_key_id"] = cfg.key
- boto_kwargs["aws_secret_access_key"] = cfg.secret
+ boto_kwargs["aws_access_key_id"] = cfg.key or None
+ boto_kwargs["aws_secret_access_key"] = cfg.secret or None
if cfg.token:
boto_kwargs["aws_session_token"] = cfg.token
- self.resource = boto3.resource(
- "s3",
- **boto_kwargs
+ boto_session = boto3.Session(
+ profile_name=cfg.profile or None,
)
+ self.resource = boto_session.resource("s3", **boto_kwargs)
self.config = cfg
bucket_name = self.name[len(cfg.host) + 1:] if cfg.host else self.name
@@ -683,7 +683,12 @@ class _Boto3Driver(_Driver):
'time': datetime.utcnow().isoformat()
}
- boto_session = boto3.Session(conf.key, conf.secret, aws_session_token=conf.token)
+ boto_session = boto3.Session(
+ aws_access_key_id=conf.key or None,
+ aws_secret_access_key=conf.secret or None,
+ aws_session_token=conf.token or None,
+ profile_name=conf.profile or None
+ )
endpoint = (('https://' if conf.secure else 'http://') + conf.host) if conf.host else None
boto_resource = boto_session.resource('s3', region_name=conf.region or None, endpoint_url=endpoint)
bucket = boto_resource.Bucket(bucket_name)
@@ -738,7 +743,9 @@ class _Boto3Driver(_Driver):
cls._bucket_location_failure_reported.add(conf.get_bucket_host())
try:
- boto_session = boto3.Session(conf.key, conf.secret, aws_session_token=conf.token)
+ boto_session = boto3.Session(
+ conf.key, conf.secret, aws_session_token=conf.token, profile_name=conf.profile or None
+ )
boto_resource = boto_session.resource('s3')
return boto_resource.meta.client.get_bucket_location(Bucket=conf.bucket)["LocationConstraint"]
@@ -2004,7 +2011,7 @@ class StorageHelper(object):
return None
# create temp file with the requested file name
file_name = '.' + remote_url.split('/')[-1].split(os.path.sep)[-1]
- local_path = mktemp(suffix=file_name)
+ _, local_path = mkstemp(suffix=file_name)
return helper.download_to_file(remote_url, local_path, skip_zero_size_check=skip_zero_size_check)
def __init__(
@@ -2018,6 +2025,7 @@ class StorageHelper(object):
logger=None,
retries=5,
token=None,
+ profile=None,
**kwargs
):
level = config.get("storage.log.level", None)
@@ -2072,6 +2080,8 @@ class StorageHelper(object):
region=final_region,
use_credentials_chain=self._conf.use_credentials_chain,
token=token or self._conf.token,
+ profile=profile or self._conf.profile,
+ secure=self._secure,
extra_args=self._conf.extra_args,
)
@@ -2614,7 +2624,9 @@ class StorageHelper(object):
try:
if verbose:
self._log.info("Start downloading from {}".format(remote_path))
- if not overwrite_existing and Path(local_path).is_file():
+ # check for 0 sized files as well - we want to override empty files that were created
+ # via mkstemp or similar functions
+ if not overwrite_existing and Path(local_path).is_file() and Path(local_path).stat().st_size != 0:
self._log.debug(
'File {} already exists, no need to download, thread id = {}'.format(
local_path,
diff --git a/clearml/storage/manager.py b/clearml/storage/manager.py
index 55710017..ff0a7f20 100644
--- a/clearml/storage/manager.py
+++ b/clearml/storage/manager.py
@@ -36,6 +36,8 @@ class StorageManager(object):
the returned link is the same, otherwise a link to a local copy of the url file is returned.
Caching is enabled by default, cache limited by number of stored files per cache context.
Oldest accessed files are deleted when cache is full.
+ One can also use this function to prevent the deletion of a file that has been cached,
+ as the respective file will have its timestamp refreshed
:param str remote_url: remote url link (string)
:param str cache_context: Optional caching context identifier (string), default context 'global'
diff --git a/clearml/task.py b/clearml/task.py
index d0a216fa..501308af 100644
--- a/clearml/task.py
+++ b/clearml/task.py
@@ -1516,11 +1516,13 @@ class Task(_Task):
self.data.tags = list(set((self.data.tags or []) + tags))
self._edit(tags=self.data.tags)
- def connect(self, mutable, name=None):
- # type: (Any, Optional[str]) -> Any
+ def connect(self, mutable, name=None, ignore_remote_overrides=False):
+ # type: (Any, Optional[str], bool) -> Any
"""
Connect an object to a Task object. This connects an experiment component (part of an experiment) to the
experiment. For example, an experiment component can be a valid object containing some hyperparameters, or a :class:`Model`.
+ When running remotely, the value of the connected object is overridden by the corresponding value found
+ under the experiment's UI/backend (unless `ignore_remote_overrides` is True).
:param object mutable: The experiment component to connect. The object must be one of the following types:
@@ -1533,16 +1535,23 @@ class Task(_Task):
:param str name: A section name associated with the connected object, if 'name' is None defaults to 'General'
Currently, `name` is only supported for `dict` and `TaskParameter` objects, and should be omitted for the other supported types. (Optional)
-
For example, by setting `name='General'` the connected dictionary will be under the General section in the hyperparameters section.
While by setting `name='Train'` the connected dictionary will be under the Train section in the hyperparameters section.
+ :param ignore_remote_overrides: If True, ignore UI/backend overrides when running remotely.
+ Default is False, meaning that any changes made in the UI/backend will be applied in remote execution.
+
:return: It will return the same object that was passed as the `mutable` argument to the method, except if the type of the object is dict.
For dicts the :meth:`Task.connect` will return the dict decorated as a `ProxyDictPostWrite`.
This is done to allow propagating the updates from the connected object.
:raise: Raises an exception if passed an unsupported object.
"""
+ # input model connect and task parameters will handle this instead
+ if not isinstance(mutable, (InputModel, TaskParameters)):
+ ignore_remote_overrides = self._handle_ignore_remote_overrides(
+ (name or "General") + "/_ignore_remote_overrides_", ignore_remote_overrides
+ )
# dispatching by match order
dispatch = (
(OutputModel, self._connect_output_model),
@@ -1564,7 +1573,7 @@ class Task(_Task):
for mutable_type, method in dispatch:
if isinstance(mutable, mutable_type):
- return method(mutable, name=name)
+ return method(mutable, name=name, ignore_remote_overrides=ignore_remote_overrides)
raise Exception('Unsupported mutable type %s: no connect function found' % type(mutable).__name__)
@@ -1631,8 +1640,8 @@ class Task(_Task):
self.data.script.version_num = commit or ""
self._edit(script=self.data.script)
- def connect_configuration(self, configuration, name=None, description=None):
- # type: (Union[Mapping, list, Path, str], Optional[str], Optional[str]) -> Union[dict, Path, str]
+ def connect_configuration(self, configuration, name=None, description=None, ignore_remote_overrides=False):
+ # type: (Union[Mapping, list, Path, str], Optional[str], Optional[str], bool) -> Union[dict, Path, str]
"""
Connect a configuration dictionary or configuration file (pathlib.Path / str) to a Task object.
This method should be called before reading the configuration file.
@@ -1650,6 +1659,9 @@ class Task(_Task):
my_params = task.connect_configuration(my_params)
+ When running remotely, the value of the connected configuration is overridden by the corresponding value found
+ under the experiment's UI/backend (unless `ignore_remote_overrides` is True).
+
:param configuration: The configuration. This is usually the configuration used in the model training process.
Specify one of the following:
@@ -1664,9 +1676,15 @@ class Task(_Task):
:param str description: Configuration section description (text). default: None
+ :param bool ignore_remote_overrides: If True, ignore UI/backend overrides when running remotely.
+ Default is False, meaning that any changes made in the UI/backend will be applied in remote execution.
+
:return: If a dictionary is specified, then a dictionary is returned. If pathlib2.Path / string is
specified, then a path to a local configuration file is returned. Configuration object.
"""
+ ignore_remote_overrides = self._handle_ignore_remote_overrides(
+ (name or "General") + "/_ignore_remote_overrides_config_", ignore_remote_overrides
+ )
pathlib_Path = None # noqa
cast_Path = Path
if not isinstance(configuration, (dict, list, Path, six.string_types)):
@@ -1710,7 +1728,7 @@ class Task(_Task):
configuration_ = ProxyDictPostWrite(self, _update_config_dict, configuration_)
return configuration_
- if not running_remotely() or not (self.is_main_task() or self._is_remote_main_task()):
+ if not running_remotely() or not (self.is_main_task() or self._is_remote_main_task()) or ignore_remote_overrides:
configuration = get_dev_config(configuration)
else:
# noinspection PyBroadException
@@ -1744,7 +1762,7 @@ class Task(_Task):
return configuration
# it is a path to a local file
- if not running_remotely() or not (self.is_main_task() or self._is_remote_main_task()):
+ if not running_remotely() or not (self.is_main_task() or self._is_remote_main_task()) or ignore_remote_overrides:
# check if not absolute path
configuration_path = cast_Path(configuration)
if not configuration_path.is_file():
@@ -1793,8 +1811,8 @@ class Task(_Task):
f.write(configuration_text)
return cast_Path(local_filename) if isinstance(configuration, cast_Path) else local_filename
- def connect_label_enumeration(self, enumeration):
- # type: (Dict[str, int]) -> Dict[str, int]
+ def connect_label_enumeration(self, enumeration, ignore_remote_overrides=False):
+ # type: (Dict[str, int], bool) -> Dict[str, int]
"""
Connect a label enumeration dictionary to a Task (experiment) object.
@@ -1811,13 +1829,22 @@ class Task(_Task):
"person": 1
}
+ :param ignore_remote_overrides: If True, ignore UI/backend overrides when running remotely.
+ Default is False, meaning that any changes made in the UI/backend will be applied in remote execution.
:return: The label enumeration dictionary (JSON).
"""
+ ignore_remote_overrides = self._handle_ignore_remote_overrides(
+ "General/_ignore_remote_overrides_label_enumeration_", ignore_remote_overrides
+ )
if not isinstance(enumeration, dict):
raise ValueError("connect_label_enumeration supports only `dict` type, "
"{} is not supported".format(type(enumeration)))
- if not running_remotely() or not (self.is_main_task() or self._is_remote_main_task()):
+ if (
+ not running_remotely()
+ or not (self.is_main_task() or self._is_remote_main_task())
+ or ignore_remote_overrides
+ ):
self.set_model_label_enumeration(enumeration)
else:
# pop everything
@@ -3750,9 +3777,9 @@ class Task(_Task):
return self._logger
- def _connect_output_model(self, model, name=None):
+ def _connect_output_model(self, model, name=None, **kwargs):
assert isinstance(model, OutputModel)
- model.connect(self, name=name)
+ model.connect(self, name=name, ignore_remote_overrides=False)
return model
def _save_output_model(self, model):
@@ -3764,6 +3791,19 @@ class Task(_Task):
# deprecated
self._connected_output_model = model
+ def _handle_ignore_remote_overrides(self, overrides_name, ignore_remote_overrides):
+ if self.running_locally() and ignore_remote_overrides:
+ self.set_parameter(
+ overrides_name,
+ True,
+ description="If True, ignore UI/backend overrides when running remotely."
+ " Set it to False if you would like the overrides to be applied",
+ value_type=bool
+ )
+ elif not self.running_locally():
+ ignore_remote_overrides = self.get_parameter(overrides_name, default=ignore_remote_overrides, cast=True)
+ return ignore_remote_overrides
+
def _reconnect_output_model(self):
"""
Deprecated: If there is a saved connected output model, connect it again.
@@ -3776,7 +3816,7 @@ class Task(_Task):
if self._connected_output_model:
self.connect(self._connected_output_model)
- def _connect_input_model(self, model, name=None):
+ def _connect_input_model(self, model, name=None, ignore_remote_overrides=False):
assert isinstance(model, InputModel)
# we only allow for an input model to be connected once
# at least until we support multiple input models
@@ -3791,18 +3831,21 @@ class Task(_Task):
comment += 'Using model id: {}'.format(model.id)
self.set_comment(comment)
- model.connect(self, name)
+ model.connect(self, name, ignore_remote_overrides=ignore_remote_overrides)
return model
- def _connect_argparse(self, parser, args=None, namespace=None, parsed_args=None, name=None):
+ def _connect_argparse(
+ self, parser, args=None, namespace=None, parsed_args=None, name=None, ignore_remote_overrides=False
+ ):
# do not allow argparser to connect to jupyter notebook
# noinspection PyBroadException
try:
- if 'IPython' in sys.modules:
+ if "IPython" in sys.modules:
# noinspection PyPackageRequirements
from IPython import get_ipython # noqa
+
ip = get_ipython()
- if ip is not None and 'IPKernelApp' in ip.config:
+ if ip is not None and "IPKernelApp" in ip.config:
return parser
except Exception:
pass
@@ -3825,14 +3868,14 @@ class Task(_Task):
if parsed_args is None and parser == _parser:
parsed_args = _parsed_args
- if running_remotely() and (self.is_main_task() or self._is_remote_main_task()):
+ if running_remotely() and (self.is_main_task() or self._is_remote_main_task()) and not ignore_remote_overrides:
self._arguments.copy_to_parser(parser, parsed_args)
else:
self._arguments.copy_defaults_from_argparse(
parser, args=args, namespace=namespace, parsed_args=parsed_args)
return parser
- def _connect_dictionary(self, dictionary, name=None):
+ def _connect_dictionary(self, dictionary, name=None, ignore_remote_overrides=False):
def _update_args_dict(task, config_dict):
# noinspection PyProtectedMember
task._arguments.copy_from_dict(flatten_dictionary(config_dict), prefix=name)
@@ -3862,7 +3905,7 @@ class Task(_Task):
if isinstance(v, dict):
_check_keys(v, warning_sent)
- if not running_remotely() or not (self.is_main_task() or self._is_remote_main_task()):
+ if not running_remotely() or not (self.is_main_task() or self._is_remote_main_task()) or ignore_remote_overrides:
_check_keys(dictionary)
flat_dict = {str(k): v for k, v in flatten_dictionary(dictionary).items()}
self._arguments.copy_from_dict(flat_dict, prefix=name)
@@ -3875,19 +3918,28 @@ class Task(_Task):
return dictionary
- def _connect_task_parameters(self, attr_class, name=None):
- if running_remotely() and (self.is_main_task() or self._is_remote_main_task()):
- parameters = self.get_parameters()
- if not name:
- attr_class.update_from_dict(parameters)
- else:
- attr_class.update_from_dict(
- dict((k[len(name) + 1:], v) for k, v in parameters.items() if k.startswith('{}/'.format(name))))
+ def _connect_task_parameters(self, attr_class, name=None, ignore_remote_overrides=False):
+ ignore_remote_overrides_section = "_ignore_remote_overrides_"
+ if running_remotely():
+ ignore_remote_overrides = self.get_parameter(
+ (name or "General") + "/" + ignore_remote_overrides_section, default=ignore_remote_overrides, cast=True
+ )
+ if running_remotely() and (self.is_main_task() or self._is_remote_main_task()) and not ignore_remote_overrides:
+ parameters = self.get_parameters(cast=True)
+ if name:
+ parameters = dict(
+ (k[len(name) + 1:], v) for k, v in parameters.items() if k.startswith("{}/".format(name))
+ )
+ parameters.pop(ignore_remote_overrides_section, None)
+ attr_class.update_from_dict(parameters)
else:
- self.set_parameters(attr_class.to_dict(), __parameters_prefix=name)
+ parameters_dict = attr_class.to_dict()
+ if ignore_remote_overrides:
+ parameters_dict[ignore_remote_overrides_section] = True
+ self.set_parameters(parameters_dict, __parameters_prefix=name)
return attr_class
- def _connect_object(self, an_object, name=None):
+ def _connect_object(self, an_object, name=None, ignore_remote_overrides=False):
def verify_type(key, value):
if str(key).startswith('_') or not isinstance(value, self._parameters_allowed_types):
return False
@@ -3904,15 +3956,15 @@ class Task(_Task):
for k, v in cls_.__dict__.items()
if verify_type(k, v)
}
- if running_remotely() and (self.is_main_task() or self._is_remote_main_task()):
- a_dict = self._connect_dictionary(a_dict, name)
+ if running_remotely() and (self.is_main_task() or self._is_remote_main_task()) and not ignore_remote_overrides:
+ a_dict = self._connect_dictionary(a_dict, name, ignore_remote_overrides=ignore_remote_overrides)
for k, v in a_dict.items():
if getattr(an_object, k, None) != a_dict[k]:
setattr(an_object, k, v)
return an_object
else:
- self._connect_dictionary(a_dict, name)
+ self._connect_dictionary(a_dict, name, ignore_remote_overrides=ignore_remote_overrides)
return an_object
def _dev_mode_stop_task(self, stop_reason, pid=None):
diff --git a/clearml/utilities/files.py b/clearml/utilities/files.py
index 15c21053..59698f7c 100644
--- a/clearml/utilities/files.py
+++ b/clearml/utilities/files.py
@@ -20,3 +20,15 @@ def get_filename_max_length(dir_path):
print(err)
return 255 # Common filesystems like NTFS, EXT4 and HFS+ limited with 255
+
+
+def is_path_traversal(target_folder, relative_path):
+ try:
+ target_folder = pathlib2.Path(target_folder)
+ relative_path = pathlib2.Path(relative_path)
+ # returns the relative path starting from the target_folder,
+ # or raises a ValueError if a directory traversal attack is attempted
+ target_folder.joinpath(relative_path).resolve().relative_to(target_folder.resolve())
+ return False
+ except ValueError:
+ return True
diff --git a/clearml/utilities/resource_monitor.py b/clearml/utilities/resource_monitor.py
index dfe010eb..f0ea960a 100644
--- a/clearml/utilities/resource_monitor.py
+++ b/clearml/utilities/resource_monitor.py
@@ -52,7 +52,7 @@ class ResourceMonitor(BackgroundMonitor):
try:
active_gpus = os.environ.get('NVIDIA_VISIBLE_DEVICES', '') or \
os.environ.get('CUDA_VISIBLE_DEVICES', '')
- if active_gpus:
+ if active_gpus and active_gpus != "all":
self._active_gpus = [g.strip() for g in active_gpus.split(',')]
except Exception:
pass
diff --git a/clearml/version.py b/clearml/version.py
index c162747f..476b0706 100644
--- a/clearml/version.py
+++ b/clearml/version.py
@@ -1 +1 @@
-__version__ = '1.14.1'
+__version__ = "1.14.4"
diff --git a/docs/clearml.conf b/docs/clearml.conf
index e7b045c5..09e3ecc3 100644
--- a/docs/clearml.conf
+++ b/docs/clearml.conf
@@ -92,6 +92,8 @@ sdk {
# Specify explicit keys
key: ""
secret: ""
+ # Specify profile
+ profile: ""
# Or enable credentials chain to let Boto3 pick the right credentials.
# This includes picking credentials from environment variables,
# credential file and IAM role using metadata service.
@@ -103,6 +105,7 @@ sdk {
credentials: [
# specifies key/secret credentials to use when handling s3 urls (read or write)
+ # Note that all fields in the global s3 config section are supported here
# {
# bucket: "my-bucket-name"
# key: "my-access-key"
diff --git a/docs/datasets.gif b/docs/datasets.gif
new file mode 100644
index 00000000..932893e4
Binary files /dev/null and b/docs/datasets.gif differ
diff --git a/docs/experiment_manager.gif b/docs/experiment_manager.gif
new file mode 100644
index 00000000..bd31a379
Binary files /dev/null and b/docs/experiment_manager.gif differ
diff --git a/docs/orchestration.gif b/docs/orchestration.gif
new file mode 100644
index 00000000..f8a7ba42
Binary files /dev/null and b/docs/orchestration.gif differ
diff --git a/docs/pipelines.gif b/docs/pipelines.gif
new file mode 100644
index 00000000..0b989978
Binary files /dev/null and b/docs/pipelines.gif differ
diff --git a/examples/advanced/requirements.txt b/examples/advanced/requirements.txt
index 5107c4eb..270fd233 100644
--- a/examples/advanced/requirements.txt
+++ b/examples/advanced/requirements.txt
@@ -1,3 +1,3 @@
torch>=1.1.0
torchvision>=0.3.0
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/automation/requirements.txt b/examples/automation/requirements.txt
index 6dac6a83..ad2bf345 100644
--- a/examples/automation/requirements.txt
+++ b/examples/automation/requirements.txt
@@ -1 +1 @@
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/cicd/requirements.txt b/examples/cicd/requirements.txt
index a3b31e82..544c593f 100644
--- a/examples/cicd/requirements.txt
+++ b/examples/cicd/requirements.txt
@@ -1,5 +1,5 @@
tqdm==4.64.1
-clearml==1.7.2
+clearml>=1.14.4
github3.py==3.2.0
tabulate==0.9.0
pandas==1.5.1
\ No newline at end of file
diff --git a/examples/datasets/requirements.txt b/examples/datasets/requirements.txt
index 5039f121..9f6ba766 100644
--- a/examples/datasets/requirements.txt
+++ b/examples/datasets/requirements.txt
@@ -4,4 +4,4 @@ torch>=1.1.0
torchvision>=0.3.0
pytorch-ignite
tqdm
-clearml
+clearml>=1.14.4
diff --git a/examples/datasets/urbansounds_dataset_preprocessing.py b/examples/datasets/urbansounds_dataset_preprocessing.py
new file mode 100644
index 00000000..7230afb9
--- /dev/null
+++ b/examples/datasets/urbansounds_dataset_preprocessing.py
@@ -0,0 +1,163 @@
+import os.path
+from pathlib import Path
+
+import matplotlib as mpl
+import numpy as np
+from tqdm import tqdm
+import torchaudio
+import torch
+from clearml import Task, Dataset
+
+task = Task.init(project_name="examples/Urbansounds", task_name="preprocessing")
+
+# Let's preprocess the data and create a new ClearML dataset from it, so we can keep track of it
+# The cool thing is, we can easily debug, by using, you guessed it: debug samples! We can log both
+# the original sound and its processed mel spectrogram as debug samples, so we can manually check
+# if everything went as planned.
+
+
+class PreProcessor:
+ def __init__(self):
+ self.configuration = {"number_of_mel_filters": 64, "resample_freq": 22050}
+ task.connect(self.configuration)
+
+ def preprocess_sample(self, sample, original_sample_freq):
+ if self.configuration["resample_freq"] > 0:
+ resample_transform = torchaudio.transforms.Resample(
+ orig_freq=original_sample_freq,
+ new_freq=self.configuration["resample_freq"],
+ )
+ sample = resample_transform(sample)
+
+ # This will convert audio files with two channels into one
+ sample = torch.mean(sample, dim=0, keepdim=True)
+
+ # Convert audio to log-scale Mel spectrogram
+ melspectrogram_transform = torchaudio.transforms.MelSpectrogram(
+ sample_rate=self.configuration["resample_freq"],
+ n_mels=self.configuration["number_of_mel_filters"],
+ )
+ melspectrogram = melspectrogram_transform(sample)
+ melspectogram_db = torchaudio.transforms.AmplitudeToDB()(melspectrogram)
+
+ # Make sure all spectrograms are the same size
+ fixed_length = 3 * (self.configuration["resample_freq"] // 200)
+ if melspectogram_db.shape[2] < fixed_length:
+ melspectogram_db = torch.nn.functional.pad(
+ melspectogram_db, (0, fixed_length - melspectogram_db.shape[2])
+ )
+ else:
+ melspectogram_db = melspectogram_db[:, :, :fixed_length]
+
+ return melspectogram_db
+
+
+class DataSetBuilder:
+ def __init__(self):
+ self.configuration = {"dataset_path": "dataset"}
+ task.connect(self.configuration)
+
+ self.original_dataset = Dataset.get(
+ dataset_project="examples/Urbansounds",
+ dataset_name="UrbanSounds example",
+ dataset_tags=["raw"],
+ alias="Raw Dataset",
+ )
+ # This will return the pandas dataframe we added in the previous task
+ self.metadata = (
+ Task.get_task(task_id=self.original_dataset._task.id)
+ .artifacts["metadata"]
+ .get()
+ )
+ # This will download the data and return a local path to the data
+ self.original_dataset_path = Path(
+ self.original_dataset.get_mutable_local_copy(
+ self.configuration["dataset_path"], overwrite=True
+ )
+ )
+
+ # Prepare a preprocessor that will handle each sample one by one
+ self.preprocessor = PreProcessor()
+
+ # Get ready for the new one
+ self.preprocessed_dataset = None
+
+ def log_dataset_statistics(self):
+ histogram_data = self.metadata["label"].value_counts()
+ self.preprocessed_dataset.get_logger().report_table(
+ title="Raw Dataset Metadata",
+ series="Raw Dataset Metadata",
+ table_plot=self.metadata,
+ )
+ self.preprocessed_dataset.get_logger().report_histogram(
+ title="Class distribution",
+ series="Class distribution",
+ values=histogram_data,
+ iteration=0,
+ xlabels=histogram_data.index.tolist(),
+ yaxis="Amount of samples",
+ )
+
+ def build_dataset(self):
+ # Let's create a new dataset that is a child of the original one
+ # We'll add the preprocessed samples to the original dataset, leading to a new version
+ # Providing the parent dataset allows us to keep a clear lineage of our data
+ self.preprocessed_dataset = Dataset.create(
+ dataset_name="UrbanSounds example",
+ dataset_project="examples/Urbansounds",
+ dataset_tags=["preprocessed"],
+ parent_datasets=[self.original_dataset.id],
+ )
+
+ # loop through the metadata entries and preprocess each sample, then add some of them as debug samples to
+ # manually double check in the UI that everything has worked (you can watch the spectrogram and listen to the
+ # audio side by side in the debug sample UI)
+ for i, (_, data) in tqdm(enumerate(self.metadata.iterrows())):
+ _, audio_file_path, label = data.tolist()
+ sample, sample_freq = torchaudio.load(
+ self.original_dataset_path / audio_file_path, normalize=True
+ )
+ spectrogram = self.preprocessor.preprocess_sample(sample, sample_freq)
+            # Get only the filename and replace the extension, we're saving a numpy array here
+ new_file_name = os.path.basename(audio_file_path).replace(".wav", ".npy")
+ # Get the correct folder, basically the original dataset folder + the new filename
+ spectrogram_path = (
+ self.original_dataset_path
+ / os.path.dirname(audio_file_path)
+ / new_file_name
+ )
+ # Save the numpy array to disk
+ np.save(spectrogram_path, spectrogram)
+
+ # Log every 10th sample as a debug sample to the UI, so we can manually check it
+ if i % 10 == 0:
+                # Convert the numpy array to a viewable RGB image
+ rgb_image = mpl.colormaps["viridis"](
+ spectrogram[0, :, :].detach().numpy() * 255
+ )[:, :, :3]
+ title = os.path.splitext(os.path.basename(audio_file_path))[0]
+
+ # Report the image and the original sound, so they can be viewed side by side
+ self.preprocessed_dataset.get_logger().report_image(
+ title=title, series="spectrogram", image=rgb_image
+ )
+ self.preprocessed_dataset.get_logger().report_media(
+ title=title,
+ series="original_audio",
+ local_path=self.original_dataset_path / audio_file_path,
+ )
+        # The original data path will now also have the spectrograms in its filetree.
+        # That's why we add it here, to populate the new dataset.
+ self.preprocessed_dataset.add_files(self.original_dataset_path)
+ # Again add some visualizations to the task
+ self.log_dataset_statistics()
+ # We still want the metadata
+ self.preprocessed_dataset._task.upload_artifact(
+ name="metadata", artifact_object=self.metadata
+ )
+ self.preprocessed_dataset.finalize(auto_upload=True)
+
+
+if __name__ == "__main__":
+ datasetbuilder = DataSetBuilder()
+ datasetbuilder.build_dataset()
diff --git a/examples/datasets/urbansounds_get_data.py b/examples/datasets/urbansounds_get_data.py
new file mode 100644
index 00000000..9f442077
--- /dev/null
+++ b/examples/datasets/urbansounds_get_data.py
@@ -0,0 +1,96 @@
+import pandas as pd
+from pathlib import Path
+from clearml import Task, Dataset, StorageManager
+
+task = Task.init(project_name="examples/Urbansounds", task_name="download data")
+
+configuration = {
+ "selected_classes": [
+ "air_conditioner",
+ "car_horn",
+ "children_playing",
+ "dog_bark",
+ "drilling",
+ "engine_idling",
+ "gun_shot",
+ "jackhammer",
+ "siren",
+ "street_music",
+ ]
+}
+task.connect(configuration)
+
+
+def get_urbansound8k():
+ # Download UrbanSound8K dataset (https://urbansounddataset.weebly.com/urbansound8k.html)
+ # For simplicity we will use here a subset of that dataset using clearml StorageManager
+ path_to_urbansound8k = StorageManager.get_local_copy(
+ "https://allegro-datasets.s3.amazonaws.com/clearml/UrbanSound8K.zip",
+ extract_archive=True,
+ )
+ path_to_urbansound8k_csv = (
+ Path(path_to_urbansound8k) / "UrbanSound8K" / "metadata" / "UrbanSound8K.csv"
+ )
+ path_to_urbansound8k_audio = Path(path_to_urbansound8k) / "UrbanSound8K" / "audio"
+
+ return path_to_urbansound8k_csv, path_to_urbansound8k_audio
+
+
+def log_dataset_statistics(dataset, metadata):
+ histogram_data = metadata["class"].value_counts()
+ dataset.get_logger().report_table(
+ title="Raw Dataset Metadata", series="Raw Dataset Metadata", table_plot=metadata
+ )
+ dataset.get_logger().report_histogram(
+ title="Class distribution",
+ series="Class distribution",
+ values=histogram_data,
+ iteration=0,
+ xlabels=histogram_data.index.tolist(),
+ yaxis="Amount of samples",
+ )
+
+
+def build_clearml_dataset():
+ # Get a local copy of both the data and the labels
+ path_to_urbansound8k_csv, path_to_urbansound8k_audio = get_urbansound8k()
+ urbansound8k_metadata = pd.read_csv(path_to_urbansound8k_csv)
+ # Subset the data to only include the classes we want
+ urbansound8k_metadata = urbansound8k_metadata[
+ urbansound8k_metadata["class"].isin(configuration["selected_classes"])
+ ]
+
+ # Create a pandas dataframe containing labels and other info we need later (fold is for train test split)
+ metadata = pd.DataFrame(
+ {
+ "fold": urbansound8k_metadata.loc[:, "fold"],
+ "filepath": (
+ "fold"
+ + urbansound8k_metadata.loc[:, "fold"].astype(str)
+ + "/"
+ + urbansound8k_metadata.loc[:, "slice_file_name"].astype(str)
+ ),
+ "label": urbansound8k_metadata.loc[:, "classID"],
+ }
+ )
+
+ # Now create a clearml dataset to start versioning our changes and make it much easier to get the right data
+ # in other tasks as well as on different machines
+ dataset = Dataset.create(
+ dataset_name="UrbanSounds example",
+ dataset_project="examples/Urbansounds",
+ dataset_tags=["raw"],
+ )
+
+ # Add the local files we downloaded earlier
+ dataset.add_files(path_to_urbansound8k_audio)
+ # Add the metadata in pandas format, we can now see it in the webUI and have it be easily accessible
+ dataset._task.upload_artifact(name="metadata", artifact_object=metadata)
+ # Let's add some cool graphs as statistics in the plots section!
+ log_dataset_statistics(dataset, urbansound8k_metadata)
+ # Finalize and upload the data and labels of the dataset
+ dataset.finalize(auto_upload=True)
+
+
+if __name__ == "__main__":
+ build_clearml_dataset()
diff --git a/examples/distributed/requirements.txt b/examples/distributed/requirements.txt
index 5107c4eb..270fd233 100644
--- a/examples/distributed/requirements.txt
+++ b/examples/distributed/requirements.txt
@@ -1,3 +1,3 @@
torch>=1.1.0
torchvision>=0.3.0
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/frameworks/autokeras/requirements.txt b/examples/frameworks/autokeras/requirements.txt
index cfee7f58..a86df558 100644
--- a/examples/frameworks/autokeras/requirements.txt
+++ b/examples/frameworks/autokeras/requirements.txt
@@ -1,2 +1,2 @@
autokeras ; python_version >= '3.7'
-clearml
+clearml>=1.14.4
diff --git a/examples/frameworks/catboost/requirements.txt b/examples/frameworks/catboost/requirements.txt
index e7efffb5..47fc59d5 100644
--- a/examples/frameworks/catboost/requirements.txt
+++ b/examples/frameworks/catboost/requirements.txt
@@ -1,4 +1,4 @@
catboost
numpy >= 1.19.2
scikit_learn
-clearml
+clearml>=1.14.4
diff --git a/examples/frameworks/click/requirements.txt b/examples/frameworks/click/requirements.txt
index df43bf8e..50dfeb39 100644
--- a/examples/frameworks/click/requirements.txt
+++ b/examples/frameworks/click/requirements.txt
@@ -1,3 +1,3 @@
click>=8.0
-clearml
+clearml>=1.14.4
diff --git a/examples/frameworks/fastai/legacy/requirements.txt b/examples/frameworks/fastai/legacy/requirements.txt
index e056d26c..4f63e887 100644
--- a/examples/frameworks/fastai/legacy/requirements.txt
+++ b/examples/frameworks/fastai/legacy/requirements.txt
@@ -1,4 +1,4 @@
fastai < 2.0.0
tensorboard
tensorboardX
-clearml
+clearml>=1.14.4
diff --git a/examples/frameworks/fastai/requirements.txt b/examples/frameworks/fastai/requirements.txt
index ee930fd2..ebc7503d 100644
--- a/examples/frameworks/fastai/requirements.txt
+++ b/examples/frameworks/fastai/requirements.txt
@@ -1,4 +1,4 @@
fastai >= 2.6.0
tensorboard
tensorboardX
-clearml
+clearml>=1.14.4
diff --git a/examples/frameworks/fire/requirements.txt b/examples/frameworks/fire/requirements.txt
index 59c7d019..79c6036b 100644
--- a/examples/frameworks/fire/requirements.txt
+++ b/examples/frameworks/fire/requirements.txt
@@ -1,2 +1,2 @@
-clearml
+clearml>=1.14.4
fire
diff --git a/examples/frameworks/hydra/requirements.txt b/examples/frameworks/hydra/requirements.txt
index 878e0c07..029addee 100644
--- a/examples/frameworks/hydra/requirements.txt
+++ b/examples/frameworks/hydra/requirements.txt
@@ -1,3 +1,3 @@
-clearml
+clearml>=1.14.4
hydra-core>=1.2.0
diff --git a/examples/frameworks/ignite/requirements.txt b/examples/frameworks/ignite/requirements.txt
index 831de90a..c90870cb 100644
--- a/examples/frameworks/ignite/requirements.txt
+++ b/examples/frameworks/ignite/requirements.txt
@@ -4,4 +4,4 @@ torch>=1.1.0
torchvision>=0.3.0
pytorch-ignite
tqdm
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/frameworks/keras/legacy/requirements.txt b/examples/frameworks/keras/legacy/requirements.txt
index f37621b1..4682a0e3 100644
--- a/examples/frameworks/keras/legacy/requirements.txt
+++ b/examples/frameworks/keras/legacy/requirements.txt
@@ -1,2 +1,2 @@
-clearml
+clearml>=1.14.4
Keras>=2.2.4
diff --git a/examples/frameworks/keras/requirements.txt b/examples/frameworks/keras/requirements.txt
index 9e45a014..68ee08c5 100644
--- a/examples/frameworks/keras/requirements.txt
+++ b/examples/frameworks/keras/requirements.txt
@@ -1,2 +1,2 @@
tensorflow>=2.0
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/frameworks/kerastuner/requirements.txt b/examples/frameworks/kerastuner/requirements.txt
index 4677be30..b53e6589 100644
--- a/examples/frameworks/kerastuner/requirements.txt
+++ b/examples/frameworks/kerastuner/requirements.txt
@@ -1,4 +1,4 @@
keras-tuner
tensorflow>=2.0
tensorflow-datasets
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/frameworks/lightgbm/requirements.txt b/examples/frameworks/lightgbm/requirements.txt
index 8508c428..4d34fd86 100644
--- a/examples/frameworks/lightgbm/requirements.txt
+++ b/examples/frameworks/lightgbm/requirements.txt
@@ -2,4 +2,4 @@ lightgbm
scikit-learn
pandas
matplotlib
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/frameworks/matplotlib/requirements.txt b/examples/frameworks/matplotlib/requirements.txt
index e74f84e2..7b7dbfab 100644
--- a/examples/frameworks/matplotlib/requirements.txt
+++ b/examples/frameworks/matplotlib/requirements.txt
@@ -2,4 +2,4 @@ numpy != 1.24.0 # https://github.com/numpy/numpy/issues/22826
matplotlib >= 3.1.1 ; python_version >= '3.6'
matplotlib >= 2.2.4 ; python_version < '3.6'
seaborn
-clearml
+clearml>=1.14.4
diff --git a/examples/frameworks/megengine/requirements.txt b/examples/frameworks/megengine/requirements.txt
index 75687027..8492f6ec 100644
--- a/examples/frameworks/megengine/requirements.txt
+++ b/examples/frameworks/megengine/requirements.txt
@@ -1,3 +1,3 @@
MegEngine ; python_version < '3.9'
tensorboardX
-clearml
+clearml>=1.14.4
diff --git a/examples/frameworks/openmmlab/requirements.txt b/examples/frameworks/openmmlab/requirements.txt
index fae81627..45580a05 100644
--- a/examples/frameworks/openmmlab/requirements.txt
+++ b/examples/frameworks/openmmlab/requirements.txt
@@ -1,4 +1,4 @@
-clearml
+clearml>=1.14.4
mmcv>=1.5.1,<2.0.0
torch
torchvision
diff --git a/examples/frameworks/pytorch-lightning/requirements.txt b/examples/frameworks/pytorch-lightning/requirements.txt
index 62e05989..ec0269a6 100644
--- a/examples/frameworks/pytorch-lightning/requirements.txt
+++ b/examples/frameworks/pytorch-lightning/requirements.txt
@@ -1,4 +1,4 @@
-clearml
+clearml>=1.14.4
pytorch-lightning >= 1.6.0
torch
torchvision
diff --git a/examples/frameworks/pytorch/requirements.txt b/examples/frameworks/pytorch/requirements.txt
index 7d2cdfe9..a7ae914d 100644
--- a/examples/frameworks/pytorch/requirements.txt
+++ b/examples/frameworks/pytorch/requirements.txt
@@ -1,4 +1,4 @@
-clearml
+clearml>=1.14.4
jsonschema==3.2.0 ; python_version <= '3.5'
matplotlib
pytorch-ignite
diff --git a/examples/frameworks/scikit-learn/requirements.txt b/examples/frameworks/scikit-learn/requirements.txt
index 07819fbf..0b7dd082 100644
--- a/examples/frameworks/scikit-learn/requirements.txt
+++ b/examples/frameworks/scikit-learn/requirements.txt
@@ -2,4 +2,4 @@ joblib>=0.13.2
matplotlib >= 3.1.1 ; python_version >= '3.6'
matplotlib >= 2.2.4 ; python_version < '3.6'
scikit-learn
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/frameworks/tensorboardx/requirements.txt b/examples/frameworks/tensorboardx/requirements.txt
index 108587ab..94f57783 100644
--- a/examples/frameworks/tensorboardx/requirements.txt
+++ b/examples/frameworks/tensorboardx/requirements.txt
@@ -2,4 +2,4 @@ tensorboardX>=1.8
torch>=1.1.0
torchvision>=0.3.0
moviepy
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/frameworks/tensorflow/requirements.txt b/examples/frameworks/tensorflow/requirements.txt
index 2492b674..86f419be 100644
--- a/examples/frameworks/tensorflow/requirements.txt
+++ b/examples/frameworks/tensorflow/requirements.txt
@@ -2,4 +2,4 @@ numpy != 1.24.0 # https://github.com/numpy/numpy/issues/22826
absl-py>=0.7.1
tensorboard>=2.0
tensorflow>=2.0
-clearml
+clearml>=1.14.4
diff --git a/examples/frameworks/xgboost/requirements.txt b/examples/frameworks/xgboost/requirements.txt
index 71169b2d..6eb0a2ba 100644
--- a/examples/frameworks/xgboost/requirements.txt
+++ b/examples/frameworks/xgboost/requirements.txt
@@ -2,7 +2,7 @@ numpy != 1.24.0 # https://github.com/numpy/numpy/issues/22826
matplotlib >= 3.1.1 ; python_version >= '3.6'
matplotlib >= 2.2.4 ; python_version < '3.6'
scikit-learn
-clearml
+clearml>=1.14.4
xgboost>=0.90 ; python_version >= '3'
xgboost>=0.82 ; python_version < '3'
# sudo apt-get install graphviz
diff --git a/examples/hyperdatasets/requirements.txt b/examples/hyperdatasets/requirements.txt
index a021820d..94393694 100644
--- a/examples/hyperdatasets/requirements.txt
+++ b/examples/hyperdatasets/requirements.txt
@@ -1,5 +1,5 @@
allegroai~=3.5.7
-clearml
+clearml>=1.14.4
numpy
Pillow
torch
diff --git a/examples/optimization/hyper-parameter-optimization/requirements.txt b/examples/optimization/hyper-parameter-optimization/requirements.txt
index 770f214c..ae5af43a 100644
--- a/examples/optimization/hyper-parameter-optimization/requirements.txt
+++ b/examples/optimization/hyper-parameter-optimization/requirements.txt
@@ -1,3 +1,3 @@
keras
tensorflow
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/pipeline/requirements.txt b/examples/pipeline/requirements.txt
index 788f94d0..cdeb8ab9 100644
--- a/examples/pipeline/requirements.txt
+++ b/examples/pipeline/requirements.txt
@@ -3,4 +3,4 @@ matplotlib >= 3.1.1 ; python_version >= '3.6'
matplotlib >= 2.2.4 ; python_version < '3.6'
scikit-learn
pandas
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/reporting/requirements.txt b/examples/reporting/requirements.txt
index 0b7c42fc..bb9393a3 100644
--- a/examples/reporting/requirements.txt
+++ b/examples/reporting/requirements.txt
@@ -1,5 +1,5 @@
bokeh>=1.4.0
-clearml
+clearml>=1.14.4
matplotlib >= 3.1.1 ; python_version >= '3.6'
matplotlib >= 2.2.4 ; python_version < '3.6'
numpy != 1.24.0 # https://github.com/numpy/numpy/issues/22826
diff --git a/examples/scheduler/requirements.txt b/examples/scheduler/requirements.txt
index 6dac6a83..ad2bf345 100644
--- a/examples/scheduler/requirements.txt
+++ b/examples/scheduler/requirements.txt
@@ -1 +1 @@
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/services/aws-autoscaler/requirements.txt b/examples/services/aws-autoscaler/requirements.txt
index ae1e1883..65830dcd 100644
--- a/examples/services/aws-autoscaler/requirements.txt
+++ b/examples/services/aws-autoscaler/requirements.txt
@@ -1,5 +1,5 @@
boto3
pyYaml
six
-clearml
+clearml>=1.14.4
pathlib2
diff --git a/examples/services/cleanup/requirements.txt b/examples/services/cleanup/requirements.txt
index 6dac6a83..ad2bf345 100644
--- a/examples/services/cleanup/requirements.txt
+++ b/examples/services/cleanup/requirements.txt
@@ -1 +1 @@
-clearml
\ No newline at end of file
+clearml>=1.14.4
\ No newline at end of file
diff --git a/examples/services/monitoring/requirements.txt b/examples/services/monitoring/requirements.txt
index 89296b93..93395c35 100644
--- a/examples/services/monitoring/requirements.txt
+++ b/examples/services/monitoring/requirements.txt
@@ -1,2 +1,2 @@
-clearml
+clearml>=1.14.4
slack_sdk > 3.0.0