clearml/examples/distributed/subprocess_example.py

# TRAINS - example of multiple sub-processes interacting and reporting to a single master experiment

import multiprocessing
import os
import subprocess
import sys
import time
from argparse import ArgumentParser

from trains import Task

# Fake work items for the pool: each entry is [label, seconds-to-sleep],
# both kept as strings (the worker converts the delay with int()).
data = (
    ['a', '2'],
    ['b', '4'],
    ['c', '6'],
    ['d', '8'],
    ['e', '1'],
    ['f', '3'],
    ['g', '5'],
    ['h', '7'],
)


def mp_worker(arguments):
    """Pool worker: register a random parameter on the current task, then sleep.

    :param arguments: a two-item sequence ``(label, seconds)``; ``seconds`` is
        passed through ``int()`` before sleeping.
    """
    print('sub process', os.getpid())
    label, delay = arguments
    from random import randint

    # Randomised key/value so that parameters connected from different
    # workers are unlikely to share a name.
    key = 'stuff_' + str(randint(0, 100))
    value = 'some stuff ' + str(randint(0, 100))
    Task.current_task().connect({key: value})

    print(" Process %s\tWaiting %s seconds" % (label, delay))
    time.sleep(int(delay))
    print(" Process %s\tDONE" % label)


def mp_handler(use_subprocess):
    """Run ``mp_worker`` over every entry of ``data`` with a pool of 4 workers.

    :param use_subprocess: truthy to use a process pool (``multiprocessing.Pool``),
        falsy to use a thread pool (``multiprocessing.pool.ThreadPool``).
    """
    if use_subprocess:
        pool = multiprocessing.Pool(4)
    else:
        # `import multiprocessing` does not guarantee that the `pool` submodule
        # is loaded, so `multiprocessing.pool.ThreadPool` may raise
        # AttributeError; import the class explicitly instead.
        from multiprocessing.pool import ThreadPool
        pool = ThreadPool(4)

    try:
        pool.map(mp_worker, data)
    finally:
        # Always release the workers, even if a task raised: close() stops new
        # submissions and join() waits for the workers to exit cleanly.
        pool.close()
        pool.join()
    print('DONE main !!!')


if __name__ == '__main__':
    cli = ArgumentParser()
    cli.add_argument('--num_workers', type=int, default=3, help='integer value')
    cli.add_argument('--use_subprocess', type=int, default=1, help='integer value')
    # `--counter` is intentionally not logged, see the Task.init call below
    cli.add_argument('--counter', type=int, default=-1, help='integer value')

    opts = cli.parse_args()
    print(os.getpid(), 'ARGS:', opts)

    # The task has to be initialized in the master process; this makes sure
    # that any sub-process calling Task.init gets the master task object.
    # The `counter` argument is excluded from auto-connection so that multiple
    # sub-processes can be launched with trains-agent; otherwise `counter`
    # would always be set to its original value.
    task = Task.init('examples', 'Popen example', auto_connect_arg_parser={'counter': False})

    # Several dictionaries can be connected, each from a different process,
    # as long as their keys have different names.
    task.connect({'args_{}'.format(opts.num_workers): 'some value {}'.format(opts.num_workers)})

    # A negative counter means this is the first invocation of the chain,
    # so start counting down from `num_workers`.
    if opts.counter < 0:
        counter = opts.num_workers
    else:
        counter = opts.counter

    # Launch the next sub-process in the chain; each one launches its own
    # successor until all of them are running.
    # We could also launch all of them from here, but that would have been
    # too simple for us :)
    child = None
    if counter > 0:
        cmd = [
            sys.executable, sys.argv[0],
            '--counter', str(counter - 1),
            '--num_workers', str(opts.num_workers),
            '--use_subprocess', str(opts.use_subprocess),
        ]
        print(cmd)
        child = subprocess.Popen(cmd, cwd=os.getcwd())

    # the actual "processing" is done here
    mp_handler(opts.use_subprocess)
    print('Done logging')

    # Wait for the process we launched (if any). Every sub-process waits for
    # the one it launched, so the master process exits only after all of them
    # have completed.
    if child is not None:
        child.wait()
    print('Exiting')
Added distributed examples 2020-05-24 12:37:55 +00:00			`# TRAINS - example of multiple sub-processes interacting and reporting to a single master experiment`

			`import multiprocessing`
			`import os`
			`import subprocess`
			`import sys`
			`import time`
			`from argparse import ArgumentParser`

			`from trains import Task`

Improve example documentation 2020-05-24 12:47:52 +00:00			`# fake data for us to "process"`
Added distributed examples 2020-05-24 12:37:55 +00:00			`data = (`
			`['a', '2'], ['b', '4'], ['c', '6'], ['d', '8'],`
			`['e', '1'], ['f', '3'], ['g', '5'], ['h', '7'],`
			`)`


			`def mp_worker(arguments):`
			`print('sub process', os.getpid())`
			`inputs, the_time = arguments`
			`from random import randint`
			`additional_parameters = {'stuff_' + str(randint(0, 100)): 'some stuff ' + str(randint(0, 100))}`
			`Task.current_task().connect(additional_parameters)`
			`print(" Process %s\tWaiting %s seconds" % (inputs, the_time))`
			`time.sleep(int(the_time))`
			`print(" Process %s\tDONE" % inputs)`


			`def mp_handler(use_subprocess):`
			`if use_subprocess:`
			`process = multiprocessing.Pool(4)`
			`else:`
			`process = multiprocessing.pool.ThreadPool(4)`
			`process.map(mp_worker, data)`
			`process.close()`
			`print('DONE main !!!')`


			`if __name__ == '__main__':`
			`parser = ArgumentParser()`
			`parser.add_argument('--num_workers', help='integer value', type=int, default=3)`
			`parser.add_argument('--use_subprocess', help='integer value', type=int, default=1)`
Improve example documentation 2020-05-24 12:47:52 +00:00			`# this argument we will not be logging, see below Task.init`
			`parser.add_argument('--counter', help='integer value', type=int, default=-1)`
Added distributed examples 2020-05-24 12:37:55 +00:00
			`args = parser.parse_args()`
			`print(os.getpid(), 'ARGS:', args)`

			`# We have to initialize the task in the master process,`
			`# it will make sure that any sub-process calling Task.init will get the master task object`
Improve example documentation 2020-05-24 12:47:52 +00:00			# notice that we exclude the `counter` argument, so we can launch multiple sub-processes with trains-agent
			# otherwise, the `counter` will always be set to the original value.
			`task = Task.init('examples', 'Popen example', auto_connect_arg_parser={'counter': False})`
Added distributed examples 2020-05-24 12:37:55 +00:00
			`# we can connect multiple dictionaries, each from different process, as long as the keys have different names`
			`param = {'args_{}'.format(args.num_workers): 'some value {}'.format(args.num_workers)}`
			`task.connect(param)`

			`# check if we need to start the process, meaning counter is negative`
			`counter = args.num_workers if args.counter < 0 else args.counter`

			`p = None`
Improve example documentation 2020-05-24 12:47:52 +00:00			`# launch sub-process, every subprocess will launch the next in the chain, until we launch them all.`
			`# We could also launch all of them here, but that would have been to simple for us J`
Added distributed examples 2020-05-24 12:37:55 +00:00			`if counter > 0:`
			`cmd = [sys.executable, sys.argv[0],`
			`'--counter', str(counter - 1),`
			`'--num_workers', str(args.num_workers),`
			`'--use_subprocess', str(args.use_subprocess)]`
			`print(cmd)`
			`p = subprocess.Popen(cmd, cwd=os.getcwd())`

Improve example documentation 2020-05-24 12:47:52 +00:00			`# the actual "processing" is done here`
Added distributed examples 2020-05-24 12:37:55 +00:00			`mp_handler(args.use_subprocess)`
			`print('Done logging')`
Improve example documentation 2020-05-24 12:47:52 +00:00
			`# wait for the process we launched`
			`# this means every subprocess will be waiting for the process it launched and`
			`# the master process will exit after all of them are completed`
Added distributed examples 2020-05-24 12:37:55 +00:00			`if p and counter > 0:`
			`p.wait()`
			`print('Exiting')`