
Threading and parallel processing

The Python language has built-in support for multi-threading in the threading module, and true parallelism in the multiprocessing module. If you want to be impressed, skip straight to the section on multiprocessing.

Note: This notebook covers features that are built-in to the Python programming language. However, there are many other parallelisation options available to you through third-party libraries - some of them are covered in applications/parallel/parallel.ipynb.

Note: If you are familiar with a "real" programming language such as C++ or Java, you might be disappointed with the native support for parallelism in Python. Python threads do not run in parallel because of the Global Interpreter Lock, and if you use multiprocessing, be prepared to either bear the performance hit of copying data between processes, or jump through hoops in order to share data between processes.

This limitation is being addressed in recent Python versions, with Free-threaded Python builds, which will hopefully soon become the default behaviour.

Threading

The threading module provides a traditional multi-threading API that should be familiar to you if you have worked with threads in other languages.

Running a task in a separate thread in Python is easy - simply create a Thread object, and pass it the function or method that you want it to run. Then call its start method:

import time
import threading

def longRunningTask(niters):
    for i in range(niters):
        if i % 2 == 0: print('Tick')
        else:          print('Tock')
        time.sleep(0.5)

t = threading.Thread(target=longRunningTask, args=(8,))

t.start()

while t.is_alive():
    time.sleep(0.4)
    print('Waiting for thread to finish...')
print('Finished!')

You can also join a thread, which will block execution in the current thread until the thread that has been joined has finished:

t = threading.Thread(target=longRunningTask, args=(6, ))
t.start()

print('Joining thread ...')
t.join()
print('Finished!')

Subclassing Thread

It is also possible to sub-class the Thread class, and override its run method:

class LongRunningThread(threading.Thread):
    def __init__(self, niters, *args, **kwargs):
        super().__init__(*args, **kwargs)
        self.niters = niters

    def run(self):
        for i in range(self.niters):
            if i % 2 == 0: print('Tick')
            else:          print('Tock')
            time.sleep(0.5)

t = LongRunningThread(6)
t.start()
t.join()
print('Done')

Daemon threads

By default, a Python application will not exit until all active threads have finished execution. If you want to run a task in the background for the duration of your application, you can mark it as a daemon thread - when all non-daemon threads in a Python application have finished, all daemon threads will be halted, and the application will exit.

You can mark a thread as being a daemon by setting an attribute on it after creation:

t = threading.Thread(target=longRunningTask, args=(8,))
t.daemon = True
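
You can also pass daemon=True to the Thread constructor. For example, here is a minimal sketch of a background task which is halted when the main thread finishes (the behaviour is most obvious when run as a standalone script, rather than in a notebook):

import time
import threading

def backgroundTask():
    # This loop runs forever, but because the
    # thread is a daemon, it is halted as soon
    # as all non-daemon threads have finished
    while True:
        print('Background tick')
        time.sleep(0.5)

t = threading.Thread(target=backgroundTask, daemon=True)
t.start()

time.sleep(2)
print('Main thread finished - daemon thread will be halted')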

See the Thread documentation for more details.

Thread synchronisation

The threading module provides some useful thread-synchronisation primitives - the Lock, RLock (re-entrant Lock), and Event classes. The threading module also provides Condition and Semaphore classes - refer to the documentation for more details.

Lock

The Lock class (and its re-entrant version, the RLock) prevents a block of code from being accessed by more than one thread at a time. For example, if we have multiple threads running this task function, their outputs will inevitably become intertwined:

def task():
    for i in range(5):
        print(f'{i} Woozle ', end='')
        time.sleep(0.1)
        print('Wuzzle')

threads = [threading.Thread(target=task) for i in range(5)]
for t in threads:
    t.start()

But if we protect the critical section with a Lock object, the output will look more sensible:

lock = threading.Lock()

def task():

    for i in range(5):
        with lock:
            print(f'{i} Woozle ', end='')
            time.sleep(0.1)
            print('Wuzzle')

threads = [threading.Thread(target=task) for i in range(5)]
for t in threads:
    t.start()

Instead of using a Lock object in a with statement, it is also possible to manually call its acquire and release methods:

def task():
    for i in range(5):
        lock.acquire()
        print(f'{i} Woozle ', end='')
        time.sleep(0.1)
        print('Wuzzle')
        lock.release()
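
If you do manage a Lock manually, it is a good idea to use a try/finally block, so that the lock is always released even if an error occurs - a minimal sketch:

def task():
    for i in range(5):
        lock.acquire()
        try:
            print(f'{i} Woozle ', end='')
            time.sleep(0.1)
            print('Wuzzle')
        finally:
            # The lock is released even if an
            # exception is raised above
            lock.release()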

Python does not have any built-in constructs to implement Lock-based mutual exclusion across several functions or methods - each function/method must explicitly acquire/release a shared Lock instance. However, it is relatively straightforward to implement a decorator which does this for you:

def mutex(func, lock):
    def wrapper(*args, **kwargs):
        with lock:
            return func(*args, **kwargs)
    return wrapper

class MyClass(object):

    def __init__(self):
        lock = threading.Lock()
        self.safeFunc1 = mutex(self.safeFunc1, lock)
        self.safeFunc2 = mutex(self.safeFunc2, lock)

    def safeFunc1(self):
        time.sleep(0.1)
        print('safeFunc1 start')
        time.sleep(0.2)
        print('safeFunc1 end')

    def safeFunc2(self):
        time.sleep(0.1)
        print('safeFunc2 start')
        time.sleep(0.2)
        print('safeFunc2 end')

mc = MyClass()

f1threads = [threading.Thread(target=mc.safeFunc1) for i in range(4)]
f2threads = [threading.Thread(target=mc.safeFunc2) for i in range(4)]

for t in f1threads + f2threads:
    t.start()

Try removing the mutex lock from the two methods in the above code, and see what it does to the output.

Event

The Event class is essentially a boolean semaphore. It can be used to signal events between threads. Threads can wait on the event, and be awoken when the event is set by another thread:

import numpy as np

processingFinished = threading.Event()

def processData(data):
    print('Processing data ...')
    time.sleep(2)
    print('Result:', data.mean())
    processingFinished.set()

data = np.random.randint(1, 100, 100)

t = threading.Thread(target=processData, args=(data,))
t.start()

processingFinished.wait()
print('Processing finished!')

The Global Interpreter Lock (GIL)

The Global Interpreter Lock is an implementation detail of CPython (the official Python interpreter). The GIL means that a multi-threaded program written in pure Python is not able to take advantage of multiple cores - this essentially means that only one thread may be executing at any point in time.

Note that this is likely to change in future Python releases, with the development of Free-threaded Python.

The threading module does still have its uses though, as the GIL is typically released during calls to system routines and natively compiled libraries (e.g. file and network I/O, many Numpy operations, etc.). So you can, for example, perform some expensive processing on a Numpy array in a thread running on one core, whilst having another thread (e.g. user interaction) running on another core.
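
For example, here is a minimal sketch which uses time.sleep as a stand-in for an I/O-bound (GIL-releasing) task - the four tasks complete in roughly the time taken by one:

import time
import threading

def ioBoundTask(name):
    # time.sleep releases the GIL, just as file/network
    # I/O and many Numpy operations do
    time.sleep(2)
    print(f'{name} finished')

start   = time.time()
threads = [threading.Thread(target=ioBoundTask, args=(f'task {i}',))
           for i in range(4)]

for t in threads: t.start()
for t in threads: t.join()

# Roughly 2 seconds, not 8, because the threads spend
# their time waiting rather than executing Python bytecode
print(f'Elapsed: {time.time() - start:0.2f} seconds')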

Multiprocessing

For true parallelism, you should check out the multiprocessing module.

The multiprocessing module spawns sub-processes, rather than threads, and so is not subject to the GIL constraints that the threading module suffers from. It provides two APIs - a "traditional" equivalent to that provided by the threading module, and a powerful higher-level API.

Python also provides the concurrent.futures module, which offers a simpler alternative API to multiprocessing. It offers no additional functionality over multiprocessing, so it is not covered here.

threading-equivalent API

The Process class is the multiprocessing equivalent of the threading.Thread class. multiprocessing also has equivalents of the Lock and Event classes, and the other synchronisation primitives provided by threading.

So you can simply replace threading.Thread with multiprocessing.Process, and you will have true parallelism.

Because your "threads" are now independent processes, you need to be a little careful about how to share information across them. If you only need to share small amounts of data, you can use the Queue and Pipe classes, in the multiprocessing module. If you are working with large amounts of data where copying between processes is not feasible, things become more complicated, but read on...

Higher-level API - the multiprocessing.Pool

The real advantages of multiprocessing lie in its higher level API, centered around the Pool class.

Essentially, you create a Pool of worker processes - you specify the number of processes when you create the pool. Once you have created a Pool, you can use its methods to automatically parallelise tasks. The most useful are the map, starmap and apply_async methods.

The Pool class is a context manager, so can be used in a with statement, e.g.:

with mp.Pool(processes=16) as pool:
    # do stuff with the pool

It is possible to create a Pool outside of a with statement, but in this case you must ensure that you call its close method when you are finished. Using a Pool in a with statement is therefore recommended, because you know that it will be shut down correctly, even in the event of an error.
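
For example, a minimal sketch of managing a Pool manually (some_task and items are hypothetical stand-ins for your own function and input sequence):

import multiprocessing as mp

pool = mp.Pool(processes=16)
try:
    # some_task and items are hypothetical stand-ins
    # for your own function and input sequence
    results = pool.map(some_task, items)
finally:
    # close() stops the pool from accepting new jobs,
    # and join() waits for the worker processes to exit
    pool.close()
    pool.join()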

The best number of processes to use for a Pool will depend on the system you are running on (number of cores), and the tasks you are running (e.g. I/O bound or CPU bound). If you do not specify the number of processes when creating a Pool, it will default to the number of cores on your machine.

Pool.map

The Pool.map method is the multiprocessing equivalent of the built-in map function - it is given a function, and a sequence, and it applies the function to each element in the sequence.

import                    time
import multiprocessing as mp
import numpy           as np

def crunchImage(imgfile):

    # Load a nifti image and calculate some
    # metric from the image. Use your
    # imagination to fill in this function.
    time.sleep(2)
    np.random.seed()
    result = np.random.randint(1, 100, 1)[0]

    return result


imgfiles = [f'{i:02d}.nii.gz' for i in range(20)]

print(f'Crunching {len(imgfiles)} images...')

start = time.time()

with mp.Pool(processes=16) as p:
    results = p.map(crunchImage, imgfiles)

end = time.time()

for imgfile, result in zip(imgfiles, results):
    print(f'Result for {imgfile}: {result}')

print('Total execution time: {:0.2f} seconds'.format(end - start))

The Pool.map method only works with functions that accept one argument, such as our crunchImage function above. If you have a function which accepts multiple arguments, use the Pool.starmap method instead:

def crunchImage(imgfile, modality):
    time.sleep(2)

    np.random.seed()

    if modality == 't1':
        result = np.random.randint(1, 100, 1)
    elif modality == 't2':
        result = np.random.randint(100, 200, 1)

    return result[0]


imgfiles   = [f't1_{i:02d}.nii.gz' for i in range(10)] + \
             [f't2_{i:02d}.nii.gz' for i in range(10)]
modalities = ['t1'] * 10 + ['t2'] * 10

args = [(f, m) for f, m in zip(imgfiles, modalities)]

print('Crunching images...')

start = time.time()

with mp.Pool(processes=16) as pool:
    results = pool.starmap(crunchImage, args)

end = time.time()

for imgfile, modality, result in zip(imgfiles, modalities, results):
    print(f'{imgfile} [{modality}]: {result}')

print('Total execution time: {:0.2f} seconds'.format(end - start))

The map and starmap methods also have asynchronous equivalents map_async and starmap_async, which return immediately. Refer to the Pool documentation for more details.
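
For example, a minimal sketch which re-uses the crunchImage function and args list from the example above:

with mp.Pool(processes=16) as pool:

    # starmap_async returns immediately, giving us an
    # AsyncResult object which we can query later
    async_result = pool.starmap_async(crunchImage, args)

    # ... do other work while the jobs are running ...

    # get() blocks until all of the jobs have
    # finished, and returns the list of results
    results = async_result.get()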

Pool.apply_async

The Pool.apply method will execute a function on one of the processes, and block until it has finished. The Pool.apply_async method returns immediately, and is thus more suited to asynchronously scheduling multiple jobs to run in parallel.

apply_async returns an object of type AsyncResult. An AsyncResult object has wait and get methods which will block until the job has completed.

import                    time
import multiprocessing as mp
import numpy           as np


def linear_registration(src, ref):
    time.sleep(1)
    return np.eye(4)


def nonlinear_registration(src, ref, affine):

    time.sleep(3)

    # this number represents a non-linear warp
    # field - use your imagination people!
    np.random.seed()
    return np.random.randint(1, 100, 1)[0]


t1s = [f'{i:02d}_t1.nii.gz' for i in range(20)]
std = 'MNI152_T1_2mm.nii.gz'

print('Running structural-to-standard registration '
      f'on {len(t1s)} subjects...')


# Run linear registration on all the T1s.
start = time.time()
with mp.Pool(processes=16) as pool:

    # We build a list of AsyncResult objects
    linresults = [pool.apply_async(linear_registration, (t1, std))
                  for t1 in t1s]

    # Then we wait for each job to finish,
    # and replace its AsyncResult object
    # with the actual result - an affine
    # transformation matrix.
    for i, r in enumerate(linresults):
        linresults[i] = r.get()


end = time.time()

print('Linear registrations completed in '
      f'{end - start:0.2f} seconds')


# Run non-linear registration on all the T1s,
# using the linear registrations to initialise.
start = time.time()
with mp.Pool(processes=16) as pool:
    nlinresults = [pool.apply_async(nonlinear_registration, (t1, std, aff))
                   for (t1, aff) in zip(t1s, linresults)]

    # Wait for each non-linear reg to finish,
    # and store the resulting warp field.
    for i, r in enumerate(nlinresults):
        nlinresults[i] = r.get()


end = time.time()

print('Non-linear registrations completed in '
      '{:0.2f} seconds'.format(end - start))

print('Non linear registrations:')
for t1, result in zip(t1s, nlinresults):
    print(f'{t1} : {result}')

Sharing data between processes

When you use the Pool.map method (or any of the other methods we have shown) to run a function on a sequence of items, those items must be copied into the memory of each of the child processes. When the child processes are finished, the data that they return then has to be copied back to the parent process.

Any items which you wish to pass to a function that is executed by a Pool must be pickleable1 - the built-in pickle module is used by multiprocessing to serialise and de-serialise the data passed to and returned from a child process. The majority of standard Python types (list, dict, str etc), and Numpy arrays can be pickled and unpickled, so you only need to worry about this detail if you are passing objects of a custom type (e.g. instances of classes that you have written, or that are defined in some third-party library).

1Pickleable is the term used in the Python world to refer to something that is serialisable - basically, the process of converting an in-memory object into a binary form that can be stored and/or transmitted, and then loaded back into memory at some point in the future (in the same process, or in another process).
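
As an illustrative sketch of what pickling involves (multiprocessing does this for you behind the scenes):

import pickle
import numpy as np

payload    = {'name' : 'subject01', 'data' : np.arange(5)}

# dumps converts the object into bytes which can be
# written to disk, or sent to another process ...
serialised = pickle.dumps(payload)

# ... and loads rebuilds an equivalent object in memory
restored   = pickle.loads(serialised)

print(restored['name'], restored['data'])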

There is obviously some overhead in copying data back and forth between the main process and the worker processes; this may or may not be a problem. For most computationally intensive tasks, this communication overhead is not important - the performance bottleneck is typically going to be the computation time, rather than I/O between the parent and child processes.

However, if you are working with a large data set, where copying it between processes is not viable, you have a couple of options available to you.

Memory-mapping

One method for sharing a large numpy array between multiple processes is to use a memory-mapped array. This is a feature built into numpy which stores your data in a regular file, instead of in memory. This allows your data to be simultaneously read and written by multiple processes, and is fairly straightforward to accomplish.

For example, let's say you have some 4D fMRI data, and wish to fit a complicated model to the time series at each voxel. First we will load our 4D data, and pre-allocate another array to store the fitted model parameters:

import                    time
import functools       as ft
import multiprocessing as mp
import numpy           as np

# Store the parameters that are required
# to create our memory-mapped arrays, as
# we need to re-use them a couple of times.
#
# Note that in practice you would usually
# want to store these files in a temporary
# directory, and/or ensure that they are
# deleted once you are finished.
data_params  = dict(filename='data.mmap',  shape=(91, 109, 91, 50), dtype=np.float32)
model_params = dict(filename='model.mmap', shape=(91, 109, 91),     dtype=np.float32)

# Load our data as a memory-mapped array (we
# are using random data for this example)
data    = np.memmap(**data_params, mode='w+')
data[:] = np.random.random((91, 109, 91, 50)).astype(np.float32)
data.flush()

# Pre-allocate space to store the fitted
# model parameters
model = np.memmap(**model_params, mode='w+')

If your image files are uncompressed (i.e. .nii rather than .nii.gz), you can instruct nibabel and fslpy to load them as a memory-map by passing mmap=True to the nibabel.load function, and the fsl.data.image.Image constructor.
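
For example, a minimal sketch (assuming an uncompressed image called subject.nii exists):

import nibabel as nib

# mmap=True requests memory-mapped access to the image
# data (only possible for uncompressed files)
img = nib.load('subject.nii', mmap=True)

# Accessing the data through the dataobj attribute reads
# from the memory-map, rather than loading the entire
# image into memory
first_vol = img.dataobj[..., 0]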

Now we will write our model fitting function so that it works on one slice at a time - this will allow us to process multiple slices in parallel. Note that, within this function, we have to re-open the memory-mapped arrays. We have therefore written the function to expect the arguments required to create the two memory-maps (the data_params and model_params dictionaries that we created above) to be passed in:

def fit_model(indata, outdata, sliceidx):

    indata  = np.memmap(**indata,  mode='r')
    outdata = np.memmap(**outdata, mode='r+')

    # sleep to simulate expensive model fitting
    print(f'Fitting model at slice {sliceidx}')
    time.sleep(1)
    outdata[:, :, sliceidx] = indata[:, :, sliceidx, :].mean() + sliceidx

Now we can use multiprocessing to fit the model in parallel across all of the image slices:

fit_function = ft.partial(fit_model, data_params, model_params)
slice_idxs   = list(range(91))

with mp.Pool(processes=16) as pool:
    pool.map(fit_function, slice_idxs)

print(model)

Read-only sharing

If you are working with a large dataset, have determined that copying data between processes is having a substantial impact on your performance, and have also decided that memory-mapping is not an option for you, then in order to share a single copy of the data between the processes you will need to:

  1. Structure your code so that the data you want to share is accessible at the module level.
  2. Define/create/load the data before creating the Pool.

This is because, when you create a Pool, the process that your Python script is running in forks itself - the child processes that are created are used as the worker processes by the Pool. If you create/load your data in your main process before this fork occurs, all of the child processes will inherit the memory space of the main process, and will therefore have (read-only) access to the data, without any copying required. Note that this relies on the fork start method, which is the default on Linux - on Windows and recent macOS versions the default start method is spawn, where child processes do not inherit the parent's memory in this way.
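
If you want to check (or change) the start method being used on your platform, you can do so through the multiprocessing module - for example:

import multiprocessing as mp

# 'fork' is the default on Linux; Windows and recent
# macOS versions default to 'spawn', where child
# processes do not inherit the parent's memory
print(mp.get_start_method())

# The start method can be changed once, early in your
# program, if your platform supports it, e.g.:
# mp.set_start_method('fork')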

Let's see this in action with a simple example. We'll start by defining a horrible little helper function which allows us to track the total memory usage:

import sys
import subprocess as sp
def memusage(msg):
    if sys.platform == 'darwin':
        total = sp.run(['sysctl', 'hw.memsize'], capture_output=True).stdout.decode()
        total = int(total.split()[1]) // 1048576
        usage = sp.run('vm_stat', capture_output=True).stdout.decode()
        usage = usage.strip().split('\n')
        usage = [l.split(':') for l in usage]
        usage = {k.strip() : v.strip() for k, v in usage}
        usage = int(usage['Pages free'][:-1]) / 256.0
        usage = int(total - usage)
    else:
        stdout = sp.run(['free', '--mega'], capture_output=True).stdout.decode()
        stdout = stdout.split('\n')[1].split()
        total  = int(stdout[1])
        usage  = int(stdout[2])
    print(f'Memory usage {msg}: {usage} / {total} MB')

Now our task is simply to calculate the sum of a large array of numbers. We're going to create a big chunk of data, and process it in chunks, keeping track of memory usage as the task progresses:

import                    time
import multiprocessing as mp
import numpy           as np

memusage('before creating data')

# allocate 500MB of data
data = np.random.random(500 * (1048576 // 8))

# Assign nelems values to each worker
# process (hard-coded so we need 12
# jobs to complete the task)
nelems =  len(data) // 12

memusage('after creating data')

# Each job processes nelems values,
# starting from the specified offset
def process_chunk(offset):
    time.sleep(1)
    return data[offset:offset + nelems].sum()

# Generate an offset into the data for each job -
# we will call process_chunk for each offset
offsets = range(0, len(data), nelems)

# Create our worker process pool
with mp.Pool(4) as pool:

    results = pool.map_async(process_chunk, offsets)

    # Wait for all of the jobs to finish
    elapsed = 0
    while not results.ready():
        memusage(f'after {elapsed} seconds')
        time.sleep(1)
        elapsed += 1

    results = results.get()

print('Total sum:   ', sum(results))
print('Sanity check:', data.sum())

You should be able to see that only one copy of data is created, and is shared by all of the worker processes without any copying taking place.

So things are reasonably straightforward if you only need read-only access to your data. But what if your worker processes need to be able to modify the data? Go back to the code block above and:

  1. Modify the process_chunk function so that it modifies every element of its assigned portion of the data before the call to time.sleep. For example:

    data[offset:offset + nelems] += 1
  2. Restart the Jupyter notebook kernel (Kernel -> Restart) - this example is somewhat dependent on the behaviour of the Python garbage collector, so it helps to start afresh

  3. Re-run the two code blocks, and watch what happens to the memory usage.

What happened? Well, you are seeing copy-on-write in action. When the process_chunk function is invoked, it is given a reference to the original data array in the memory space of the parent process. But as soon as an attempt is made to modify it, a copy of the data, in the memory space of the child process, is created. The modifications are then applied to this child process copy, and not to the original copy. So the total memory usage has blown out to twice as much as before, and the changes made by each child process are being lost!

Read/write sharing

If you have worked with a real programming language with true parallelism and shared memory via within-process multi-threading, feel free to take a break at this point. Breathe. Relax. Go punch a hole in a wall. I've been coding in Python for years, and this still makes me angry. Sometimes ... don't tell anyone I said this ... I even find myself wishing I were coding in Java instead of Python. Ugh. I need to take a shower.

In order to truly share memory between multiple processes, the multiprocessing module provides the Value, Array, and RawArray classes, which allow you to share individual values (Value) or arrays of values (Array and RawArray).

The Array and RawArray classes essentially wrap a typed pointer (from the built-in ctypes module) to a block of memory. We can use the Array or RawArray class to share a Numpy array between our worker processes. The difference between an Array and a RawArray is that the former offers low-level synchronised (i.e. process-safe) access to the shared memory. This is necessary if your child processes will be modifying the same parts of your data.

If you need fine-grained control over synchronising access to shared data by multiple processes, all of the synchronisation primitives from the multiprocessing module are at your disposal.
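
For example, a minimal sketch of a synchronised Array (the larger example below uses a RawArray, because each worker writes to a different part of the data):

import multiprocessing as mp
import ctypes

# An Array has an associated lock, which can be used
# to synchronise access to the shared memory from
# multiple processes
shared = mp.Array(ctypes.c_double, 10)

with shared.get_lock():
    # It is safe to read/modify the
    # shared values inside this block
    shared[0] = 123.0
    print(shared[:])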

The requirements for sharing memory between processes still apply here - we need to make our data accessible at the module level, and we need to create our data before creating the Pool. And to achieve read and write capability, we also need to make sure that our input and output arrays are located in shared memory - we can do this via the Array or RawArray.

As an example, let's say we want to parallelise processing of an image by having each worker process perform calculations on a chunk of the image. First, let's define a function which does the calculation on a specified set of image coordinates:

import multiprocessing as mp
import ctypes
import numpy as np
np.set_printoptions(suppress=True)


def process_chunk(shape, idxs):

    # Get references to our
    # input/output data, and
    # create Numpy array views
    # into them.
    sindata  = process_chunk.input_data
    soutdata = process_chunk.output_data
    indata   = np.ctypeslib.as_array(sindata) .reshape(shape)
    outdata  = np.ctypeslib.as_array(soutdata).reshape(shape)

    # Do the calculation on
    # the specified voxels
    outdata[idxs] = indata[idxs] ** 2

Rather than passing the input and output data arrays in as arguments to the process_chunk function, we set them as attributes of the process_chunk function. This makes the input/output data accessible at the module level, which is required in order to share the data between the main process and the child processes.

Now let's define a second function which processes an entire image. It does the following:

  1. Initialises shared memory areas to store the input and output data.
  2. Copies the input data into shared memory.
  3. Sets the input and output data as attributes of the process_chunk function.
  4. Creates sets of indices into the input data which, for each worker process, specifies the portion of the data that it is responsible for.
  5. Creates a worker pool, and runs the process_chunk function for each set of indices.

def process_dataset(data):

    nprocs   = 8
    origData = data

    # Create arrays to store the
    # input and output data
    sindata  = mp.RawArray(ctypes.c_double, data.size)
    soutdata = mp.RawArray(ctypes.c_double, data.size)
    data     = np.ctypeslib.as_array(sindata).reshape(data.shape)
    outdata  = np.ctypeslib.as_array(soutdata).reshape(data.shape)

    # Copy the input data
    # into shared memory
    data[:]  = origData

    # Make the input/output data
    # accessible to the process_chunk
    # function. This must be done
    # *before* the worker pool is
    # created - even though we are
    # doing things differently to the
    # read-only example, we are still
    # making the data arrays accessible
    # at the *module* level, so the
    # memory they are stored in can be
    # shared with the child processes.
    process_chunk.input_data  = sindata
    process_chunk.output_data = soutdata

    # number of voxels to be computed
    # by each worker process.
    nvox = int(data.size / nprocs)

    # Generate coordinates for
    # every voxel in the image
    xlen, ylen, zlen = data.shape
    xs, ys, zs = np.meshgrid(np.arange(xlen),
                             np.arange(ylen),
                             np.arange(zlen))

    xs = xs.flatten()
    ys = ys.flatten()
    zs = zs.flatten()

    # We're going to pass each worker
    # process a list of indices, which
    # specify the data items which that
    # worker process needs to compute.
    xs = [xs[nvox * i:nvox * i + nvox] for i in range(nprocs)] + [xs[nvox * nprocs:]]
    ys = [ys[nvox * i:nvox * i + nvox] for i in range(nprocs)] + [ys[nvox * nprocs:]]
    zs = [zs[nvox * i:nvox * i + nvox] for i in range(nprocs)] + [zs[nvox * nprocs:]]

    # Build the argument lists for
    # each worker process.
    args = [(data.shape, (x, y, z)) for x, y, z in zip(xs, ys, zs)]

    # Create a pool of worker
    # processes and run the jobs.
    with mp.Pool(processes=nprocs) as pool:
        pool.starmap(process_chunk, args)

    return outdata

Now we can call our process_dataset function just like any other function:

indata  = np.array(np.arange(64).reshape((4, 4, 4)), dtype=np.float64)
outdata = process_dataset(indata)

print('Input')
print(indata)

print('Output')
print(outdata)