import escape as esc

# to activate serialization of objects
import escape.serialization as ser
import numpy as np

esc.require("0.9.8")

Loading material database from /home/dkor/Data/Development/workspace_escape/escape-core/python/src/escape/scattering/../data/mdb/materials.db

import escape.serialization

# creating a cluster with six nodes and connect a client
import ipyparallel as ipp

cluster = ipp.Cluster(n=16)
cluster.start_cluster_sync()
rc = cluster.connect_client_sync()
rc.wait_for_engines(16)

Starting 16 engines with <class 'ipyparallel.cluster.launcher.LocalEngineSetLauncher'>

X = esc.var("X")

b = esc.par("b", 5)
a = esc.par("a", 100)
c = esc.par("c", 0.5)

F = a * esc.pow(esc.cos(X * b), 2.0) * esc.exp(-c * X)
I = esc.integral(F, b, 0, 500, numpoints=61, epsabs=1e-5, epsrel=1e-5, maxiter=300)
# linspace return view of an array,
# thus making a copy of it to avoid copying by the kernel
x = np.linspace(-10, 10, 500, dtype=float).copy()
y = np.zeros(x.shape, dtype=float)

w1 = F.show(coordinates=x).config(title="F(X; a, b, c)")
w2 = I.show(coordinates=x).config(title="I(X; a, c)")
esc.show(w1, w2)

# computation times for cluster and multithreading
def compute_parallel(func, x, y):
    # multithreading
    nth = np.arange(1, 17, 1, dtype=int)
    tms_mth = np.zeros(shape=nth.shape, dtype=float)
    for i, n in enumerate(nth):
        k = esc.kernel("Parallel threads", func, numthreads=int(n))
        t = %timeit -o -q k(x, y)
        tms_mth[i] = t.average * 1000
    # multiprocessing single threads per node
    nrc1 = np.arange(1, 17, 1, dtype=int)
    tms_rc_1 = np.zeros(shape=nrc1.shape, dtype=float)
    for i, n in enumerate(nrc1):
        k = esc.kernel(
            "Cluster kernel", func, multithreaded=False, rc=rc, rc_ids=list(range(0, n))
        )
        t = %timeit -o -q k(x, y)
        tms_rc_1[i] = t.average * 1000
    # multiprocessing two threads per node
    nrc2 = np.arange(1, 9, 1, dtype=int)
    tms_rc_2 = np.zeros(shape=nrc2.shape, dtype=float)
    for i, n in enumerate(nrc2):
        k = esc.kernel("Cluster kernel", func, numthreads=2, rc=rc, rc_ids=list(range(0, n)))
        t = %timeit -o -q k(x, y)
        tms_rc_2[i] = t.average * 1000
    # multiprocessing three threads per node
    nrc3 = np.arange(1, 6, 1, dtype=int)
    tms_rc_3 = np.zeros(shape=nrc3.shape, dtype=float)
    for i, n in enumerate(nrc3):
        k = esc.kernel("Cluster kernel", func, numthreads=3, rc=rc, rc_ids=list(range(0, n)))
        t = %timeit -o -q k(x, y)
        tms_rc_3[i] = t.average * 1000
    return (
        (nth, tms_mth),
        (nrc1, tms_rc_1),
        (nrc2 * 2, tms_rc_2),
        (nrc3 * 3, tms_rc_3),
    )


def plot_data(data, title="", ylog=False):
    import matplotlib.pyplot as plt
    fig = plt.figure()
    fig.suptitle(title)
    ax = fig.add_subplot(111)

    labels = [
        "Multithreading",
        "Cluster - 1 thread per node",
        "Cluster - 2 thread per node",
        "Cluster - 3 thread per node",
    ]
    for i in range(0, 4):
        ax.plot(data[i][0], data[i][1], "o--", label=labels[i])

    if ylog:
        ax.set_yscale('log')
    
    ax.set_xlabel("Number of used threads")
    ax.set_ylabel("Computation time [msec]")

    ax.legend()
    plt.show()

# single core
print("Single core results")
k = esc.kernel("Single kernel", I, multithreaded=False)
t = %timeit -o k(x, y)

Single core results
545 ms ± 12.4 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)

data = compute_parallel(I, x, y)
plot_data(data, "Slow function, small arrays (500 items)")

x2 = np.linspace(-10, 10, 5000000, dtype=float).copy()
y2 = np.zeros(x2.shape, dtype=float)

# simple kernel without parallel computation
kf = esc.kernel("Single kernel", F, multithreaded=False)
%timeit kf(x2, y2)

396 ms ± 3.1 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)

data = compute_parallel(F, x2, y2)
plot_data(data, "Fast function, large arrays (5x10⁶ items)")

x3 = np.linspace(-10, 10, 50000, dtype=float).copy()
y3 = np.zeros(x3.shape, dtype=float)

# simple kernel without parallel computation
kis = esc.kernel("Single kernel", I, multithreaded=False)
%timeit kis(x3, y3)

53.9 s ± 656 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)

data = compute_parallel(I, x3, y3)

plot_data(data, "Slow function, large arrays (50000 items)", ylog=True)

Cluster kernel. Parallel computing using networked computers.¶

Example 1. "Slow" functor. Small arrays.¶

Example 2. "Fast" functor, large arrays.¶

Example 3. "Slow" functor, large arrays.¶

Interpretation of the results¶

Cluster with several PCs¶