git clone https://gitlab.esrf.fr/workflow/ewokstutorials/ewoksfordevs

_SUM_TASK = "ewokscore.tests.examples.tasks.sumtask.SumTask"


def _sum_node(node_id, **default_values):
    """Describe a workflow node that runs the example ``SumTask`` class.

    Keyword arguments, when given, are stored as the node's
    ``default_inputs`` (one ``{"name": ..., "value": ...}`` entry each,
    in the order they were passed).
    """
    description = {
        "id": node_id,
        "task_type": "class",
        "task_identifier": _SUM_TASK,
    }
    if default_values:
        description["default_inputs"] = [
            {"name": name, "value": value}
            for name, value in default_values.items()
        ]
    return description


def _result_link(source, target, target_input):
    """Describe a link mapping the source's ``result`` output to ``target_input``."""
    return {
        "source": source,
        "target": target,
        "data_mapping": [
            {"source_output": "result", "target_input": target_input}
        ],
    }


# Nodes: only node1 and node2 carry default inputs.
node1 = _sum_node("node1", a=2, b=3)
node2 = _sum_node("node2", a=4, b=5)
node3 = _sum_node("node3")
node4 = _sum_node("node4")

# Links: node1 and node2 both feed node3, which feeds node4.
link1 = _result_link("node1", "node3", "a")
link2 = _result_link("node2", "node3", "b")
link3 = _result_link("node3", "node4", "a")

# The workflow itself: an identifier plus the node and link descriptions.
workflow = {
    "graph": {"id": "workflow1"},
    "nodes": [node1, node2, node3, node4],
    "links": [link1, link2, link3],
}

pip install ewoks

from ewoks import execute_graph

execute_graph(workflow)

{'result': 14}

from ewoks import convert_graph

convert_graph(workflow, "results/workflow1.json")

'results/workflow1.json'

!ewoks execute results/workflow1.json --outputs=end --merge-outputs

###################################
# Execute workflow 'results/workflow1.json'
###################################

RESULTS:
{'result': 14}

FINISHED

w = {"graph": {"id": "workflow1"}, "nodes": [...], "links": [...]}

execute_graph(workflow, engine="...")

%%time
execute_graph(
    "results/workflow1.json",
    inputs=[{"name": "delay", "value": 1, "all": True}],
)

CPU times: user 9.17 ms, sys: 4.19 ms, total: 13.4 ms
Wall time: 4.03 s

{'result': 14}

%%time
execute_graph(
    "results/workflow1.json",
    inputs=[{"name": "delay", "value": 1, "all": True}],
    engine="ppf",
)

CPU times: user 37.9 ms, sys: 28.4 ms, total: 66.3 ms
Wall time: 3.12 s

{'result': 14}

from ewoks import execute_graph

# Same "ppf" execution as before, with an explicit pool type.
execute_graph(
    "results/workflow1.json",
    inputs=[{"name": "delay", "value": 1, "all": True}],
    engine="ppf",
    pool_type="thread",  # Only required for Windows
)

execute_graph(
    workflow,
    inputs=[
        {"name": "a", "value": 1, "id": "node1"},
        {"name": "b", "value": 1, "id": "node2"},
    ],
)

{'result': 9}

!ewoks execute results/workflow1.json --outputs=end --merge-outputs \
       -p node1:a=1 -p node2:b=1  # noqa E999

###################################
# Execute workflow 'results/workflow1.json'
###################################

RESULTS:
{'result': 9}

FINISHED

execute_graph(workflow)

{'result': 9}

!ewoks execute results/workflow1.json --outputs=end --merge-outputs

###################################
# Execute workflow 'results/workflow1.json'
###################################

RESULTS:
{'result': 14}

FINISHED

execute_graph(workflow, merge_outputs=False)

{'node4': {'result': 9}}

!ewoks execute results/workflow1.json --outputs=end

###################################
# Execute workflow 'results/workflow1.json'
###################################

RESULTS:
{'node4': {'result': 14}}

FINISHED

execute_graph(
    workflow,
    outputs=[
        {"name": "result", "id": "node2"},
        {"name": "result", "id": "node4"},
    ],
    merge_outputs=False,
)

{'node2': {'result': 5}, 'node4': {'result': 9}}

execute_graph(workflow, outputs=[{"all": True}], merge_outputs=False)

{'node1': {'result': 4},
 'node2': {'result': 5},
 'node3': {'result': 9},
 'node4': {'result': 9}}

!ewoks execute results/workflow1.json --outputs=all

###################################
# Execute workflow 'results/workflow1.json'
###################################

RESULTS:
{'node1': {'result': 5},
 'node2': {'result': 9},
 'node3': {'result': 14},
 'node4': {'result': 14}}

FINISHED

execute_graph(
    workflow,
    inputs=[
        {"name": "a", "value": 2, "id": "node1"},
        {"name": "a", "value": 3, "id": "node2"},
    ],
    outputs=[
        {"name": "result", "id": "node1"},
        {"name": "result", "id": "node4"},
    ],
    merge_outputs=False,
)

pip install "ewoksserver[frontend]"

ewoks-server --port 5174  # The default port is 8000

RESOURCE DIRECTORY:
/path/to/resource/directory

CELERY:
Not configured (local workflow execution)

EWOKS:
{...}

Uvicorn running on http://127.0.0.1:5174 (Press CTRL+C to quit)

pip install "ewoksserver[frontend]"
ewoks-server --port 5174

%%writefile results/tasks.py
from ewokscore import Task

class Add(
    Task,
    input_names=["a"],
    optional_input_names=["b"],
    output_names=["sum"],
):
    """Output ``sum`` as ``a + b``, or as ``a`` alone when ``b`` is missing."""

    def run(self):
        # Start from the required input and add the optional one if present.
        total = self.inputs.a
        if not self.missing_inputs.b:
            total = total + self.inputs.b
        self.outputs.sum = total

Overwriting results/tasks.py

%%writefile -a results/tasks.py


import numpy


class Linspace1(
    Task,
    optional_input_names=["start", "stop", "num"],
    output_names=["numbers"],
):
    """Output ``numbers`` from ``numpy.linspace(start, stop, num)``.

    All inputs are optional; missing ones fall back to
    ``start=0``, ``stop=1`` and ``num=1``.
    """

    def run(self):
        self.outputs.numbers = numpy.linspace(
            self.get_input_value("start", 0),
            self.get_input_value("stop", 1),
            self.get_input_value("num", 1),
        )

Appending to results/tasks.py

%%writefile -a results/tasks.py


class Linspace2(
    Task,
    optional_input_names=["start", "stop", "num"],
    output_names=["numbers"],
):
    """Alternative implementation of Linspace1 with the same inputs and output.

    The provided input values are fetched in one call and any missing one
    is filled in with its fallback (``start=0``, ``stop=1``, ``num=1``).
    """

    def run(self):
        kwargs = self.get_input_values()
        for name, fallback in (("start", 0), ("stop", 1), ("num", 1)):
            kwargs.setdefault(name, fallback)
        self.outputs.numbers = numpy.linspace(**kwargs)

Appending to results/tasks.py

# Three nodes running the Add task written to results/tasks.py ...
node1, node2, node3 = (
    {
        "id": node_id,
        "task_type": "class",
        "task_identifier": "results.tasks.Add",
    }
    for node_id in ("node1", "node2", "node3")
)
# ... and a final node running Linspace2.
node4 = {
    "id": "node4",
    "task_type": "class",
    "task_identifier": "results.tasks.Linspace2",
}

# Each link forwards the "sum" output of its source to one target input.
link1 = {
    "source": "node1",
    "target": "node3",
    "data_mapping": [{"source_output": "sum", "target_input": "a"}],
}
link2 = {
    "source": "node2",
    "target": "node3",
    "data_mapping": [{"source_output": "sum", "target_input": "b"}],
}
link3 = {
    "source": "node3",
    "target": "node4",
    "data_mapping": [{"source_output": "sum", "target_input": "num"}],
}

workflow = {
    "graph": {"id": "workflow2"},
    "nodes": [node1, node2, node3, node4],
    "links": [link1, link2, link3],
}

convert_graph(
    workflow,
    "results/workflow2.json",
    inputs=[{"name": "a", "value": 1}, {"name": "b", "value": 1}],
)

'results/workflow2.json'

execute_graph("results/workflow2.json")

{'numbers': array([0.        , 0.33333333, 0.66666667, 1.        ])}

!ewoks execute results/workflow2.json --outputs=all --merge-outputs

###################################
# Execute workflow 'results/workflow2.json'
###################################

RESULTS:
{'numbers': array([0.        , 0.33333333, 0.66666667, 1.        ]), 'sum': 4}

FINISHED

from ewokscore import Task


class Add(
    Task,
    input_names=["a"],
    optional_input_names=["b"],
    output_names=["sum"],
):
    """Output ``sum`` as ``a + b``, or as ``a`` alone when ``b`` is missing."""

    def run(self):
        # Start from the required input and add the optional one if present.
        total = self.inputs.a
        if not self.missing_inputs.b:
            total = total + self.inputs.b
        self.outputs.sum = total

ewoks-server --port 5174

pip install "ewoks[orange]" pyqt5

ewoks execute results/workflow2.json --engine=orange

ewoks-server --port 5174

pip install "ewoksndreg[full]"

ewoks-server --port 5174 --rediscover-tasks

pip install "ewoksndreg[full]"
ewoks-canvas

pip install "ewoksjob[sql,redis]" ewoks

pip install "ewoksjob[sql,redis,worker]"

pip install "ewoksjob[monitor]"

%%writefile results/celeryconfig_sql.py
# Message broker and result storage: two local SQLite database files.
broker_url = "sqla+sqlite:///celery.db"
result_backend = "db+sqlite:///celery_results.db"

# Lifetime of stored results (presumably in seconds; confirm in the Celery docs).
result_expires = 600

# Results are serialized with pickle, so the pickle content type is accepted
# in addition to JSON.
# NOTE(review): unpickling can execute arbitrary code; only use this with
# trusted workers and a trusted broker/backend.
result_serializer = "pickle"
accept_content = ["application/json", "application/x-python-serialize"]

task_remote_tracebacks = True

Overwriting results/celeryconfig_sql.py

apt install redis-server
conda install redis-server

ewoksjob --config=results.celeryconfig_sql worker

-------------- celery@lindenolf v5.3.0b1 (dawn-chorus)
--- ***** ----- 
-- ******* ---- Linux-5.4.0-144-generic-x86_64 ...
- *** --- * --- 
- ** ---------- [config]
- ** ---------- .> app:         ewoks:0x7ff87d66a700
- ** ---------- .> transport:   sqla+sqlite:///celery.db
- ** ---------- .> results:     sqlite:///celery_results.db
- *** --- * --- .> concurrency: 4 (prefork)
-- ******* ---- .> task events: OFF (enable -E to monitor tasks)
--- ***** ----- 
 -------------- [queues]
                .> celery  exchange=celery(direct) key=celery

ewoksjob --config=results.celeryconfig_redis worker

export EWOKS_CONFIG_URI=results.celeryconfig_sql

# Linux and macOS
export EWOKS_CONFIG_URI=results.celeryconfig_sql
# Windows (the label is on its own line: cmd.exe has no `#` comments, so
# trailing text after `set VAR=value` would become part of the value)
set EWOKS_CONFIG_URI=results.celeryconfig_sql

from ewoks import execute_graph

result = execute_graph(*args, **kwargs)

ewoks submit results/workflow2.json --outputs=end --wait inf

ewoks submit results/workflow2.json

Workflow 'results/workflow2.json' submitted (ID: d3d20d06-20da-4861-8ddf-6cf70c0bab0b)

# Linux and macOS
export EWOKS_CONFIG_URI=results.celeryconfig_sql
# Windows (the label is on its own line: cmd.exe has no `#` comments, so
# trailing text after `set VAR=value` would become part of the value)
set EWOKS_CONFIG_URI=results.celeryconfig_sql

pip install "ewoksjob[sql,redis,worker,slurm]"

ssh myname@rnice

scontrol token lifespan=86400

SLURM_JWT=eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJleHAiOjE2Nzk1NjU5ODUsImlhdCI6MTY3OTU2NTk4NCwic3VuIjoiZGVub2xmIn0.s9uGkTPg9xNO21LG5a10fdqvfQfnfVZ4ad58bVYncrg

ewoksjob --config=results.celeryconfig_sql worker --pool=slurm \
 --slurm-url=http://... \
 --slurm-user=myname \
 --slurm-token=eyJhbGciOiJIUzI1NiIs...

export EWOKS_CONFIG_URI=results.celeryconfig_sql
export SLURM_URL=http://...
export SLURM_USER=myname
export SLURM_TOKEN=eyJhbGciOiJIUzI1NiIs...

ewoksjob worker --pool=slurm

module load ewoks

ewoksjob worker --pool=slurm \
 --slurm-pre-script="module load ewoks" \
 -sp time_limit=240 \
 -sp current_working_directory=/home/esrf/${USER}/ewoksfordevs

from ewoksjob.client import submit

# Optionally override the worker's Slurm parameters set with `-sp`.
# NOTE: `kwargs` is not created in this snippet, so it must already exist;
# it is forwarded below as the keyword arguments of the submitted job.
wd = "/home/esrf/myname/ewoksfordevs"
kwargs["_slurm_spawn_arguments"] = {
    "parameters": {
        "time_limit": 240,
        "current_working_directory": wd,
    },
    "pre_script": "module load ewoks",
}

# The workflow is passed here as a file path. If the workflow is only
# defined on the client side, send it as a Python dictionary instead.
future = submit(args=("results/workflow1.json",), kwargs=kwargs)
# timeout=None: presumably waits for the result without a time limit (confirm).
result = future.get(timeout=None)

ewoks submit results/workflow1.json --wait inf

pyslurmutils status -m 1 --url=... --user=... --token=...

export EWOKS_CONFIG_URI=results.celeryconfig_sql

ewoksjob worker --pool=slurm \
  --slurm-pre-script="module load ewoks" \
  --slurm-log-directory=/home/esrf/${USER}/slurm/ \
  -sp current_working_directory=/home/esrf/${USER}/ewoksfordevs \
  -sp time_limit=10

ewoks submit results/workflow1.json --wait inf

from blissdata.h5api import dynamic_hdf5

with dynamic_hdf5.File("/path/to/file.h5") as f:
    ...

from silx.io import h5py_utils

with h5py_utils.open_item("/path/to/result.h5", "/", mode="a") as f:
    ...

from ewoksdata.data.hdf5.dataset_writer import DatasetWriter

with DatasetWriter(group, "intensity") as writer:
    for data in ...:
        writer.add_point(data)

/data/visitor/ch6562/id31/20230309/PROCESSED_DATA

python3 -m venv worker_env
source worker_env/bin/activate
pip install "ewoksjob[blissworker]" pyfai blissdata \
            blissoda ewoksdata silx

python3 -m venv client_env
source client_env/bin/activate
pip install "ewoksjob[beacon,redis]" ewoks

ewoks execute results/workflow2.json -l info

from ewoks import execute_graph

result = execute_graph(..., upload_parameters=...)

from ewoks import execute_graph

execute_graph(..., convert_destination="/path/to/file.json")

engine	Loops	Conditional Links	Parallel execution	Interaction (GUI)	An Ewoks task is enough
`None`	$\color{red}{\text{✗}}$	$\color{red}{\text{✗}}$	$\color{red}{\text{✗}}$	$\color{red}{\text{✗}}$	$\color{green}{\text{✓}}$
`"dask"`	$\color{red}{\text{✗}}$	$\color{red}{\text{✗}}$	$\color{green}{\text{✓}}$	$\color{red}{\text{✗}}$	$\color{green}{\text{✓}}$
`"ppf"`	$\color{green}{\text{✓}}$	$\color{green}{\text{✓}}$	$\color{green}{\text{✓}}$	$\color{red}{\text{✗}}$	$\color{green}{\text{✓}}$
`"orange"`	$\color{red}{\text{✗}}$	$\color{red}{\text{✗}}$	$\color{orange}{\text{(✓)}}$	$\color{green}{\text{✓}}$	$\color{red}{\text{✗}}$

Introduction¶

Resources¶

Slides¶

Ewoks Documentation¶

Tutorial Resources¶

When to use Ewoks¶

Program¶

Part 1: Ewoks Workflows¶

Part 2: Ewoks Tasks¶

Part 3: Ewoks Integration¶

Part 4: Final remarks¶

Part 1: Ewoks Workflows¶

Ewoks workflow definition¶

Create Ewoks Workflows¶

Create a workflow in Python¶

Define workflow nodes¶

Define workflow links¶

Define workflow inputs¶

Define workflow¶

Execute Ewoks workflows¶

Execute workflow from python¶

Execute workflow from the command line¶

✏️ Exercise: make a workflow and execute it¶

Execution engine¶

✏️ Exercise: execute a workflow with different engines¶

Workflow execution inputs and outputs¶

Workflow inputs¶

Workflow outputs¶

✏️ Exercise: execute a workflow with inputs/outputs¶

Workflow GUI¶

✏️ Exercise: use the web GUI¶

Part 2: Ewoks Tasks¶

Create workflow tasks¶

✏️ Exercise: create ewoks tasks and use them in a workflow¶

Use new tasks in the GUI¶

✏️ Exercise: use new tasks in a GUI¶

Use third-party task libraries¶

Find task libraries¶

Use task libraries¶

✏️ Exercise: create an image alignment workflow in Orange and load it in the web app or vice versa¶

Part 3: Ewoks Integration¶

Remote execution¶

Celery configuration¶

Start and test a worker¶

With Redis¶

Submit a test workflow in the client environment.¶

✏️ Exercise: setup and test remote execution¶

Submit a workflow from Python¶

Submit a workflow from the command line¶

✏️ Exercise: submit a workflow remotely¶

Slurm execution¶

Create a Slurm access token¶

Start a Slurm worker¶

Submit a workflow to Slurm¶

✏️ Exercise: submit a workflow to Slurm¶

Online data processing in Bliss¶

Celery configuration¶

Workflow for online and offline processing¶

Read Bliss data during or after the scan with blissdata.¶

Deal with concurrent writing from parallel workflows¶

Optimize saving in HDF5¶

Build the saving path in a robust way¶

✏️ Exercise: process a live XRPD scan¶

Part 4: Final remarks¶

Ewoks features not covered¶

Conditional links¶

Sub-Workflows as nodes in other workflows¶

Desktop GUI¶

Task output persistence¶

Ewoks events¶

Celery worker events¶

Data portal integration¶

Data provenance¶

Deploy software on Slurm¶

Read Bliss data during or after the scan with `blissdata`.¶