Making this project Cloud compatible and EOSC infrastructure runs #45

Open · wants to merge 4 commits into base: master
35 changes: 17 additions & 18 deletions README.md
@@ -3,15 +3,16 @@
Benchmarking & Scaling Studies of the Pangeo Platform

- [Benchmarking](#benchmarking)
- [Creating an Environment](#creating-an-environment)
- [Creating an Environment on an HPC Center](#creating-an-environment-on-an-hpc-center)
- [Environment on a Kubernetes-based system](#environment-on-a-kubernetes-based-system)
- [Benchmark Configuration](#benchmark-configuration)
- [Running the Benchmarks](#running-the-benchmarks)
- [Benchmark Results](#benchmark-results)
- [Visualization](#visualization)

## Creating an Environment
## Creating an Environment on an HPC Center

To run the benchmarks, it's recommended to create a dedicated conda environment by running:
To run the benchmarks on an HPC platform, it's recommended to create a dedicated conda environment by running:

```bash
conda env create -f ./binder/environment.yml
@@ -31,33 +32,31 @@ and then run the post build script:
./binder/postBuild
```

## Benchmark Configuration
## Environment on a Kubernetes-based system

The `benchmark-configs` directory contains YAML files that are used to run benchmarks on different machines. So far, the following HPC systems' configs are provided:
To run the benchmarks on any Cloud platform using Kubernetes, it is recommended to use the [pangeo/pangeo-notebook Docker image](https://github.com/pangeo-data/pangeo-docker-images/tree/master/pangeo-notebook).

```bash
$ tree ./benchmark-configs/
benchmark-configs/
├── cheyenne.yaml
└── hal.yaml
└── wrangler.yaml
This package currently assumes that a Dask Gateway cluster is available from within the Kubernetes environment.

```
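As an illustration only (the benchmarks create their own cluster from the YAML configuration; the default Gateway address, credentials, and worker count below are assumptions), a minimal check that Dask Gateway is reachable from a notebook in such a deployment might look like:

```python
from dask_gateway import Gateway

# Connect to the Dask Gateway server configured for this deployment
# (relies on the platform's default Gateway address and authentication).
gateway = Gateway()

# Start a cluster and request a few workers; the worker count here is arbitrary.
cluster = gateway.new_cluster()
cluster.scale(4)

# Attach a Dask client and print the dashboard URL to confirm the cluster is up.
client = cluster.get_client()
print(client.dashboard_link)
```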
## Benchmark Configuration

The `benchmark-configs` directory contains YAML files that are used to run benchmarks on different machines. So far, HPC system configs have been provided for several clusters: Cheyenne from NCAR, HAL from CNES, and Wrangler from TACC. It also contains configurations for the CESNET center, based on a Kubernetes deployment over OpenStack. There may be several configurations for each center.

If you are interested in running the benchmarks on another system, you will need to create a new YAML file with the right configuration for that system. See the existing config files for reference.
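As a rough, abridged sketch of what such a file contains (the values below are placeholders and the indentation is indicative; copy one of the full files in `benchmark-configs/` as a starting point):

```yaml
# Abridged, hypothetical benchmark config; see the full files in
# benchmark-configs/ for the complete set of keys for your cluster type.
operation_choice: readwrite      # benchmark operation, e.g. write or readwrite
machine: my-cluster              # label identifying your system
cluster_manager: pbs             # e.g. pbs for an HPC scheduler, gateway for Kubernetes
cluster_kwargs:                  # keyword arguments passed to the Dask cluster
  queue: regular
  walltime: 1:00:00
  memory: 109gb
  cores: 36
chunk_per_worker: 10
freq: 1D
parameters:
  fixed_totalsize: False
  number_of_workers_per_nodes:
    - 1
  number_of_nodes:
    - 1
    - 4
  chunk_size:
    - 64MB
  chunking_scheme:
    - auto
  io_format:
    - zarr
  filesystem:
    - posix
```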

## Running the Benchmarks

### from command line

To run the benchmarks, a command-line utility, `pangeobench`, is provided in this repository.
To use it to benchmark Pangeo computation, you need to specify subcommand `run` and the location of the benchmark configuration
To use it to benchmark Pangeo computation, you need to specify the `run` subcommand and the location of the benchmark configuration file.

```bash
./pangebench run benchmark-configs/cheyenne.computation.yaml
./pangeobench run benchmark-configs/cheyenne.pri2.yaml
```


To use it to benchmark Pangeo IO with weak scaling analysis, you need to specify subcommand `run` and the location of the benchmark configuration
To use it to benchmark Pangeo IO with weak scaling analysis, you need to specify the `run` subcommand and the location of the benchmark configuration file.


```bash
@@ -72,7 +71,7 @@ First, create data files:
```
Second, upload the data files to the S3 object store if you need to benchmark it:
```bash
./pangebench upload --config_file benchmark-configs/cheyenne.write.yaml
./pangeobench upload --config_file benchmark-configs/cheyenne.write.yaml
```

Last, read data files:
@@ -91,8 +90,8 @@ Commands:
run Run benchmarking
upload Upload benchmarking files from local directory to S3 object store
```
## Running the Benchmarks
### from jupyter notebook.

### from Jupyter notebook.

To run the benchmarks from a Jupyter notebook, install the 'pangeo-bench' kernel into your Jupyter environment, then start the run.ipynb notebook. You will need to specify the configuration file, as described above, in your notebook.
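A common way to register the conda environment created above as the 'pangeo-bench' kernel is sketched here; it assumes that environment is currently active, and the exact kernel name your notebook expects may differ:

```bash
# Register the active conda environment as a Jupyter kernel named "pangeo-bench".
# The kernel name is an assumption; adjust it to your setup.
python -m ipykernel install --user --name pangeo-bench --display-name "pangeo-bench"
```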

27 changes: 27 additions & 0 deletions benchmark-configs/EOSC-CESNET-small.readwrite.yaml
@@ -0,0 +1,27 @@
operation_choice: readwrite
machine: EOSC-CESNET-small
cluster_manager: gateway
cluster_kwargs:
worker_memory: 4
chunk_per_worker: 2
spil: false
freq: 1D
parameters:
fixed_totalsize: False
number_of_workers_per_nodes:
- 1
number_of_nodes:
- 1
- 4
chunk_size:
- 32MB
- 64MB
chunking_scheme:
- temporal
io_format:
- zarr
filesystem:
- s3
profile: default
bucket: pangeo-benchmarking
endpoint_url: https://object-store.cloud.muni.cz
35 changes: 35 additions & 0 deletions benchmark-configs/EOSC-CESNET.readwrite.yaml
@@ -0,0 +1,35 @@
operation_choice: readwrite
machine: EOSC-CESNET
cluster_manager: gateway
cluster_kwargs:
worker_memory: 4
chunk_per_worker: 10
spil: false
freq: 1D
parameters:
fixed_totalsize: False
number_of_workers_per_nodes:
- 1
number_of_nodes:
- 1
- 4
- 8
- 16
- 32
chunk_size:
- 32MB
- 64MB
- 128MB
- 256MB
- 512MB
- 1024MB
chunking_scheme:
- temporal
- auto
io_format:
- zarr
filesystem:
- s3
profile: default
bucket: pangeo-benchmarking
endpoint_url: https://object-store.cloud.muni.cz
22 changes: 17 additions & 5 deletions benchmark-configs/cheyenne.pri1-a.yaml
@@ -1,12 +1,18 @@
operation_choice: readwrite
machine: cheyenne
job_scheduler: pbs
queue: regular
walltime: 1:00:00
maxmemory_per_node: 109gb
maxcore_per_node: 36
cluster_manager: pbs
cluster_kwargs:
queue: regular
walltime: 1:00:00
memory: 109gb
cores: 36
local_directory: "$TMPDIR"
interface: "ib0"
chunk_per_worker: 10
spil: false
freq: 1D
parameters:
fixed_totalsize: False
number_of_workers_per_nodes:
- 1
number_of_threads_per_workers: 1
@@ -18,3 +24,9 @@ parameters:
- spatial
- temporal
- auto
io_format:
- zarr
- netcdf
filesystem:
- posix
local_dir: test_pri1-a
22 changes: 17 additions & 5 deletions benchmark-configs/cheyenne.pri1-b.yaml
@@ -1,12 +1,18 @@
operation_choice: readwrite
machine: cheyenne
job_scheduler: pbs
queue: regular
walltime: 1:00:00
maxmemory_per_node: 109gb
maxcore_per_node: 36
cluster_manager: pbs
cluster_kwargs:
queue: regular
walltime: 1:00:00
memory: 109gb
cores: 36
local_directory: "$TMPDIR"
interface: "ib0"
chunk_per_worker: 10
spil: false
freq: 1D
parameters:
fixed_totalsize: False
number_of_workers_per_nodes:
- 1
number_of_threads_per_workers: 1
@@ -18,3 +24,9 @@ parameters:
- spatial
- temporal
- auto
io_format:
- zarr
- netcdf
filesystem:
- posix
local_dir: test_pri1-b
22 changes: 17 additions & 5 deletions benchmark-configs/cheyenne.pri2.yaml
@@ -1,12 +1,18 @@
operation_choice: readwrite
machine: cheyenne
job_scheduler: pbs
queue: regular
walltime: 1:00:00
maxmemory_per_node: 109gb
maxcore_per_node: 36
cluster_manager: pbs
cluster_kwargs:
queue: regular
walltime: 1:00:00
memory: 109gb
cores: 36
local_directory: "$TMPDIR"
interface: "ib0"
chunk_per_worker: 10
spil: false
freq: 1D
parameters:
fixed_totalsize: False
number_of_workers_per_nodes:
- 1
number_of_threads_per_workers: 1
@@ -25,3 +31,9 @@ parameters:
- spatial
- temporal
- auto
io_format:
- zarr
- netcdf
filesystem:
- posix
local_dir: test_pri2
13 changes: 8 additions & 5 deletions benchmark-configs/cheyenne.readwrite.yaml
@@ -1,10 +1,13 @@
operation_choice: readwrite
machine: cheyenne
job_scheduler: pbs
queue: regular
walltime: 1:00:00
maxmemory_per_node: 109gb
maxcore_per_node: 36
cluster_manager: pbs
cluster_kwargs:
queue: regular
walltime: 1:00:00
memory: 109gb
cores: 36
local_directory: "$TMPDIR"
interface: "ib0"
chunk_per_worker: 10
spil: false
freq: 1D
13 changes: 8 additions & 5 deletions benchmark-configs/cheyenne.write.yaml
@@ -1,10 +1,13 @@
operation_choice: write
machine: cheyenne
job_scheduler: pbs
queue: regular
walltime: 1:00:00
maxmemory_per_node: 109gb
maxcore_per_node: 36
cluster_manager: pbs
cluster_kwargs:
queue: regular
walltime: 1:00:00
memory: 109gb
cores: 36
local_directory: "$TMPDIR"
interface: "ib0"
chunk_per_worker: 10
spil: false
freq: 1D
32 changes: 0 additions & 32 deletions benchmark-configs/cheyenne.yaml

This file was deleted.

26 changes: 0 additions & 26 deletions benchmark-configs/hal.yaml

This file was deleted.

23 changes: 18 additions & 5 deletions benchmark-configs/hal1D.yaml
@@ -1,11 +1,18 @@
operation_choice: readwrite
machine: hal1D
job_scheduler: pbs
queue: batch
walltime: 1:00:00
maxmemory_per_node: 128gb
maxcore_per_node: 24
cluster_manager: pbs
cluster_kwargs:
queue: batch
walltime: 1:00:00
memory: 128gb
cores: 24
local_directory: "$TMPDIR"
interface: "ib0"
chunk_per_worker: 10
spil: false
freq: 1D
parameters:
fixed_totalsize: False
number_of_workers_per_nodes:
- 1
number_of_threads_per_workers: 1
@@ -24,3 +31,9 @@ parameters:
- spatial
- temporal
- auto
io_format:
- zarr
- netcdf
filesystem:
- posix
local_dir: test_1D