67 commits
550cc8c
added bert as a test inference benchmark
McLavish Oct 30, 2025
f9c3817
hotfix to enable gpu capabilities
McLavish Nov 3, 2025
0f93b66
added pre-commit hooks for linting and formatting
McLavish Nov 4, 2025
b965d7b
linting and formatting setting for whoever uses vscode + black + flak…
McLavish Nov 4, 2025
e9916db
reformatted local file so it passes linting/format
McLavish Nov 4, 2025
2b75311
Merge branch 'development' into feature/bert-inference
McLavish Nov 4, 2025
813af03
bert now uses gpu
McLavish Nov 4, 2025
3a96f04
changed data repo to be OUR forked data repo
McLavish Nov 4, 2025
d4d5d30
change data loading path to own forked repo
Russellpang Nov 5, 2025
1b7deb7
change data loading path to own forked repo
Russellpang Nov 5, 2025
668652c
update benchmark function
Russellpang Nov 5, 2025
aae1023
fix: replaced onnxruntime requirement from CPU to GPU. now it actuall…
McLavish Nov 5, 2025
25fd1d9
circleci mypy fix?
McLavish Nov 5, 2025
c478c91
Merge pull request #2 from McLavish/feature/bert-inference
McLavish Nov 5, 2025
d6c4227
benchmarks is now flake8/black compliant. pre-commit hooks also check…
McLavish Nov 5, 2025
27b14d6
add linalg benchmarks
Russellpang Nov 5, 2025
ace2335
add linalg benchmarks
Russellpang Nov 5, 2025
ad3023d
changed CI/CD to run linting on the benchmarks folder ONLY. disabled …
McLavish Nov 5, 2025
52f30c0
fix typo
Russellpang Nov 6, 2025
4efff4d
update code
Russellpang Nov 6, 2025
adf54a5
migrated from CircleCI to Github Actions
McLavish Nov 6, 2025
67772e2
fixed workflow directory
McLavish Nov 6, 2025
8f02b66
pip dependencies take too long
McLavish Nov 6, 2025
ae61e4b
Merge pull request #8 from McLavish/hotfix/code-quality-on-benchmarks
McLavish Nov 6, 2025
e06985c
new benchmark data
McLavish Nov 10, 2025
037f6c3
Bring folder from other-branch
Nov 12, 2025
377d949
update code
Nov 12, 2025
8dd8a6e
modify code and requirements
Nov 12, 2025
de15075
unfinished new fuc
Russellpang Nov 12, 2025
3006879
add new functions
Russellpang Nov 12, 2025
d224ddc
add new functions
Russellpang Nov 13, 2025
921f321
added recommender benchmark
McLavish Nov 13, 2025
dd840d1
Merge branch 'development' into feature/russell
YuxuanLiu-kayla Nov 13, 2025
4fca4aa
changed data submodule to use ssh and not https
McLavish Nov 13, 2025
26dfcf4
add channel_flow, compute, fft, and resnet of jax_npbench
down-street Nov 15, 2025
fad77da
reset the config
down-street Nov 15, 2025
e995e6a
Merge pull request #13 from McLavish/jiahao/npbenchs
down-street Nov 15, 2025
7e0d13f
microbenchmark example
Nov 16, 2025
942f5a1
Remove SSH public key from eval command
Russellpang Nov 16, 2025
6bc1dd7
Remove local_deployment.json configuration
Russellpang Nov 16, 2025
460ea1f
Delete out_storage.json configuration file
Russellpang Nov 16, 2025
de41ab6
Remove SSH private key from eval command
Russellpang Nov 16, 2025
ded520f
remove garbage
Nov 16, 2025
5c85980
test
Russellpang Nov 17, 2025
c5782dd
test
Russellpang Nov 17, 2025
2b52ced
test
Russellpang Nov 17, 2025
e5cb20c
Merge branch 'development' into feature/russell
Russellpang Nov 17, 2025
6488d6d
remove unnecessay files
Russellpang Nov 17, 2025
55c4ac4
fuck you
Russellpang Nov 17, 2025
b97b7a5
Refactor argument parsing for cleaner syntax
Russellpang Nov 17, 2025
1998b6b
Change 'reps' to 'iters' in jacobi2d function
Russellpang Nov 17, 2025
2cbd768
Delete benchmarks/000.microbenchmarks/050.matmul directory
Russellpang Nov 17, 2025
074d4b7
Merge pull request #6 from McLavish/feature/russell
McLavish Nov 17, 2025
efced9c
Revert "changed data submodule to use ssh and not https"
McLavish Nov 17, 2025
bc48b5e
fix: missing config.json
McLavish Nov 17, 2025
e154ba0
Merge branch 'development' into feature/inference-recommender
McLavish Nov 17, 2025
d9ed506
Merge pull request #11 from McLavish/feature/inference-recommender
McLavish Nov 17, 2025
e120167
add microbenchmark gpu latency
JessieeeNotLi Nov 19, 2025
cedcf15
ran benchmark on gpu
Nov 19, 2025
6d28eef
Bump Black to support Python 3.12
Nov 19, 2025
55960b7
Add benchmark documentation for GPU Cache Latency
JessieeeNotLi Nov 19, 2025
ba8f800
Add readme for GPU Cache Latency benchmark
JessieeeNotLi Nov 19, 2025
9632860
changed to match repo structure
JessieeeNotLi Nov 21, 2025
a1caa5a
removed unnecesary commits
JessieeeNotLi Nov 22, 2025
6dfc552
Delete benchmarks/000.microbenchmarks/050.gpu-cache-latency/python/re…
JessieeeNotLi Nov 22, 2025
468aa27
Add files via upload
JessieeeNotLi Nov 22, 2025
221c540
Create requirements.local.txt
JessieeeNotLi Nov 22, 2025
81 changes: 0 additions & 81 deletions .circleci/config.yml

This file was deleted.

55 changes: 55 additions & 0 deletions .github/workflows/lint.yml
@@ -0,0 +1,55 @@
name: Lint

on:
  push:
  pull_request:

jobs:
  linting:
    runs-on: ubuntu-latest

    steps:
      - name: Check out code
        uses: actions/checkout@v4

      - name: Set up Python
        id: setup-python
        uses: actions/setup-python@v5
        with:
          python-version: '3.x'

      - name: Cache virtualenv
        uses: actions/cache@v4
        with:
          path: python-venv
          key: venv-${{ runner.os }}-${{ steps.setup-python.outputs.python-version }}-${{ hashFiles('requirements.txt') }}-${{ github.ref_name }}
          restore-keys: |
            venv-${{ runner.os }}-${{ steps.setup-python.outputs.python-version }}-${{ hashFiles('requirements.txt') }}-
            venv-${{ runner.os }}-${{ steps.setup-python.outputs.python-version }}-

      - name: Install system packages
        run: |
          sudo apt-get update
          sudo apt-get install -y libcurl4-openssl-dev

      - name: Install Python dependencies (via install.py)
        run: |
          python3 install.py --no-aws --no-azure --no-gcp --no-openwhisk --no-local

      - name: Black (check)
        run: |
          . python-venv/bin/activate
          black benchmarks --check --config .black.toml
Comment on lines +39 to +42
⚠️ Potential issue | 🟠 Major

🧩 Analysis chain

Verify Black is only intended to run on benchmarks/.

The Black check only targets the benchmarks directory, but the pre-commit configuration in .pre-commit-config.yaml applies to both sebs/ and benchmarks/. Consider whether the workflow should also check sebs/ for consistency.

Run the following script to check if sebs/ contains Python files that should be formatted:


🏁 Script executed:

```shell
#!/bin/bash
# Description: Check if sebs/ directory contains Python files

fd -e py . sebs/ --max-results 10
```

Length of output: 198


I've confirmed that sebs/ contains Python files. Now I need to verify the pre-commit configuration to see if it actually applies Black to both directories.


---

🏁 Script executed:

```shell
#!/bin/bash
# Description: Check .pre-commit-config.yaml for Black configuration scope

cat .pre-commit-config.yaml | grep -A 20 "black"
```
Length of output: 506


Update the Black check in the lint workflow to include the sebs/ directory.

The pre-commit configuration applies Black to files: ^(sebs/|benchmarks/), but the workflow only checks benchmarks/. The sebs/ directory contains multiple Python files and should be included in the CI check for consistency.

Update line 42 to:

black sebs benchmarks --check --config .black.toml
🤖 Prompt for AI Agents
.github/workflows/lint.yml around lines 39 to 42: the Black check currently only
runs against the benchmarks/ directory while pre-commit targets both sebs/ and
benchmarks/; update the workflow to run Black against both directories by
changing the command to invoke Black on sebs and benchmarks with --check and the
.black.toml config so CI matches pre-commit.

      - name: Flake8 (lint)
        run: |
          . python-venv/bin/activate
          # write to file and echo to stdout (requires flake8 with --tee support)
          flake8 benchmarks --config=.flake8.cfg --tee --output-file flake-reports

      - name: Upload flake report
        if: always()
        uses: actions/upload-artifact@v4
        with:
          name: flake-reports
          path: flake-reports
2 changes: 1 addition & 1 deletion .gitmodules
@@ -3,4 +3,4 @@
 	url = https://github.com/mcopik/pypapi.git
 [submodule "benchmarks-data"]
 	path = benchmarks-data
-	url = https://github.com/spcl/serverless-benchmarks-data.git
+	url = https://github.com/McLavish/serverless-benchmarks-data-dphpc.git
3 changes: 3 additions & 0 deletions .mypy.ini
@@ -3,6 +3,9 @@
 [mypy-docker]
 ignore_missing_imports = True
 
+[mypy-docker.*]
+ignore_missing_imports = True
+
 [mypy-tzlocal]
 ignore_missing_imports = True
30 changes: 30 additions & 0 deletions .pre-commit-config.yaml
@@ -0,0 +1,30 @@
# .pre-commit-config.yaml
repos:
  - repo: local
    hooks:
      - id: flake8-local
        name: flake8 (project env)
        language: python
        additional_dependencies: ["flake8==7.1.1"]
        entry: flake8
        args: ["--config=.flake8.cfg"]
        types: [python]
        files: ^(sebs/|benchmarks/)
  - repo: local
    hooks:
      - id: black-check-local
        name: black --check (project env)
        language: python
        additional_dependencies: ["black==22.8.0"]
        entry: black
        args: ["--config=.black.toml", "--check", "--diff"]
        types: [python]
        files: ^(sebs/|benchmarks/)
  # - repo: local
  #   hooks:
  #     - id: mypy-local
  #       name: mypy (project venv)
  #       language: system
  #       entry: bash -lc 'python -m mypy --config-file=.mypy.ini sebs'
  #       types: [python]
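The `files: ^(sebs/|benchmarks/)` pattern in the config above is an anchored regex, so only paths under those two top-level directories reach the hooks. A quick sketch of the matching behavior (the example file paths are illustrative, not taken from the repository):

```python
import re

# Same pattern as the `files:` key in the pre-commit config above.
pattern = re.compile(r"^(sebs/|benchmarks/)")

# Paths under sebs/ and benchmarks/ match; everything else is skipped.
assert pattern.match("sebs/cache.py")
assert pattern.match("benchmarks/000.microbenchmarks/010.sleep/input.py")
assert pattern.match("docs/example.py") is None
# The ^ anchor means nested occurrences of the directory names do not match.
assert pattern.match("other/sebs/file.py") is None
```

This is why the CI workflow running `black benchmarks` alone is narrower than the pre-commit scope: the hook pattern also admits everything under `sebs/`.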

15 changes: 15 additions & 0 deletions .vscode/settings.json
@@ -0,0 +1,15 @@
{
    "[python]": {
        "editor.defaultFormatter": "ms-python.black-formatter",
        "editor.formatOnSave": true
    },

    "black-formatter.importStrategy": "fromEnvironment",
    "black-formatter.path": [],
    "black-formatter.args": ["--config=.black.toml"],

    "flake8.importStrategy": "fromEnvironment",
    "flake8.path": [],
    "flake8.args": ["--config=.flake8.cfg"],
    "flake8.enabled": true
}
13 changes: 6 additions & 7 deletions benchmarks/000.microbenchmarks/010.sleep/input.py
@@ -1,12 +1,11 @@
-size_generators = {
-    'test' : 1,
-    'small' : 100,
-    'large': 1000
-}
+size_generators = {"test": 1, "small": 100, "large": 1000}
 
 
 def buckets_count():
     return (0, 0)
 
-def generate_input(data_dir, size, benchmarks_bucket, input_paths, output_paths, upload_func, nosql_func):
-    return { 'sleep': size_generators[size] }
+
+def generate_input(
+    data_dir, size, benchmarks_bucket, input_paths, output_paths, upload_func, nosql_func
+):
+    return {"sleep": size_generators[size]}
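The reformatted module can be sanity-checked locally; the storage-related parameters are unused by this benchmark, so `None`/empty placeholders are fine:

```python
size_generators = {"test": 1, "small": 100, "large": 1000}


def generate_input(
    data_dir, size, benchmarks_bucket, input_paths, output_paths, upload_func, nosql_func
):
    # Maps the benchmark size name to a sleep duration in seconds.
    return {"sleep": size_generators[size]}


# None/empty placeholders stand in for the unused storage parameters.
payload = generate_input(None, "small", None, [], [], None, None)
assert payload == {"sleep": 100}
```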
6 changes: 3 additions & 3 deletions benchmarks/000.microbenchmarks/010.sleep/python/function.py
@@ -1,9 +1,9 @@
-
 from time import sleep
 
 
 def handler(event):
-
     # start timing
-    sleep_time = event.get('sleep')
+    sleep_time = event.get("sleep")
     sleep(sleep_time)
-    return { 'result': sleep_time }
+    return {"result": sleep_time}
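The reformatted handler can likewise be smoke-tested outside any serverless runtime; a zero-second sleep exercises the full path without blocking:

```python
from time import sleep


def handler(event):
    # start timing
    sleep_time = event.get("sleep")
    sleep(sleep_time)
    return {"result": sleep_time}


# Zero-second sleep: runs the code path with no delay.
assert handler({"sleep": 0}) == {"result": 0}
```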
10 changes: 6 additions & 4 deletions benchmarks/000.microbenchmarks/020.network-benchmark/input.py
@@ -2,10 +2,12 @@ def buckets_count():
     return 0, 1
 
 
-def generate_input(data_dir, size, benchmarks_bucket, input_paths, output_paths, upload_func, nosql_func):
+def generate_input(
+    data_dir, size, benchmarks_bucket, input_paths, output_paths, upload_func, nosql_func
+):
     return {
-        'bucket': {
-            'bucket': benchmarks_bucket,
-            'output': output_paths[0],
+        "bucket": {
+            "bucket": benchmarks_bucket,
+            "output": output_paths[0],
         },
     }
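The nested event shape this `generate_input` produces can be checked in isolation; the bucket name and output prefix below are made-up placeholders, not values from the repository:

```python
def generate_input(
    data_dir, size, benchmarks_bucket, input_paths, output_paths, upload_func, nosql_func
):
    # Only the bucket name and first output prefix are used.
    return {
        "bucket": {
            "bucket": benchmarks_bucket,
            "output": output_paths[0],
        },
    }


# "demo-bucket" and "run-0/" are illustrative placeholders.
event = generate_input(None, "test", "demo-bucket", [], ["run-0/"], None, None)
assert event["bucket"]["bucket"] == "demo-bucket"
assert event["bucket"]["output"] == "run-0/"
```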
benchmarks/000.microbenchmarks/020.network-benchmark/python/function.py
@@ -1,27 +1,26 @@
 import csv
 import json
 import os.path
 import socket
 from datetime import datetime
 from time import sleep
 
 from . import storage
 
 
 def handler(event):
-
-    request_id = event['request-id']
-    address = event['server-address']
-    port = event['server-port']
-    repetitions = event['repetitions']
-    output_bucket = event.get('bucket').get('bucket')
-    output_prefix = event.get('bucket').get('output')
+    request_id = event["request-id"]
+    address = event["server-address"]
+    port = event["server-port"]
+    repetitions = event["repetitions"]
+    output_bucket = event.get("bucket").get("bucket")
+    output_prefix = event.get("bucket").get("output")
     times = []
     i = 0
     socket.setdefaulttimeout(3)
     server_socket = socket.socket(socket.AF_INET, socket.SOCK_DGRAM)
     server_socket.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
-    server_socket.bind(('', 0))
-    message = request_id.encode('utf-8')
+    server_socket.bind(("", 0))
+    message = request_id.encode("utf-8")
     adr = (address, port)
     consecutive_failures = 0
     while i < repetitions + 1:
@@ -43,16 +42,16 @@ def handler(event):
             consecutive_failures = 0
         server_socket.settimeout(2)
     server_socket.close()
 
     if consecutive_failures != 5:
-        with open('/tmp/data.csv', 'w', newline='') as csvfile:
-            writer = csv.writer(csvfile, delimiter=',')
+        with open("/tmp/data.csv", "w", newline="") as csvfile:
+            writer = csv.writer(csvfile, delimiter=",")
             writer.writerow(["id", "client_send", "client_rcv"])
             for row in times:
                 writer.writerow(row)
 
         client = storage.storage.get_instance()
-        filename = 'results-{}.csv'.format(request_id)
-        key = client.upload(output_bucket, os.path.join(output_prefix, filename), '/tmp/data.csv')
+        filename = "results-{}.csv".format(request_id)
+        key = client.upload(output_bucket, os.path.join(output_prefix, filename), "/tmp/data.csv")
 
-    return { 'result': key }
+    return {"result": key}
Comment on lines 47 to +57
⚠️ Potential issue | 🔴 Critical

Fix uninitialized key when connection setup fails

If the UDP connection fails 5 times, consecutive_failures becomes 5, the loop breaks, and the if consecutive_failures != 5: block is skipped. In that path key is never assigned, but you still return {"result": key}, which will raise an UnboundLocalError.

Initialize key before the conditional (or add an else branch) so the failure path is well-defined:

-    server_socket.close()
-
-    if consecutive_failures != 5:
+    server_socket.close()
+
+    key = None
+    if consecutive_failures != 5:
         with open("/tmp/data.csv", "w", newline="") as csvfile:
             writer = csv.writer(csvfile, delimiter=",")
             writer.writerow(["id", "client_send", "client_rcv"])
             for row in times:
                 writer.writerow(row)
 
         client = storage.storage.get_instance()
         filename = "results-{}.csv".format(request_id)
         key = client.upload(output_bucket, os.path.join(output_prefix, filename), "/tmp/data.csv")
 
     return {"result": key}

The Ruff S108 warnings about /tmp/data.csv are expected in this serverless benchmark context; using a fixed path under /tmp is generally fine here, so I’d treat that as optional to change.

📝 Committable suggestion

‼️ IMPORTANT
Carefully review the code before committing. Ensure that it accurately replaces the highlighted code, contains no missing lines, and has no issues with indentation. Thoroughly test & benchmark the code to ensure it meets the requirements.

Suggested change:

    key = None
    if consecutive_failures != 5:
        with open("/tmp/data.csv", "w", newline="") as csvfile:
            writer = csv.writer(csvfile, delimiter=",")
            writer.writerow(["id", "client_send", "client_rcv"])
            for row in times:
                writer.writerow(row)

        client = storage.storage.get_instance()
        filename = "results-{}.csv".format(request_id)
        key = client.upload(output_bucket, os.path.join(output_prefix, filename), "/tmp/data.csv")

    return {"result": key}
🧰 Tools
🪛 Ruff (0.14.5)

47-47: Probable insecure usage of temporary file or directory: "/tmp/data.csv"

(S108)


55-55: Probable insecure usage of temporary file or directory: "/tmp/data.csv"

(S108)

🤖 Prompt for AI Agents
In benchmarks/000.microbenchmarks/020.network-benchmark/python/function.py
around lines 46-57, the variable `key` can be uninitialized if
`consecutive_failures == 5` (the upload block is skipped) causing an
UnboundLocalError on `return {"result": key}`; fix by defining `key` before the
conditional (e.g., `key = None` or an empty string) or add an `else` branch that
sets `key` to a sentinel/error value, then ensure the returned value is always
defined and meaningful for the failure path.
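The failure mode the review describes is easy to reproduce in isolation. The sketch below is a hypothetical stand-in for the benchmark code (no sockets or storage), showing why the unfixed control flow raises `UnboundLocalError` and how initializing `key` avoids it:

```python
def upload_result(failures):
    # Unfixed flow: `key` is only bound inside the success branch.
    if failures != 5:
        key = "results-demo.csv"  # stands in for client.upload(...)
    return {"result": key}


def upload_result_fixed(failures):
    # Fixed flow: `key` is initialized, so the failure path is well-defined.
    key = None
    if failures != 5:
        key = "results-demo.csv"
    return {"result": key}


# Success path works either way.
assert upload_result(0) == {"result": "results-demo.csv"}

# Five consecutive failures skip the branch; `key` is referenced unbound.
try:
    upload_result(5)
except UnboundLocalError:
    pass
else:
    raise AssertionError("expected UnboundLocalError")

# The fixed version returns a sentinel on the failure path instead.
assert upload_result_fixed(5) == {"result": None}
```

Because `key` is assigned somewhere in the function body, Python treats it as a local in every branch, so the failure path raises rather than falling back to any global.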

@@ -1,12 +1,13 @@
-
-
 def buckets_count():
     return 0, 1
 
-def generate_input(data_dir, size, benchmarks_bucket, input_paths, output_paths, upload_func, nosql_func):
+
+def generate_input(
+    data_dir, size, benchmarks_bucket, input_paths, output_paths, upload_func, nosql_func
+):
     return {
-        'bucket': {
-            'bucket': benchmarks_bucket,
-            'output': output_paths[0],
+        "bucket": {
+            "bucket": benchmarks_bucket,
+            "output": output_paths[0],
         },
     }