Commit e9f0918
E2E Task Runner automation for torch/histology_s3 and s3 datasource (#1640)
* Initial draft not tested
* dM
* Modified
* Added to wf only for testing
* Added step to install minio and its client
* Final changes
* Extra comment for s3 wf
* Modified
* Modified
* Pass time_for_each_round
* New test and yaml for verifiable dataset
* Removed s3 test from basic e2e yaml
* Lint and format check applied
* Docstring added
* Corrected logic to call prepare_data_for_s3
* Added s3_bucket model
* Steps added in the test file
* Added no-op and s3 wf in publish dependency list
* Fixed the comment while checking calc_hash flag

Signed-off-by: noopur <noopur@intel.com>
1 parent 7fcecd3 commit e9f0918

File tree: 13 files changed, +1192 −15 lines

.github/actions/tr_post_test_run/action.yml

Lines changed: 1 addition & 1 deletion

@@ -24,7 +24,7 @@ runs:
     id: tar_files
     if: ${{ always() }}
     run: |
-      tar -cvf result.tar --exclude="cert" --exclude="data" --exclude="__pycache__" --exclude="tensor.db" --exclude="workspace.tar" $HOME/results
+      tar -cvf result.tar --exclude="cert" --exclude="data" --exclude="__pycache__" --exclude="tensor.db" --exclude="workspace.tar" --exclude="minio_data" $HOME/results
       # Model name might contain forward slashes, convert them to underscore.
       tmp=${{ env.MODEL_NAME }}
       echo "MODEL_NAME_MODIFIED=${tmp//\//_}" >> $GITHUB_ENV
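The bash parameter expansion `${tmp//\//_}` in the step above replaces every forward slash in the model name with an underscore, so a name like `torch/histology_s3` becomes safe to use in artifact file names. The same transform in Python, as an illustrative sketch only (this helper is not part of the repo):

```python
def sanitize_model_name(model_name: str) -> str:
    """Replace forward slashes with underscores, mirroring the
    bash substitution used in the composite action above."""
    return model_name.replace("/", "_")

print(sanitize_model_name("torch/histology_s3"))  # torch_histology_s3
```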

.github/workflows/pq_pipeline.yml

Lines changed: 12 additions & 0 deletions

@@ -158,6 +158,16 @@ jobs:
     with:
       commit_id: ${{ needs.set_commit_id_for_all_jobs.outputs.commit_id }}

+  tr_verifiable_dataset_e2e:
+    if: |
+      (github.event_name == 'schedule' && github.repository_owner == 'securefederatedai') ||
+      (github.event_name == 'workflow_dispatch')
+    name: TaskRunner Verifiable Dataset E2E
+    needs: task_runner_e2e
+    uses: ./.github/workflows/tr_verifiable_dataset_e2e.yml
+    with:
+      commit_id: ${{ needs.set_commit_id_for_all_jobs.outputs.commit_id }}
+
   run_trivy:
     if: |
       (github.event_name == 'schedule' && github.repository_owner == 'securefederatedai') ||
@@ -198,6 +208,7 @@ jobs:
       wf_mnist_local_runtime,
       wf_watermark_e2e,
       wf_secagg_e2e,
+      task_runner_connectivity_e2e,
       task_runner_e2e,
       task_runner_resiliency_e2e,
       task_runner_fedeval_e2e,
@@ -206,6 +217,7 @@ jobs:
       task_runner_dockerized_e2e,
       task_runner_secret_ssl_e2e,
       task_runner_flower_app_pytorch,
+      tr_verifiable_dataset_e2e,
       run_trivy,
       run_bandit
     ]
.github/workflows/tr_verifiable_dataset_e2e.yml

Lines changed: 81 additions & 0 deletions

@@ -0,0 +1,81 @@
+---
+# Task Runner Verifiable Dataset E2E
+
+name: TR_Verifiable_Dataset_E2E # Please do not modify the name as it is used in the composite action
+
+on:
+  workflow_call:
+    inputs:
+      commit_id:
+        required: false
+        type: string
+  workflow_dispatch:
+    inputs:
+      num_rounds:
+        description: "Number of rounds to train"
+        required: false
+        default: "2"
+        type: string
+      num_collaborators:
+        description: "Number of collaborators"
+        required: false
+        default: "2"
+        type: string
+
+permissions:
+  contents: read
+
+# Environment variables common for all the jobs
+# DO NOT use double quotes for the values of the environment variables
+env:
+  NUM_ROUNDS: ${{ inputs.num_rounds || 2 }}
+  NUM_COLLABORATORS: ${{ inputs.num_collaborators || 2 }}
+  COMMIT_ID: ${{ inputs.commit_id || github.sha }} # use commit_id from the calling workflow
+
+jobs:
+  test_with_s3: # Run it only if the runner machine has enough memory and CPU
+    name: With S3 (torch/histology_s3, 3.11)
+    runs-on: ubuntu-22.04
+    timeout-minutes: 120
+    env:
+      MODEL_NAME: "torch/histology_s3"
+      PYTHON_VERSION: "3.11"
+
+    steps:
+      - name: Checkout OpenFL repository
+        id: checkout_openfl
+        uses: actions/checkout@v4
+        with:
+          ref: ${{ env.COMMIT_ID }}
+
+      - name: Pre test run
+        uses: ./.github/actions/tr_pre_test_run
+        if: ${{ always() }}
+
+      - name: Install MinIO
+        id: install_minio
+        run: |
+          wget https://dl.min.io/server/minio/release/linux-amd64/minio
+          chmod +x minio
+          sudo mv minio /usr/local/bin/
+
+      - name: Install MinIO Client
+        id: install_minio_client
+        run: |
+          wget https://dl.min.io/client/mc/release/linux-amd64/mc
+          chmod +x mc
+          sudo mv mc /usr/local/bin/
+
+      - name: Run Task Runner E2E tests with S3
+        id: run_tests
+        run: |
+          python -m pytest -s tests/end_to_end/test_suites/tr_verifiable_dataset_tests.py \
+            -m task_runner_with_s3 --model_name ${{ env.MODEL_NAME }} \
+            --num_rounds ${{ env.NUM_ROUNDS }} --num_collaborators ${{ env.NUM_COLLABORATORS }}
+          echo "Task Runner E2E tests with S3 run completed"
+
+      - name: Post test run
+        uses: ./.github/actions/tr_post_test_run
+        if: ${{ always() }}
+        with:
+          test_type: "With_S3"
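The workflow installs the MinIO server and client binaries but does not start the server here; the test suite presumably launches it (for example, when preparing data for S3). A hypothetical readiness helper, not taken from the repo, that a harness could use to wait for MinIO on its default port 9000 before running the S3 tests:

```python
import socket
import time

def wait_for_port(host: str, port: int, timeout: float = 30.0) -> bool:
    """Poll until a TCP service (e.g. a local MinIO server) accepts
    connections, or give up after `timeout` seconds."""
    deadline = time.monotonic() + timeout
    while time.monotonic() < deadline:
        try:
            with socket.create_connection((host, port), timeout=1.0):
                return True  # something is listening
        except OSError:
            time.sleep(0.5)  # not up yet, retry shortly
    return False
```

Calling `wait_for_port("127.0.0.1", 9000)` right after launching `minio server` lets the harness fail fast with a clear error instead of letting the pytest run hit its 120-minute timeout.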

tests/end_to_end/models/collaborator.py

Lines changed: 23 additions & 0 deletions

@@ -246,3 +246,26 @@ def ping_aggregator(self):
             log.error(f"{error_msg}: {e}")
             raise e
         return True
+
+    def calculate_hash(self):
+        """
+        Calculate the hash of the data directory and store it in a hash.txt file.
+
+        Returns:
+            bool: True if successful, else False
+        """
+        try:
+            log.info(f"Calculating hash for {self.collaborator_name}")
+            cmd = f"fx collaborator calchash --data_path {self.data_directory_path}"
+            error_msg = "Failed to calculate hash"
+            return_code, output, error = fh.run_command(
+                cmd,
+                error_msg=error_msg,
+                container_id=self.container_id,
+                workspace_path=self.workspace_path,
+            )
+            fh.verify_cmd_output(output, return_code, error, error_msg, f"Calculated hash for {self.collaborator_name}")
+
+        except Exception as e:
+            log.error(f"{error_msg}: {e}")
+            raise e
+        return True
