This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: Test Illumina Genotyping Array | ||
# Controls when the workflow will run | ||
on: | ||
#run on push to feature branch "kp_GHA_Terra_auth_PD-2682" - REMOVE WHEN DONE TESTING | ||
# push: | ||
# branches: | ||
# - kp_GHA_Terra_auth_PD-2682 | ||
pull_request: | ||
branches: [ "develop", "staging", "master" ] | ||
# Only run if files in these paths changed: pipelines/broad/genotyping/illumina, tasks, verification, .github/workflows/test_illumina_genotyping_array.yml | ||
#################################### | ||
# SET PIPELINE SPECIFIC PATHS HERE # | ||
#################################### | ||
paths: | ||
- 'pipelines/broad/genotyping/illumina/**' | ||
- 'tasks/**' | ||
- 'verification/**' | ||
- '.github/workflows/test_illumina_genotyping_array.yml' | ||
# Allows you to run this workflow manually from the Actions tab | ||
workflow_dispatch: | ||
inputs: | ||
useCallCache: | ||
description: 'Use call cache (default: true)' | ||
required: false | ||
default: "true" | ||
updateTruth: | ||
description: 'Update truth files (default: false)' | ||
required: false | ||
default: "false" | ||
env: | ||
PROJECT_NAME: WARP | ||
# Github repo name | ||
REPOSITORY_NAME: ${{ github.event.repository.name }} | ||
jobs: | ||
run_pipeline: | ||
runs-on: ubuntu-latest | ||
# Add "id-token" with the intended permissions. | ||
permissions: | ||
contents: 'read' | ||
id-token: 'write' | ||
steps: | ||
# actions/checkout MUST come before auth | ||
- uses: 'actions/checkout@v3' | ||
- id: 'auth' | ||
name: 'Authenticate to Google Cloud' | ||
uses: 'google-github-actions/auth@v2' | ||
with: | ||
token_format: 'access_token' | ||
# Centralized in dsp-tools-k8s; ask in #dsp-devops-champions for help troubleshooting | ||
# This is provided by the DevOps team - do not change! | ||
workload_identity_provider: 'projects/1038484894585/locations/global/workloadIdentityPools/github-wi-pool/providers/github-wi-provider' | ||
# This is our tester service account | ||
service_account: '[email protected]' | ||
access_token_lifetime: '3600' #seconds, default is 3600 | ||
access_token_scopes: 'profile, email, openid' | ||
# ... further steps are automatically authenticated | ||
- name: Check working directory | ||
run: | | ||
echo "Current directory:" | ||
pwd | ||
ls -lht | ||
- name: Submit job, poll status, and get outputs | ||
id: pipeline_run | ||
run: | | ||
# Set common environment variables | ||
TOKEN="${{ steps.auth.outputs.access_token }}" | ||
NAMESPACE="warp-pipelines" | ||
WORKSPACE="WARP Tests" | ||
USE_CALL_CACHE="${{ github.event.inputs.useCallCache }}" | ||
UPDATE_TRUTH="${{ github.event.inputs.updateTruth }}" | ||
# TODO: Need to get the test type (Plumbing/ Scientific) from inputs or based on the target branch | ||
TEST_TYPE="Plumbing" # Placeholder for now | ||
CURRENT_TIME=$(date +"%Y-%m-%d-%H-%M-%S") | ||
######################################## | ||
# SET PIPELINE SPECIFIC VARIABLES HERE # | ||
######################################## | ||
PIPELINE_NAME="IlluminaGenotypingArray" | ||
PIPELINE_DIR="pipelines/broad/genotyping/illumina" | ||
# TODO: Need to set the truth and result paths appropriately | ||
TRUTH_PATH="gs://broad-warp-test-storage/illumina_genotyping_array/truth" | ||
RESULTS_PATH="gs://broad-warp-test-storage/illumina_genotyping_array/results/$CURRENT_TIME" | ||
# Function to call the Firecloud API using the firecloud_api.py script | ||
firecloud_action() { | ||
python3 scripts/firecloud_api/firecloud_api.py --token "$TOKEN" --namespace "$NAMESPACE" --workspace "$WORKSPACE" --action "$1" "${@:2}" | ||
} | ||
# Convert USE_CALL_CACHE to a boolean-friendly format ("true" -> true, "false" -> false) | ||
if [ "$USE_CALL_CACHE" = "true" ]; then | ||
USE_CALL_CACHE_BOOL=true | ||
else | ||
USE_CALL_CACHE_BOOL=false | ||
fi | ||
# Create the submission_data.json file which will be the same for all inputs | ||
SUBMISSION_DATA_FILE="submission_data.json" | ||
# Use a heredoc to generate the JSON file content dynamically | ||
cat <<EOF > "$SUBMISSION_DATA_FILE" | ||
{ | ||
"methodConfigurationNamespace": "warp-pipelines", | ||
"methodConfigurationName": "$PIPELINE_NAME", | ||
"useCallCache": $USE_CALL_CACHE_BOOL, | ||
"deleteIntermediateOutputFiles": false, | ||
"useReferenceDisks": true, | ||
"memoryRetryMultiplier": 1.2, | ||
"workflowFailureMode": "NoNewCalls", | ||
"userComment": "Automated submission", | ||
"ignoreEmptyOutputs": false | ||
} | ||
EOF | ||
echo "Created submission data file: $SUBMISSION_DATA_FILE" | ||
# Loop through each file in the appropriate test inputs directory | ||
INPUTS_DIR=$PIPELINE_DIR/test_inputs/$TEST_TYPE | ||
for input_file in $INPUTS_DIR/*; do | ||
# Update input_file as needed for test | ||
test_input_file=$(python3 scripts/firecloud_api/UpdateTestInputs.py --truth_path $TRUTH_PATH \ | ||
--results_path $RESULTS_PATH \ | ||
--inputs_json $input_file \ | ||
--update_truth UPDATE_TRUTH) | ||
# Upload the input file to the workspace | ||
firecloud_action upload_file --pipeline_name $PIPELINE_NAME --test_input_file "$test_input_file" | ||
echo "Submitting job for input file: $input_file" | ||
# Submit job for the input file | ||
# 1. Create a new submission | ||
# 2. Poll submission status and get workflow IDs and statuses | ||
# 3. Iterate over the Workflow IDs to get outputs | ||
done | ||
##################################### LEFT OFF HERE ####################################### | ||
# TODO: move the submission and monitoring into the for loop to occur for each input file # | ||
########################################################################################### | ||
# 1. Submit a new workflow using the generated submission_data.json | ||
SUBMISSION_ID=$(firecloud_action submit --submission_data_file "$SUBMISSION_DATA_FILE") | ||
# Check if submission was successful | ||
if [ -z "$SUBMISSION_ID" ]; then | ||
echo "Submission failed." # Log failure to stdout | ||
echo "submission_id=" >> $GITHUB_OUTPUT # Set empty submission id | ||
exit 1 | ||
fi | ||
echo "Submission ID: $SUBMISSION_ID" | ||
echo "submission_id=$SUBMISSION_ID" >> $GITHUB_OUTPUT # Write the submission ID to GITHUB_OUTPUT | ||
# 2. Poll submission status and get workflow IDs and statuses | ||
echo "Polling submission status..." | ||
RESPONSE=$(firecloud_action poll_status --submission_id "$SUBMISSION_ID") | ||
# Parse the JSON response to get the workflow ID and statuses | ||
echo "Workflows and their statuses:" | ||
echo "$RESPONSE" | jq | ||
# Check if RESPONSE is empty | ||
if [ -z "$RESPONSE" ]; then | ||
echo "Failed to retrieve Workflow IDs." # Log failure to stdout | ||
exit 1 | ||
fi | ||
# Extract workflows and their statuses | ||
WORKFLOW_STATUSES=$(echo "$RESPONSE" | jq -r 'to_entries | map(.key + ": " + .value) | .[]') | ||
echo "workflow_statuses=$WORKFLOW_STATUSES" >> $GITHUB_OUTPUT # Write workflow statuses to GITHUB_OUTPUT | ||
# Generate markdown summary table for workflows and statuses | ||
WORKFLOW_TABLE=$(echo "$RESPONSE" | jq -r 'to_entries | ["Workflow ID | Status", "--- | ---"] + map(.key + " | " + .value) | .[]') | ||
# Print workflow table to stdout | ||
echo "$WORKFLOW_TABLE" | ||
# 3. Iterate over the Workflow IDs to get outputs | ||
OUTPUTS="" | ||
echo "Retrieving workflow outputs..." | ||
for WORKFLOW_ID in $(echo "$RESPONSE" | jq -r 'keys[]'); do | ||
WORKFLOW_OUTPUT=$(firecloud_action get_outputs --submission_id "$SUBMISSION_ID" --workflow_id "$WORKFLOW_ID" --pipeline_name "$PIPELINE_NAME") | ||
OUTPUTS+="$WORKFLOW_OUTPUT"$'\n' | ||
done | ||
echo "Workflow outputs retrieved successfully." | ||
echo "Raw output before jq:" | ||
echo "$OUTPUTS" | ||
echo "outputs=$OUTPUTS" >> $GITHUB_OUTPUT # Write the outputs to GITHUB_OUTPUT | ||
# Handle null values, strings, and numbers in the outputs by converting everything to a string and replacing null with '-' | ||
OUTPUTS_TABLE=$(echo "$OUTPUTS" | jq -r 'to_entries | ["Output | Value", "--- | ---"] + map(.key + " | " + (if .value == null then "-" else (.value | tostring) end)) | .[]') | ||
#print outputs table to stdout | ||
echo "$OUTPUTS_TABLE" | ||
- name: Print Summary on Success | ||
if: success() | ||
run: | | ||
echo "# :white_check_mark: Pipeline Execution Summary :white_check_mark:" >> $GITHUB_STEP_SUMMARY | ||
echo "- **Pipeline Name**: IlluminaGenotypingArray" >> $GITHUB_STEP_SUMMARY | ||
echo "- **Submission ID**: ${{ steps.pipeline_run.outputs.submission_id }}" >> $GITHUB_STEP_SUMMARY | ||
echo "" >> $GITHUB_STEP_SUMMARY | ||
echo "## Workflows and their statuses" >> $GITHUB_STEP_SUMMARY | ||
echo "\`\`\`" >> $GITHUB_STEP_SUMMARY | ||
echo "${{ steps.pipeline_run.outputs.workflow_statuses }}" >> $GITHUB_STEP_SUMMARY | ||
echo "\`\`\`" >> $GITHUB_STEP_SUMMARY | ||
echo "## Workflow Outputs" >> $GITHUB_STEP_SUMMARY | ||
echo "\`\`\`" >> $GITHUB_STEP_SUMMARY | ||
echo "${{ steps.pipeline_run.outputs.outputs }}" >> $GITHUB_STEP_SUMMARY | ||
echo "\`\`\`" >> $GITHUB_STEP_SUMMARY | ||
echo " :shipit: " >> $GITHUB_STEP_SUMMARY | ||
- name: Print Summary on Failure | ||
if: failure() | ||
run: | | ||
echo "# :x: Pipeline Execution Summary (on Failure) :x: " >> $GITHUB_STEP_SUMMARY | ||
echo "- **Pipeline Name**: IlluminaGenotypingArray" >> $GITHUB_STEP_SUMMARY | ||
echo "- **Submission ID**: ${{ steps.pipeline_run.outputs.submission_id }}" >> $GITHUB_STEP_SUMMARY | ||
echo "" >> $GITHUB_STEP_SUMMARY | ||
echo "## Workflows and their statuses (if available)" >> $GITHUB_STEP_SUMMARY | ||
echo "\`\`\`" >> $GITHUB_STEP_SUMMARY | ||
echo "${{ steps.pipeline_run.outputs.workflow_statuses }}" >> $GITHUB_STEP_SUMMARY | ||
echo "\`\`\`" >> $GITHUB_STEP_SUMMARY | ||
echo "## Workflow Outputs (if available)" >> $GITHUB_STEP_SUMMARY | ||
echo "\`\`\`" >> $GITHUB_STEP_SUMMARY | ||
echo "${{ steps.pipeline_run.outputs.outputs }}" >> $GITHUB_STEP_SUMMARY | ||
echo "\`\`\`" >> $GITHUB_STEP_SUMMARY |