Skip to content

Commit

Permalink
2.Pre-compiled end-to-end gpu driver validation
Browse files Browse the repository at this point in the history
Signed-off-by: shiva kumar <[email protected]>
  • Loading branch information
shivakunv committed Aug 27, 2024
1 parent b7e165e commit 10c55f0
Showing 1 changed file with 22 additions and 21 deletions.
43 changes: 22 additions & 21 deletions .github/workflows/ci-precompiled.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -89,27 +89,28 @@ jobs:
OPERATOR_OPTIONS: "--set driver.repository=${{ env.PRIVATE_REGISTRY }}/nvidia --set driver.usePrecompiled=true"
run: |
# For every driver version in DRIVER_VERSIONS: run the kernel-upgrade script,
# wait for the remote host, then run the e2e test case. Any failure is
# remembered in rc so that all versions are still attempted and the logs are
# pulled before the step exits with rc.
#
# Reads: DRIVER_VERSIONS, UPGRADE_KERNEL_SCRIPT, KERNEL_FLAVOR, TEST_CASE,
#        OPERATOR_OPTIONS.
rc=0
# DRIVER_VERSIONS is deliberately unquoted: it is split on whitespace into
# one loop iteration per version.
for driver_version in ${DRIVER_VERSIONS}; do
  echo "Running e2e for DRIVER_VERSION=$driver_version"
  # Keep only the text before the first '.'.
  DRIVER_VERSION="${driver_version%%.*}"
  upgrade_status=0
  # Use ARG3=OPERATOR_OPTIONS as KERNEL_FLAVOR in case of kernel upgrade
  ./tests/ci-run-e2e.sh "${UPGRADE_KERNEL_SCRIPT}" "${DRIVER_VERSION}" "${KERNEL_FLAVOR}" || upgrade_status=$?
  # On the target system, all scripts/test cases exit with code 1 on error.
  # A reboot during the kernel upgrade drops the SSH connection and yields
  # some other non-zero code, which must not fail the job. Therefore only
  # exit code 1 is treated as a real failure of the upgrade step; every
  # other code is assumed to be a reboot-related disconnect and is ignored.
  if [ "$upgrade_status" -eq 1 ]; then
    echo "e2e validation failed for driver branch $DRIVER_VERSION and kernel flavor $KERNEL_FLAVOR with status $upgrade_status"
    rc=$upgrade_status
  fi
  sleep 30
  ./tests/scripts/remote_retry.sh
  # Track the test case separately from the upgrade step so that a tolerated
  # upgrade status cannot leak into the test result, and make sure a failing
  # test case is actually reflected in the step's exit code.
  test_status=0
  ./tests/ci-run-e2e.sh "${TEST_CASE}" "${DRIVER_VERSION}" "${OPERATOR_OPTIONS}" || test_status=$?
  if [ "$test_status" -ne 0 ]; then
    echo "e2e test case ${TEST_CASE} failed for driver branch $DRIVER_VERSION with status $test_status"
    rc=$test_status
  fi
done
./tests/scripts/pull.sh /tmp/logs logs
exit "$rc"
# NOTE(review): every line of the e2e loop below is commented out, so this
# step only prints a marker string. No upgrade script, test case, or log
# pull is invoked here, and rc is never set or used.
echo "SHIVA"
# for driver_version in ${DRIVER_VERSIONS}; do
# echo "Running e2e for DRIVER_VERSION=$driver_version"
# DRIVER_VERSION=$(echo "${driver_version}" | cut -d '.' -f 1)
# status=0
# # Use ARG3=OPERATOR_OPTIONS as KERNEL_FLAVOR in case of kernel upgrade
# ./tests/ci-run-e2e.sh "${UPGRADE_KERNEL_SCRIPT}" "${DRIVER_VERSION}" "${KERNEL_FLAVOR}" || status=$?
# # On the target system, all scripts/test-case exit with code 1 for error handling.
# # However, since reboot-related disconnections break the SSH connection
# # and can cause the entire job to exit, we should ignore all errors except
# # exit code 1. During a reboot, exit code 1 will not be thrown, so handling
# # other errors as code 1 will ensure proper management of reboot scenarios
# if [ $status -eq 1 ]; then
# echo "e2e validation failed for driver branch $DRIVER_VERSION and kernel flavor $KERNEL_FLAVOR with status $status"
# rc=$status
# fi
# sleep 30
# ./tests/scripts/remote_retry.sh
# ./tests/ci-run-e2e.sh "${TEST_CASE}" "${DRIVER_VERSION}" "${OPERATOR_OPTIONS}" || status=$?
# done
# ./tests/scripts/pull.sh /tmp/logs logs
# exit $rc

- name: Archive test logs
if: ${{ failure() }}
Expand Down

0 comments on commit 10c55f0

Please sign in to comment.