Self-hosted runner with slow tests (scheduled)

CI nightlies cpu/gpu & cleanup #20

Workflow file for this run

.github/workflows/nightly-tests.yml at 614e342

	# Inspired by
	# https://github.com/huggingface/peft/blob/main/.github/workflows/nightly.yml
	name: Self-hosted runner with slow tests (scheduled)

	on:
	pull_request: # TODO(aliberts): for testing, delete before merge
	branches:
	- main
	workflow_dispatch:
	schedule:
	- cron: "0 2 * * *"

	env:
	RUN_SLOW: "yes"
	IS_GITHUB_CI: "1"
	# To be able to run tests on CUDA 12.2
	NVIDIA_DISABLE_REQUIRE: "1"
	# SLACK_API_TOKEN: ${{ secrets.SLACK_API_TOKEN }}


	jobs:
	# run_all_tests_cpu:
	# strategy:
	# fail-fast: false
	# runs-on: ubuntu-latest
	# env:
	# CUDA_VISIBLE_DEVICES: "0"
	# TEST_TYPE: "single_gpu"
	# container:
	# image: huggingface/lerobot-cpu:latest
	# credentials:
	# username: ${{ secrets.DOCKERHUB_USERNAME }}
	# password: ${{ secrets.DOCKERHUB_PASSWORD }}
	# defaults:
	# run:
	# shell: bash
	# working-directory: /lerobot
	# steps:
	# - name: Check
	# run: \|
	# pwd
	# python --version
	# which python
	# ls -glh
	# ls -glh /opt/venv/
	# ls -glh /opt/venv/lib
	# ls -glh /opt/venv/lib/python3.10/site-packages
	# - name: Tests
	# env:
	# DATA_DIR: tests/data
	# MUJOCO_GL: egl
	# MUJOCO_EGL_DEVICE_ID: 0
	# run: \|
	# unset DISPLAY
	# pytest -v --cov=./lerobot --cov-report=xml tests
	# - name: Tests end-to-end
	# env:
	# DATA_DIR: tests/data
	# MUJOCO_GL: egl
	# run: \|
	# make test-ete

	run_all_tests_single_gpu:
	strategy:
	fail-fast: false
	runs-on: [single-gpu, nvidia-gpu, t4, ci]
	env:
	CUDA_VISIBLE_DEVICES: "0"
	TEST_TYPE: "single_gpu"
	container:
	image: huggingface/lerobot-gpu:latest
	options: --gpus all --shm-size "16gb" -e NVIDIA_DISABLE_REQUIRE=true -e DATA_DIR=tests/data/ -e MUJOCO_GL=egl
	credentials:
	username: ${{ secrets.DOCKERHUB_USERNAME }}
	password: ${{ secrets.DOCKERHUB_PASSWORD }}
	defaults:
	run:
	shell: bash
	working-directory: /lerobot
	steps:
	# - uses: actions/checkout@v4
	- name: Nvidia-smi
	run: nvidia-smi
	- name: Install EGL
	run: apt-get update && apt-get install -y libegl1-mesa-dev
	- name: Test
	env:
	DATA_DIR: tests/data
	MUJOCO_GL: egl
	run: \|
	pytest -v --cov=./lerobot --cov-report=xml tests
	- name: Tests end-to-end
	env:
	DATA_DIR: tests/data
	MUJOCO_GL: egl
	run: \|
	make test-ete
	- name: Tailscale Wait
	if: ${{ failure() \|\| runner.debug == '1' }}
	uses: huggingface/tailscale-action@main
	with:
	waitForSSH: true
	authkey: ${{ secrets.TAILSCALE_SSH_AUTHKEY }}
	slackChannel: ${{ secrets.SLACK_CIFEEDBACK_CHANNEL }}
	slackToken: ${{ secrets.SLACK_CIFEEDBACK_BOT_TOKEN }}

	# - name: Generate Report
	# if: always()
	# run: \|
	# pip install slack_sdk tabulate
	# python scripts/log_reports.py >> $GITHUB_STEP_SUMMARY

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

CI nightlies cpu/gpu & cleanup #20

Workflow file

CI nightlies cpu/gpu & cleanup #20

Jobs

Run details

Workflow file for this run