Fix rope_cache_length computation for models with rope_local_base_freq #8072

Workflow file for this run

.github/workflows/cpu-tests.yml at 814f44c

	name: CPU tests

	on:
	push:
	branches: [main]
	pull_request_target:
	branches: [main]
	types: [opened, reopened, ready_for_review, labeled, synchronize]
	pull_request: {} # todo
	workflow_dispatch: {}

	# lock down all permissions by default
	permissions:
	contents: read # needed to check out code
	checks: write # needed for test results
	pull-requests: read # needed for PR metadata
	actions: read # needed to use actions
	security-events: none
	statuses: write # needed to update commit status

	concurrency:
	group: ${{ github.workflow }}-${{ github.ref }}-${{ github.head_ref }}
	cancel-in-progress: ${{ startsWith(github.event_name, 'pull_request') }}

	defaults:
	run:
	shell: bash

	env:
	HF_HOME: .cache-HF # Define HF_HOME for caching
	TRANSFORMERS_CACHE: .cache-HF/transformers
	DATASETS_CACHE: .cache-HF/datasets
	HF_DATASETS_CACHE: .cache-HF/datasets
	TORCH_URL: "https://download.pytorch.org/whl/cpu/"

	jobs:
	testing-imports:
	runs-on: ${{ matrix.os }}
	if: github.event_name != 'pull_request_target'
	strategy:
	fail-fast: false
	matrix:
	os: ["ubuntu-22.04", "ubuntu-24.04", "macOS-14", "windows-2022"]
	python-version: ["3.10"]
	timeout-minutes: 10
	steps:
	- name: Checkout generic
	uses: actions/checkout@v6
	- uses: actions/setup-python@v6
	with:
	python-version: ${{ matrix.python-version }}

	- name: Install minimal dependencies
	run: \|
	pip install . -U --extra-index-url="${TORCH_URL}"
	pip list

	- name: Testing package imports
	# make sure all modules are still importable with only the minimal dependencies available
	run: \|
	modules=$(
	find litgpt -type f -name "*.py" \| \
	sed 's/\.py$//' \| sed 's/\//./g' \| \
	sed 's/.__init__//g' \| xargs -I {} echo "import {};"
	)
	echo "$modules"
	python -c "$modules"

	pytester:
	# Route PRs based on contributor type to avoid duplicate runs:
	# - Collaborators: use pull_request (tests workflow changes from PR)
	# - External forks: use pull_request_target (uses trusted workflow from main)
	# - Always run for push to main and workflow_dispatch
	if: \|
	(github.event_name == 'pull_request' && contains('OWNER,MEMBER,COLLABORATOR', github.event.pull_request.author_association)) \|\|
	(github.event_name == 'pull_request_target' && !contains('OWNER,MEMBER,COLLABORATOR', github.event.pull_request.author_association)) \|\|
	(github.event_name != 'pull_request' && github.event_name != 'pull_request_target')
	runs-on: ${{ matrix.os }}
	strategy:
	fail-fast: false
	matrix:
	os: ["ubuntu-22.04"]
	python-version: ["3.10", "3.11", "3.12", "3.13"]
	requires: ["latest"]
	include:
	- { os: "ubuntu-22.04", python-version: "3.10", requires: "oldest" }
	- { os: "windows-2022", python-version: "3.10", requires: "latest" }
	- { os: "macOS-14", python-version: "3.10", requires: "latest" }
	timeout-minutes: 35
	steps:
	- name: Checkout generic
	uses: actions/checkout@v6
	if: github.event_name != 'pull_request_target'
	- name: Checkout for `pull_request_target`
	uses: actions/checkout@v6
	if: github.event_name == 'pull_request_target'
	with:
	ref: ${{ github.event.pull_request.head.sha }}
	- uses: actions/setup-python@v6
	with:
	python-version: ${{ matrix.python-version }}
	cache-dependency-path: pyproject.toml
	cache: "pip"

	# Add caching for HF models and tokenizers
	- name: HF cache
	uses: actions/cache@v5
	continue-on-error: true
	with:
	path: .cache-HF
	key: hf-cache_${{ runner.os }}-py${{ matrix.python-version }}
	restore-keys: \|
	hf-cache_${{ runner.os }}-py${{ matrix.python-version }}
	hf-cache_${{ runner.os }}-
	hf-cache_

	- name: Set min. dependencies
	if: matrix.requires == 'oldest'
	run: \|
	pip install 'lightning-utilities[cli]>=0.15.1'
	python -m lightning_utilities.cli requirements set-oldest --req_files=pyproject.toml
	- name: Install dependencies
	run: \|
	pip install '.[extra,compiler,test]' -U --upgrade-strategy eager --extra-index-url="${TORCH_URL}"
	pip list

	- name: Run tests
	env:
	HF_TOKEN: ${{ secrets.HF_TOKEN }}
	run: pytest -v litgpt/ tests/ --timeout=180 --durations=100

	- name: Show cache
	run: \|
	pip install -q py-tree
	python -m py_tree -d 1 .cache-HF

	testing-guardian:
	runs-on: ubuntu-latest
	needs: [pytester, testing-imports]
	if: \|
	(github.event_name == 'pull_request_target' && !contains('OWNER,MEMBER,COLLABORATOR', github.event.pull_request.author_association)) \|\|
	(github.event_name == 'pull_request' && contains('OWNER,MEMBER,COLLABORATOR', github.event.pull_request.author_association))
	steps:
	- run: echo "${{ needs.pytester.result }}"
	- name: failing...
	if: needs.pytester.result == 'failure'
	run: exit 1
	- name: cancelled or skipped...
	if: contains(fromJSON('["cancelled", "skipped"]'), needs.pytester.result)
	timeout-minutes: 1
	run: sleep 90

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Fix rope_cache_length computation for models with rope_local_base_freq #8072

Workflow file

Fix rope_cache_length computation for models with rope_local_base_freq #8072

Uh oh!

Workflow file for this run