Skip to content

[BugFix] Infer reward model pad token from model tokenizer #11023

[BugFix] Infer reward model pad token from model tokenizer

[BugFix] Infer reward model pad token from model tokenizer #11023

Workflow file for this run

# Wheel build pipeline; the jobs in this file target the macos-arm64 platform.
name: Build M1 Wheels

on:
  # Every pull request triggers a run (no branch or path filter is applied).
  pull_request:
  push:
    branches:
      - nightly
      - main
      - 'release/*'
    tags:
      # Binary build pipelines are only meant to fire for release-candidate
      # tags, which look like: v1.11.0-rc1
      - 'v[0-9]+.[0-9]+.[0-9]+-rc[0-9]+'
  # Manual run; exposes a single boolean toggle for the CPU build.
  workflow_dispatch:
    inputs:
      build-cpu:
        description: 'Build CPU wheels'
        type: boolean
        required: false
        default: true
  # Reusable-workflow entry point. Every input is optional and string-typed;
  # the jobs fall back to the defaults below when a value is not supplied.
  workflow_call:
    inputs:
      test-infra-ref:
        description: 'PyTorch test-infra ref (main for nightly, release/X.Y for stable)'
        type: string
        required: false
        default: 'main'
      tensordict-source:
        description: 'TensorDict source: stable (PyPI), git, or auto (branch-based detection)'
        type: string
        required: false
        default: 'auto'
      channel:
        description: 'Build channel: nightly, test, release, or empty for auto-detection'
        type: string
        required: false
        default: ''
      with-cpu:
        description: 'Build with CPU (enable/disable)'
        type: string
        required: false
        default: 'enable'
# Token scopes granted to the jobs of this workflow.
permissions:
  # Read-only access to repository contents.
  contents: read
  # Allows jobs to request an OIDC token.
  # NOTE(review): presumably required by the pytorch/test-infra workflows
  # called below - confirm before tightening.
  id-token: write
env:
  # Where the build scripts should take TensorDict from; defaults to 'auto'
  # when the `tensordict-source` input is not provided.
  # Caveat: this value may not reach the workflows called from
  # pytorch/test-infra, so the scripts also fall back to branch-based
  # detection via GITHUB_REF_NAME.
  TENSORDICT_SOURCE: ${{ inputs.tensordict-source || 'auto' }}
jobs:
  # Asks the pytorch/test-infra reusable workflow for the wheel build matrix
  # of the macos-arm64 platform. Its `matrix` output feeds the `build` job.
  # The reusable workflow itself is pinned to @main; only the `test-infra-ref`
  # input follows the caller's choice.
  generate-matrix:
    uses: pytorch/test-infra/.github/workflows/generate_binary_build_matrix.yml@main
    with:
      package-type: wheel
      os: macos-arm64
      test-infra-repository: pytorch/test-infra
      test-infra-ref: ${{ inputs.test-infra-ref || 'main' }}
      channel: ${{ inputs.channel || '' }}
      # Evaluates to the string 'true' only when the channel input is 'release'.
      use-only-dl-pytorch-org: ${{ inputs.channel == 'release' && 'true' || 'false' }}
      python-versions: '["3.10", "3.11", "3.12", "3.13", "3.14"]'
      # macOS only supports CPU builds.
      # Precedence: a non-empty `with-cpu` input wins; otherwise, on
      # workflow_dispatch, the `build-cpu` boolean maps to enable/disable;
      # every other case resolves to 'enable'.
      with-cpu: ${{ inputs.with-cpu || (github.event_name == 'workflow_dispatch' && (inputs.build-cpu && 'enable' || 'disable')) || 'enable' }}

  # Builds the wheels through the pytorch/test-infra macOS reusable workflow,
  # once per entry of the `include` list below (currently a single package).
  build:
    needs: generate-matrix
    strategy:
      # Keep the remaining matrix entries running when one of them fails.
      fail-fast: false
      matrix:
        include:
          - repository: pytorch/rl
            smoke-test-script: test/smoke_test.py
            package-name: torchrl
            pre-script: .github/scripts/pre-build-script.sh
    name: ${{ matrix.repository }}
    uses: pytorch/test-infra/.github/workflows/build_wheels_macos.yml@main
    with:
      repository: ${{ matrix.repository }}
      ref: ""
      test-infra-repository: pytorch/test-infra
      test-infra-ref: ${{ inputs.test-infra-ref || 'main' }}
      build-matrix: ${{ needs.generate-matrix.outputs.matrix }}
      # Forward the pre-build script declared in the matrix entry. It was
      # previously declared there but never passed on, so it could not run.
      # NOTE(review): confirm the script is meant to run on macOS runners.
      pre-script: ${{ matrix.pre-script }}
      package-name: ${{ matrix.package-name }}
      runner-type: macos-m2-15
      smoke-test-script: ${{ matrix.smoke-test-script }}
      trigger-event: ${{ github.event_name }}
      env-var-script: .github/scripts/td_script.sh