From 47cfc61800b4441a4bb15fed980b71ccd1a7d6de Mon Sep 17 00:00:00 2001 From: Sebastian Raschka Date: Sun, 18 Jan 2026 11:42:03 -0600 Subject: [PATCH 1/2] link GRPO notebook (#950) --- README.md | 7 +++++++ reasoning-from-scratch | 2 +- 2 files changed, 8 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index e6b1a26..2d7bae6 100644 --- a/README.md +++ b/README.md @@ -212,6 +212,13 @@ More bonus material from the [Reasoning From Scratch](https://github.com/rasbt/r - [Multiple-Choice Evaluation (MMLU)](https://github.com/rasbt/reasoning-from-scratch/blob/main/chF/02_mmlu) - [LLM Leaderboard Evaluation](https://github.com/rasbt/reasoning-from-scratch/blob/main/chF/03_leaderboards) - [LLM-as-a-Judge Evaluation](https://github.com/rasbt/reasoning-from-scratch/blob/main/chF/04_llm-judge) +- **Inference Scaling** + - [Self-Consistency](https://github.com/rasbt/reasoning-from-scratch/blob/main/ch04/01_main-chapter-code/ch04_main.ipynb) + - [Self-Refinement](https://github.com/rasbt/reasoning-from-scratch/blob/main/ch05/01_main-chapter-code/ch05_main.ipynb) + +- **Reinforcement Learning** (RL) + - [RLVR with GRPO From Scratch](https://github.com/rasbt/reasoning-from-scratch/blob/main/ch06/01_main-chapter-code/ch06_main.ipynb) +
  diff --git a/reasoning-from-scratch b/reasoning-from-scratch index a8cfd55..edcae1d 160000 --- a/reasoning-from-scratch +++ b/reasoning-from-scratch @@ -1 +1 @@ -Subproject commit a8cfd55fca9ff37177d675442de77601c3281728 +Subproject commit edcae1d894192a2d7c036bfea43922cb140dea10 From 59d9262047a4ec444161d113a0f24e7e90c79ca8 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?P=C3=A1draic=20Slattery?= Date: Mon, 19 Jan 2026 19:22:29 +0100 Subject: [PATCH 2/2] chore: Update outdated GitHub Actions versions (#951) --- .github/workflows/basic-tests-latest-python.yml | 4 ++-- .github/workflows/basic-tests-linux-uv.yml | 4 ++-- .github/workflows/basic-tests-macos-uv.yml | 4 ++-- .github/workflows/basic-tests-old-pytorch.yml | 4 ++-- .github/workflows/basic-tests-pip.yml | 4 ++-- .github/workflows/basic-tests-pixi.yml | 2 +- .github/workflows/basic-tests-pytorch-rc.yml | 4 ++-- .github/workflows/basic-tests-windows-uv-pip.yml | 4 ++-- .github/workflows/check-links.yml | 4 ++-- .github/workflows/check-spelling-errors.yml | 4 ++-- .github/workflows/pep8-linter.yml | 4 ++-- 11 files changed, 21 insertions(+), 21 deletions(-) diff --git a/.github/workflows/basic-tests-latest-python.yml b/.github/workflows/basic-tests-latest-python.yml index 3359fed..a01654f 100644 --- a/.github/workflows/basic-tests-latest-python.yml +++ b/.github/workflows/basic-tests-latest-python.yml @@ -22,10 +22,10 @@ jobs: runs-on: ubuntu-latest steps: - - uses: actions/checkout@v4 + - uses: actions/checkout@v6 - name: Set up Python - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.13" diff --git a/.github/workflows/basic-tests-linux-uv.yml b/.github/workflows/basic-tests-linux-uv.yml index 1ef96b2..67d886b 100644 --- a/.github/workflows/basic-tests-linux-uv.yml +++ b/.github/workflows/basic-tests-linux-uv.yml @@ -28,10 +28,10 @@ jobs: name: Code tests (Linux) runs-on: ubuntu-latest steps: - - uses: actions/checkout@v4 + - uses: actions/checkout@v6 - name: Set up Python (uv) - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.13" diff --git a/.github/workflows/basic-tests-macos-uv.yml b/.github/workflows/basic-tests-macos-uv.yml index ec3dbd2..3cac9f0 100644 --- a/.github/workflows/basic-tests-macos-uv.yml +++ b/.github/workflows/basic-tests-macos-uv.yml @@ -28,10 +28,10 @@ jobs: name: Code tests (macOS) runs-on: macos-latest steps: - - uses: actions/checkout@v4 + - uses: actions/checkout@v6 - name: Set up Python (uv) - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.13" diff --git a/.github/workflows/basic-tests-old-pytorch.yml b/.github/workflows/basic-tests-old-pytorch.yml index b486196..fec3884 100644 --- a/.github/workflows/basic-tests-old-pytorch.yml +++ b/.github/workflows/basic-tests-old-pytorch.yml @@ -26,10 +26,10 @@ jobs: pytorch-version: [ 2.3.0, 2.5.0 ] steps: - - uses: actions/checkout@v4 + - uses: actions/checkout@v6 - name: Set up Python - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.13" diff --git a/.github/workflows/basic-tests-pip.yml b/.github/workflows/basic-tests-pip.yml index 5351ff8..1575683 100644 --- a/.github/workflows/basic-tests-pip.yml +++ b/.github/workflows/basic-tests-pip.yml @@ -28,10 +28,10 @@ jobs: name: Pip Tests (Ubuntu Only) runs-on: ubuntu-latest steps: - - uses: actions/checkout@v4 + - uses: actions/checkout@v6 - name: Set up Python - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.10" # tests for backwards compatibility diff --git a/.github/workflows/basic-tests-pixi.yml b/.github/workflows/basic-tests-pixi.yml index 2195a21..fc7fbe1 100644 --- a/.github/workflows/basic-tests-pixi.yml +++ b/.github/workflows/basic-tests-pixi.yml @@ -31,7 +31,7 @@ jobs: os: [ubuntu-latest, windows-latest] steps: - - uses: actions/checkout@v4 + - uses: actions/checkout@v6 - name: Set up pixi (without caching) uses: prefix-dev/setup-pixi@v0.8.2 diff --git a/.github/workflows/basic-tests-pytorch-rc.yml b/.github/workflows/basic-tests-pytorch-rc.yml index e2cbe43..c58996f 100644 --- a/.github/workflows/basic-tests-pytorch-rc.yml +++ b/.github/workflows/basic-tests-pytorch-rc.yml @@ -22,10 +22,10 @@ jobs: runs-on: ubuntu-latest steps: - - uses: actions/checkout@v4 + - uses: actions/checkout@v6 - name: Set up Python - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.13" diff --git a/.github/workflows/basic-tests-windows-uv-pip.yml b/.github/workflows/basic-tests-windows-uv-pip.yml index ff9eee5..41f333d 100644 --- a/.github/workflows/basic-tests-windows-uv-pip.yml +++ b/.github/workflows/basic-tests-windows-uv-pip.yml @@ -24,10 +24,10 @@ jobs: steps: - name: Checkout Code - uses: actions/checkout@v4 + uses: actions/checkout@v6 - name: Set up Python - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: '3.11' diff --git a/.github/workflows/check-links.yml b/.github/workflows/check-links.yml index a16c69f..c754471 100644 --- a/.github/workflows/check-links.yml +++ b/.github/workflows/check-links.yml @@ -13,10 +13,10 @@ jobs: runs-on: ubuntu-latest steps: - - uses: actions/checkout@v4 + - uses: actions/checkout@v6 - name: Set up Python - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.10" diff --git a/.github/workflows/check-spelling-errors.yml b/.github/workflows/check-spelling-errors.yml index 0fe1949..5e6c2fd 100644 --- a/.github/workflows/check-spelling-errors.yml +++ b/.github/workflows/check-spelling-errors.yml @@ -13,10 +13,10 @@ jobs: runs-on: ubuntu-latest steps: - - uses: actions/checkout@v4 + - uses: actions/checkout@v6 - name: Set up Python - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.10" diff --git a/.github/workflows/pep8-linter.yml b/.github/workflows/pep8-linter.yml index 8755fd7..8596569 100644 --- a/.github/workflows/pep8-linter.yml +++ b/.github/workflows/pep8-linter.yml @@ -10,9 +10,9 @@ jobs: flake8: runs-on: ubuntu-latest steps: - - uses: actions/checkout@v4 + - uses: actions/checkout@v6 - name: Set up Python - uses: actions/setup-python@v5 + uses: actions/setup-python@v6 with: python-version: "3.13" - name: Install ruff (a faster flake 8 equivalent)