From f72e5290fdd96934a4ef9dced1e114208be66bf8 Mon Sep 17 00:00:00 2001 From: "github-actions[bot]" <41898282+github-actions[bot]@users.noreply.github.com> Date: Sun, 21 Jun 2026 19:09:53 +0000 Subject: [PATCH] chore: release 0.8.12 Signed-off-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> --- .release-please-manifest.json | 2 +- CHANGELOG.md | 22 ++++++++++++++++++++++ Makefile | 2 +- charts/foreman/Chart.yaml | 4 ++-- charts/llmkube/Chart.yaml | 4 ++-- pkg/cli/version.go | 2 +- 6 files changed, 29 insertions(+), 7 deletions(-) diff --git a/.release-please-manifest.json b/.release-please-manifest.json index 9e805262..4e101ebb 100644 --- a/.release-please-manifest.json +++ b/.release-please-manifest.json @@ -1,3 +1,3 @@ { - ".": "0.8.11" + ".": "0.8.12" } diff --git a/CHANGELOG.md b/CHANGELOG.md index d811e941..32fdf2f5 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -5,6 +5,28 @@ All notable changes to LLMKube will be documented in this file. The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/), and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html). +## [0.8.12](https://github.com/defilantech/LLMKube/compare/v0.8.11...v0.8.12) (2026-06-21) + + +### Features + +* **cli:** download heartbeat for llmkube deploy --wait ([#719](https://github.com/defilantech/LLMKube/issues/719)) ([#780](https://github.com/defilantech/LLMKube/issues/780)) ([e6f9774](https://github.com/defilantech/LLMKube/commit/e6f9774816177a36136877dc0a31ffc63021179a)) +* **cli:** make cache list per-InferenceService cache aware ([#731](https://github.com/defilantech/LLMKube/issues/731)) ([#767](https://github.com/defilantech/LLMKube/issues/767)) ([d03c9ee](https://github.com/defilantech/LLMKube/commit/d03c9eed3727639a322d7143fe6ec993505fc66d)) +* **controller:** shield inference pods from disruption during startup ([#660](https://github.com/defilantech/LLMKube/issues/660)) ([#781](https://github.com/defilantech/LLMKube/issues/781)) ([370084a](https://github.com/defilantech/LLMKube/commit/370084a64282e848cc7238077272c354a8fa01ca)) +* **foreman:** codegen-drift check in the coder fast gate ([#775](https://github.com/defilantech/LLMKube/issues/775)) ([#778](https://github.com/defilantech/LLMKube/issues/778)) ([b04a28d](https://github.com/defilantech/LLMKube/commit/b04a28dcbd0660c4c21e36bedc17a83a0e62620b)) +* **metal-agent:** event-driven endpoint withdrawal/recovery on health transitions ([#662](https://github.com/defilantech/LLMKube/issues/662)) ([#771](https://github.com/defilantech/LLMKube/issues/771)) ([7848d18](https://github.com/defilantech/LLMKube/commit/7848d1803be8322855d2635954f2afbe4dbc3cef)) +* **metal-agent:** honor spec.runtime per-CR for multi-runtime dispatch ([#525](https://github.com/defilantech/LLMKube/issues/525)) ([#783](https://github.com/defilantech/LLMKube/issues/783)) ([aa210c3](https://github.com/defilantech/LLMKube/commit/aa210c346f8ae06742fb29f3ecc0f9d7e9247528)) +* **metrics:** TTFT histogram, request error counter, vLLM metrics flag ([#409](https://github.com/defilantech/LLMKube/issues/409)) ([#769](https://github.com/defilantech/LLMKube/issues/769)) ([563b0c9](https://github.com/defilantech/LLMKube/commit/563b0c9f96a176f471ca45d4aade64f0aa3022b6)) + + +### Bug Fixes + +* **controller:** make checkAcceleratorAvailability DRA-aware ([#754](https://github.com/defilantech/LLMKube/issues/754)) ([#776](https://github.com/defilantech/LLMKube/issues/776)) ([804063b](https://github.com/defilantech/LLMKube/commit/804063b8339b74a409fd7ee037390993b8de52a0)) +* **controller:** preserve agent-written schedulingStatus on reconcile ([#643](https://github.com/defilantech/LLMKube/issues/643)) ([#774](https://github.com/defilantech/LLMKube/issues/774)) ([4321028](https://github.com/defilantech/LLMKube/commit/4321028391b609cadcad5584d95df304150ec451)) +* **controller:** reconcileService updates existing Service on endpoint changes ([#720](https://github.com/defilantech/LLMKube/issues/720)) ([#773](https://github.com/defilantech/LLMKube/issues/773)) ([70222ae](https://github.com/defilantech/LLMKube/commit/70222aed216b38d042212f1553cac72024f8d48c)) +* **metal-agent:** clear SchedulingStatus on memory-check-pass ([#777](https://github.com/defilantech/LLMKube/issues/777)) ([#779](https://github.com/defilantech/LLMKube/issues/779)) ([ed1c4eb](https://github.com/defilantech/LLMKube/commit/ed1c4eb2dc4012d56440c8225cff950f0055d7f4)) +* **metal-agent:** prevent zero-byte stub files from failed model downloads ([#642](https://github.com/defilantech/LLMKube/issues/642)) ([#772](https://github.com/defilantech/LLMKube/issues/772)) ([d737e47](https://github.com/defilantech/LLMKube/commit/d737e47677798311754e56119e4ef570778e573e)) + ## [0.8.11](https://github.com/defilantech/LLMKube/compare/v0.8.10...v0.8.11) (2026-06-20) diff --git a/Makefile b/Makefile index 37a44e8e..4008be40 100644 --- a/Makefile +++ b/Makefile @@ -1,5 +1,5 @@ # Image URL to use all building/pushing image targets -IMG ?= ghcr.io/defilantech/llmkube-controller:0.8.11 # x-release-please-version +IMG ?= ghcr.io/defilantech/llmkube-controller:0.8.12 # x-release-please-version # Get the currently used golang install path (in GOPATH/bin, unless GOBIN is set) ifeq (,$(shell go env GOBIN)) diff --git a/charts/foreman/Chart.yaml b/charts/foreman/Chart.yaml index 746727c8..f034a80d 100644 --- a/charts/foreman/Chart.yaml +++ b/charts/foreman/Chart.yaml @@ -10,8 +10,8 @@ description: | coupling is that the foreman-operator's RBAC reads inference.llmkube.dev CRDs that llmkube installs. type: application -version: 0.8.11 -appVersion: 0.8.11 +version: 0.8.12 +appVersion: 0.8.12 keywords: - llmkube - foreman diff --git a/charts/llmkube/Chart.yaml b/charts/llmkube/Chart.yaml index 3a64b4db..9f916f6b 100644 --- a/charts/llmkube/Chart.yaml +++ b/charts/llmkube/Chart.yaml @@ -4,8 +4,8 @@ description: >- A Helm chart for LLMKube - Kubernetes operator for GPU-accelerated LLM inference type: application -version: 0.8.11 -appVersion: 0.8.11 +version: 0.8.12 +appVersion: 0.8.12 keywords: - llm - kubernetes diff --git a/pkg/cli/version.go b/pkg/cli/version.go index 91830afc..2766e7ad 100644 --- a/pkg/cli/version.go +++ b/pkg/cli/version.go @@ -24,7 +24,7 @@ import ( var ( // Version is set during build via ldflags or updated by release-please - Version = "0.8.11" // x-release-please-version + Version = "0.8.12" // x-release-please-version // GitCommit is set during build GitCommit = "unknown" // BuildDate is set during build