From b7428a0e1f1062eab6e3658a331f45617d5da20a Mon Sep 17 00:00:00 2001 From: mgoin Date: Wed, 15 Oct 2025 18:12:10 -0400 Subject: [PATCH 1/6] Add thumbnail previews for each post Signed-off-by: mgoin --- _layouts/home.html | 42 ++++++++++++++++++ _posts/2025-01-14-struct-decode-intro.md | 1 + _posts/2025-01-21-stack-release.md | 4 +- _posts/2025-02-24-ptpc-fp8-rocm.md | 2 - _posts/2025-04-05-llama4.md | 2 - _posts/2025-04-11-transformers-backend.md | 2 - _posts/2025-04-23-openrlhf-vllm.md | 6 +-- _posts/2025-06-30-minimax-m1.md | 5 ++- _posts/2025-09-11-qwen3-next.md | 2 - _posts/2025-09-16-vllm-meetup.md | 3 +- _posts/2025-09-29-deepseek-v3-2.md | 4 +- _posts/2025-10-09-blackwell-inferencemax.md | 9 ++-- assets/css/style.scss | 48 +++++++++++++++++++++ 13 files changed, 105 insertions(+), 25 deletions(-) create mode 100644 _layouts/home.html create mode 100644 assets/css/style.scss diff --git a/_layouts/home.html b/_layouts/home.html new file mode 100644 index 0000000..d743475 --- /dev/null +++ b/_layouts/home.html @@ -0,0 +1,42 @@ +--- +layout: default +--- + +
+ {%- if page.title -%} +

{{ page.title }}

+ {%- endif -%} + + {{ content }} + + {% if site.paginate %} + {% assign posts = paginator.posts %} + {% else %} + {% assign posts = site.posts %} + {% endif %} + + {%- if posts.size > 0 -%} +
    + {%- assign date_format = site.minima.date_format | default: "%b %-d, %Y" -%} + {%- for post in posts -%} +
  • + {%- if post.image -%} +
    + + {{ post.title | escape }} + +
    + {%- endif -%} +
    + +

    + + {{ post.title | escape }} + +

    +
    +
  • + {%- endfor -%} +
+ {%- endif -%} +
diff --git a/_posts/2025-01-14-struct-decode-intro.md b/_posts/2025-01-14-struct-decode-intro.md index 6116b46..dabc4ee 100644 --- a/_posts/2025-01-14-struct-decode-intro.md +++ b/_posts/2025-01-14-struct-decode-intro.md @@ -2,6 +2,7 @@ layout: post title: "Structured Decoding in vLLM: a gentle introduction" author: "Guest Post by BentoML and Red Hat" +image: /assets/figures/struct-decode-intro/vllm-xgrammar-decode-time-per-output-token.png --- **TL/DR**: diff --git a/_posts/2025-01-21-stack-release.md b/_posts/2025-01-21-stack-release.md index 81c7248..93bd90e 100644 --- a/_posts/2025-01-21-stack-release.md +++ b/_posts/2025-01-21-stack-release.md @@ -1,8 +1,6 @@ --- layout: post -title: "High Performance and Easy Deployment of vLLM in K8S with “vLLM production-stack”" -thumbnail-img: /assets/figures/stack/stack-thumbnail.png -share-img: /assets/figures/stack/stack-thumbnail.png +title: "High Performance and Easy Deployment of vLLM in K8S with "vLLM production-stack"" author: LMCache Team image: /assets/figures/stack/stack-thumbnail.png --- diff --git a/_posts/2025-02-24-ptpc-fp8-rocm.md b/_posts/2025-02-24-ptpc-fp8-rocm.md index 5c76b7e..8ef998f 100644 --- a/_posts/2025-02-24-ptpc-fp8-rocm.md +++ b/_posts/2025-02-24-ptpc-fp8-rocm.md @@ -3,8 +3,6 @@ layout: post title: "PTPC-FP8: Boosting vLLM Performance on AMD ROCm" author: "AMD and Embedded LLM" image: /assets/figures/ptpc/PTPC-tumbnail.png -thumbnail-img: /assets/figures/ptpc/PTPC-tumbnail.png -share-img: /assets/figures/ptpc/PTPC-tumbnail.png math: true --- diff --git a/_posts/2025-04-05-llama4.md b/_posts/2025-04-05-llama4.md index 42aca6a..a8e6df2 100644 --- a/_posts/2025-04-05-llama4.md +++ b/_posts/2025-04-05-llama4.md @@ -3,8 +3,6 @@ layout: post title: "Llama 4 in vLLM" author: "The vLLM Team" image: /assets/figures/llama4/perf.png -thumbnail-img: /assets/figures/llama4/perf.png -share-img: /assets/figures/llama4/perf.png --- We're excited to announce that vLLM now supports the [Llama 4 herd of models](https://ai.meta.com/blog/llama-4-multimodal-intelligence/): **Scout** (17B-16E) and **Maverick** (17B-128E). You can run these powerful long-context, natively multi-modal (up to 8-10 images with good results), mixture-of-experts models in vLLM today by updating to version v0.8.3 or later: diff --git a/_posts/2025-04-11-transformers-backend.md b/_posts/2025-04-11-transformers-backend.md index 88691b9..68c4f90 100644 --- a/_posts/2025-04-11-transformers-backend.md +++ b/_posts/2025-04-11-transformers-backend.md @@ -3,8 +3,6 @@ layout: post title: "Transformers backend integration in vLLM" author: "The Hugging Face Team" image: /assets/figures/transformers-backend/transformers-backend.png -thumbnail-img: /assets/figures/transformers-backend/transformers-backend.png -share-img: /assets/figures/transformers-backend/transformers-backend.png --- The [Hugging Face Transformers library](https://huggingface.co/docs/transformers/main/en/index) diff --git a/_posts/2025-04-23-openrlhf-vllm.md b/_posts/2025-04-23-openrlhf-vllm.md index 6b6e39d..c5e77ea 100644 --- a/_posts/2025-04-23-openrlhf-vllm.md +++ b/_posts/2025-04-23-openrlhf-vllm.md @@ -1,10 +1,8 @@ --- layout: post title: "Accelerating RLHF with vLLM, Best Practice from OpenRLHF" -author: "The OpenRLHF Team" -image: /assets/figures/openrlhf-vllm/ray.png -thumbnail-img: /assets/figures/openrlhf-vllm/ray.png -share-img: /assets/figures/openrlhf-vllm/ray.png +author: "The OpenRLHF Team" +image: /assets/figures/openrlhf-vllm/ray.png --- As demand grows for training reasoning-capable large language models (LLMs), Reinforcement Learning from Human Feedback (RLHF) has emerged as a cornerstone technique. However, conventional RLHF pipelines—especially those using Proximal Policy Optimization (PPO)—are often hindered by substantial computational overhead. This challenge is particularly pronounced with models that excel at complex reasoning tasks (such as OpenAI-o1 and DeepSeek-R1), where generating long chain-of-thought (CoT) outputs can account for up to 90% of total training time. These models must produce detailed, step-by-step reasoning that can span thousands of tokens, making inference significantly more time-consuming than the training phase itself. As a pioneering inference framework, vLLM provides a user-friendly interface for generating RLHF samples and updating model weights. diff --git a/_posts/2025-06-30-minimax-m1.md b/_posts/2025-06-30-minimax-m1.md index d49c0ca..0e0404a 100644 --- a/_posts/2025-06-30-minimax-m1.md +++ b/_posts/2025-06-30-minimax-m1.md @@ -2,8 +2,9 @@ layout: post title: "MiniMax-M1 Hybrid Architecture Meets vLLM: Long Context, Fast Inference" author: "MiniMax" -benchmark-img: /assets/figures/minimax-m1/benchmark.png -moe-img: /assets/figures/minimax-m1/moe.png +image: /assets/figures/minimax-m1/benchmark.png +benchmark-img: /assets/figures/minimax-m1/benchmark.png +moe-img: /assets/figures/minimax-m1/moe.png lightning_attention-img: /assets/figures/minimax-m1/lightning_attention.png --- diff --git a/_posts/2025-09-11-qwen3-next.md b/_posts/2025-09-11-qwen3-next.md index 7b75274..cb1eeea 100644 --- a/_posts/2025-09-11-qwen3-next.md +++ b/_posts/2025-09-11-qwen3-next.md @@ -3,8 +3,6 @@ layout: post title: "vLLM Now Supports Qwen3-Next: Hybrid Architecture with Extreme Efficiency" author: "The vLLM Team" image: /assets/figures/qwen3-next/qwen.png -thumbnail-img: /assets/figures/qwen3-next/qwen.png -share-img: /assets/figures/qwen3-next/qwen.png --- We’re excited to announce that **vLLM now supports Qwen3-Next**, the latest generation of foundation models from the Qwen team. Qwen3-Next introduces a **hybrid architecture with extreme efficiency for long context support**, and vLLM offers full support of its functionalities. diff --git a/_posts/2025-09-16-vllm-meetup.md b/_posts/2025-09-16-vllm-meetup.md index 4f9cd42..e329c61 100644 --- a/_posts/2025-09-16-vllm-meetup.md +++ b/_posts/2025-09-16-vllm-meetup.md @@ -1,7 +1,8 @@ --- layout: post title: "The First vLLM Meetup in Korea" -author: "vLLM Team" +author: "vLLM Team" +image: /assets/figures/vllm-meetup/image-3.png ---

diff --git a/_posts/2025-09-29-deepseek-v3-2.md b/_posts/2025-09-29-deepseek-v3-2.md index c3983e2..cf43b75 100644 --- a/_posts/2025-09-29-deepseek-v3-2.md +++ b/_posts/2025-09-29-deepseek-v3-2.md @@ -1,10 +1,8 @@ --- layout: post title: "DeepSeek-V3.2-Exp in vLLM: Fine-Grained Sparse Attention in Action" -author: "vLLM Team" +author: "vLLM Team" image: /assets/figures/deepseek-v3-2/dsa-explained.png -thumbnail-img: /assets/figures/deepseek-v3-2/dsa-explained.png -share-img: /assets/figures/deepseek-v3-2/dsa-explained.png --- ### Introduction diff --git a/_posts/2025-10-09-blackwell-inferencemax.md b/_posts/2025-10-09-blackwell-inferencemax.md index 2c71c43..ba40ecf 100644 --- a/_posts/2025-10-09-blackwell-inferencemax.md +++ b/_posts/2025-10-09-blackwell-inferencemax.md @@ -1,7 +1,8 @@ ---- -layout: post -title: "SemiAnalysis InferenceMAX: vLLM and NVIDIA Accelerate Blackwell Inference" -author: "vLLM Team" +--- +layout: post +title: "SemiAnalysis InferenceMAX: vLLM and NVIDIA Accelerate Blackwell Inference" +author: "vLLM Team" +image: /assets/figures/blackwell-inferencemax/gpt-oss-120b-1k-1k.png --- ### Introduction diff --git a/assets/css/style.scss b/assets/css/style.scss new file mode 100644 index 0000000..7e305f0 --- /dev/null +++ b/assets/css/style.scss @@ -0,0 +1,48 @@ +--- +--- + +@import "{{ site.theme }}"; + +.post-list { + list-style: none; + margin-left: 0; +} + +.post-item { + display: flex; + gap: 1.5rem; + margin-bottom: 2rem; + padding-bottom: 2rem; + border-bottom: 1px solid #e8e8e8; +} + +.post-thumbnail { + flex-shrink: 0; + width: 200px; +} + +.post-thumbnail img { + width: 100%; + height: auto; + border-radius: 4px; + display: block; +} + +.post-content { + flex: 1; + min-width: 0; +} + +.post-content h3 { + margin-top: 0; +} + +@media (max-width: 600px) { + .post-item { + flex-direction: column; + } + + .post-thumbnail { + width: 100%; + } +} From a30898b716579fabda64f1f3dc856188bd1da503 Mon Sep 17 00:00:00 2001 From: mgoin Date: Wed, 15 Oct 2025 18:14:51 -0400 Subject: [PATCH 2/6] bad theme Signed-off-by: mgoin --- assets/css/style.scss | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/assets/css/style.scss b/assets/css/style.scss index 7e305f0..d33b22f 100644 --- a/assets/css/style.scss +++ b/assets/css/style.scss @@ -1,7 +1,7 @@ --- --- -@import "{{ site.theme }}"; +@import "minima"; .post-list { list-style: none; From cc910bc13c20f85520d5fde442f7590682eb398d Mon Sep 17 00:00:00 2001 From: mgoin Date: Wed, 15 Oct 2025 18:18:32 -0400 Subject: [PATCH 3/6] Fixes Signed-off-by: mgoin --- _layouts/home.html | 39 ++++++++++++++++++++++++ _posts/2025-01-21-stack-release.md | 2 +- assets/css/style.scss | 48 ------------------------------ 3 files changed, 40 insertions(+), 49 deletions(-) delete mode 100644 assets/css/style.scss diff --git a/_layouts/home.html b/_layouts/home.html index d743475..a4e8d7f 100644 --- a/_layouts/home.html +++ b/_layouts/home.html @@ -2,6 +2,45 @@ layout: default --- + +

{%- if page.title -%}

{{ page.title }}

diff --git a/_posts/2025-01-21-stack-release.md b/_posts/2025-01-21-stack-release.md index 93bd90e..3250bdc 100644 --- a/_posts/2025-01-21-stack-release.md +++ b/_posts/2025-01-21-stack-release.md @@ -1,6 +1,6 @@ --- layout: post -title: "High Performance and Easy Deployment of vLLM in K8S with "vLLM production-stack"" +title: "High Performance and Easy Deployment of vLLM in K8S with vLLM production-stack" author: LMCache Team image: /assets/figures/stack/stack-thumbnail.png --- diff --git a/assets/css/style.scss b/assets/css/style.scss deleted file mode 100644 index d33b22f..0000000 --- a/assets/css/style.scss +++ /dev/null @@ -1,48 +0,0 @@ ---- ---- - -@import "minima"; - -.post-list { - list-style: none; - margin-left: 0; -} - -.post-item { - display: flex; - gap: 1.5rem; - margin-bottom: 2rem; - padding-bottom: 2rem; - border-bottom: 1px solid #e8e8e8; -} - -.post-thumbnail { - flex-shrink: 0; - width: 200px; -} - -.post-thumbnail img { - width: 100%; - height: auto; - border-radius: 4px; - display: block; -} - -.post-content { - flex: 1; - min-width: 0; -} - -.post-content h3 { - margin-top: 0; -} - -@media (max-width: 600px) { - .post-item { - flex-direction: column; - } - - .post-thumbnail { - width: 100%; - } -} From aeceb696712cbfcd8475829b504122520ec8cd34 Mon Sep 17 00:00:00 2001 From: mgoin Date: Wed, 15 Oct 2025 18:28:03 -0400 Subject: [PATCH 4/6] Update theme Signed-off-by: mgoin --- _layouts/home.html | 84 +++++++++++++++++-------------------------- _sass/custom.scss | 10 ++++++ assets/css/style.scss | 7 ++++ 3 files changed, 49 insertions(+), 52 deletions(-) create mode 100644 _sass/custom.scss create mode 100644 assets/css/style.scss diff --git a/_layouts/home.html b/_layouts/home.html index a4e8d7f..2b543d8 100644 --- a/_layouts/home.html +++ b/_layouts/home.html @@ -2,45 +2,6 @@ layout: default --- - -
{%- if page.title -%}

{{ page.title }}

@@ -55,27 +16,46 @@

{{ page.title }}

{% endif %} {%- if posts.size > 0 -%} + {%- if page.list_title -%} +

{{ page.list_title }}

+ {%- endif -%} + + {% if site.paginate %} +
+ +
+ {%- endif %} {%- endif -%} +
diff --git a/_sass/custom.scss b/_sass/custom.scss new file mode 100644 index 0000000..6b80ebd --- /dev/null +++ b/_sass/custom.scss @@ -0,0 +1,10 @@ +// Minimal thumbnail styling +.post-thumbnail { + float: left; + width: 80px; + height: 80px; + margin-right: 1rem; + margin-bottom: 0.5rem; + border-radius: 4px; + object-fit: cover; +} diff --git a/assets/css/style.scss b/assets/css/style.scss new file mode 100644 index 0000000..ec5e215 --- /dev/null +++ b/assets/css/style.scss @@ -0,0 +1,7 @@ +--- +--- + +@import + "minima/skins/{{ site.minima.skin | default: 'auto' }}", + "minima/initialize", + "custom"; From 13d8a588bb7bfc3e241ef34d7d47749696f0b2be Mon Sep 17 00:00:00 2001 From: mgoin Date: Wed, 15 Oct 2025 18:32:11 -0400 Subject: [PATCH 5/6] Try again Signed-off-by: mgoin --- _sass/custom.scss | 10 ---------- _sass/minima/custom-styles.scss | 11 +++++++++++ assets/css/style.scss | 7 ------- 3 files changed, 11 insertions(+), 17 deletions(-) delete mode 100644 _sass/custom.scss delete mode 100644 assets/css/style.scss diff --git a/_sass/custom.scss b/_sass/custom.scss deleted file mode 100644 index 6b80ebd..0000000 --- a/_sass/custom.scss +++ /dev/null @@ -1,10 +0,0 @@ -// Minimal thumbnail styling -.post-thumbnail { - float: left; - width: 80px; - height: 80px; - margin-right: 1rem; - margin-bottom: 0.5rem; - border-radius: 4px; - object-fit: cover; -} diff --git a/_sass/minima/custom-styles.scss b/_sass/minima/custom-styles.scss index 14a2eb7..d6b2d73 100644 --- a/_sass/minima/custom-styles.scss +++ b/_sass/minima/custom-styles.scss @@ -1,3 +1,14 @@ img { background-color: $lm-background-color; +} + +// Minimal thumbnail styling for blog post list +.post-list .post-thumbnail { + float: left; + width: 80px; + height: 80px; + margin-right: 1rem; + margin-bottom: 0.5rem; + border-radius: 4px; + object-fit: cover; } \ No newline at end of file diff --git a/assets/css/style.scss b/assets/css/style.scss deleted file mode 100644 index ec5e215..0000000 --- a/assets/css/style.scss +++ /dev/null @@ -1,7 +0,0 @@ ---- ---- - -@import - "minima/skins/{{ site.minima.skin | default: 'auto' }}", - "minima/initialize", - "custom"; From 0aafc57f89bf2f6c3c47bcaa62d772eee3ce2fac Mon Sep 17 00:00:00 2001 From: mgoin Date: Wed, 15 Oct 2025 18:36:47 -0400 Subject: [PATCH 6/6] Just use image Signed-off-by: mgoin --- _layouts/home.html | 61 --------------------------------- _sass/minima/custom-styles.scss | 11 ------ 2 files changed, 72 deletions(-) delete mode 100644 _layouts/home.html diff --git a/_layouts/home.html b/_layouts/home.html deleted file mode 100644 index 2b543d8..0000000 --- a/_layouts/home.html +++ /dev/null @@ -1,61 +0,0 @@ ---- -layout: default ---- - -
- {%- if page.title -%} -

{{ page.title }}

- {%- endif -%} - - {{ content }} - - {% if site.paginate %} - {% assign posts = paginator.posts %} - {% else %} - {% assign posts = site.posts %} - {% endif %} - - {%- if posts.size > 0 -%} - {%- if page.list_title -%} -

{{ page.list_title }}

- {%- endif -%} -
    - {%- assign date_format = site.minima.date_format | default: "%b %-d, %Y" -%} - {%- for post in posts -%} -
  • - {%- if post.image -%} - - {%- endif -%} - -

    - - {{ post.title | escape }} - -

    - {%- if site.show_excerpts -%} - {{ post.excerpt }} - {%- endif -%} -
  • - {%- endfor -%} -
- - {% if site.paginate %} -
- -
- {%- endif %} - {%- endif -%} - -
diff --git a/_sass/minima/custom-styles.scss b/_sass/minima/custom-styles.scss index d6b2d73..14a2eb7 100644 --- a/_sass/minima/custom-styles.scss +++ b/_sass/minima/custom-styles.scss @@ -1,14 +1,3 @@ img { background-color: $lm-background-color; -} - -// Minimal thumbnail styling for blog post list -.post-list .post-thumbnail { - float: left; - width: 80px; - height: 80px; - margin-right: 1rem; - margin-bottom: 0.5rem; - border-radius: 4px; - object-fit: cover; } \ No newline at end of file