Skip to content

Commit 8b8f5cd

Browse files
authored
paper: unify and update abs layout (#1623)
Signed-off-by: xunzhuo <xunzhuo@vllm-semantic-router.ai>
1 parent efe400d commit 8b8f5cd

File tree

5 files changed

+263
-53
lines changed

5 files changed

+263
-53
lines changed

paper/Makefile

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,9 +12,10 @@ OUTNAME = white-paper
1212
TEX = pdflatex
1313
BIB = bibtex
1414
TEXFLAGS = -interaction=nonstopmode -halt-on-error -file-line-error -jobname=$(OUTNAME)
15+
LOGO = ../website/static/img/artworks/vllm-sr-logo.dark.pdf
1516

1617
SECTIONS = $(wildcard sections/*.tex)
17-
SOURCES = $(MAIN).tex $(SECTIONS) references.bib
18+
SOURCES = $(MAIN).tex $(SECTIONS) references.bib vllm.cls $(LOGO)
1819

1920
# Generated files to clean
2021
AUX_EXTS = aux bbl blg log out toc lof lot fls fdb_latexmk synctex.gz nav snm vrb run.xml bcf

paper/main.tex

Lines changed: 28 additions & 48 deletions
Original file line numberDiff line numberDiff line change
@@ -1,57 +1,50 @@
11
% vLLM Semantic Router: Signal Driven Decision Routing for Mixture-of-Modality Models
22
% Main document -- compile with: pdflatex main && bibtex main && pdflatex main && pdflatex main
33

4-
\documentclass{article}
4+
\documentclass{vllm}
55

6-
\usepackage{iclr2026_conference}
6+
% ---------- template / layout ----------
7+
\usepackage[margin=1.2in]{geometry}
8+
\graphicspath{{../website/static/img/}}
79

810
% ---------- packages ----------
9-
\usepackage[utf8]{inputenc}
10-
\usepackage[T1]{fontenc}
11-
\usepackage{graphicx}
12-
\usepackage{amsmath,amssymb,amsthm}
1311
\usepackage{amsfonts}
14-
\usepackage{booktabs}
15-
\usepackage{multirow}
16-
\usepackage{enumitem}
12+
\usepackage{amsmath,amssymb,amsthm}
13+
\usepackage{mathtools}
1714
\usepackage{algorithm}
1815
\usepackage{algorithmic}
16+
\usepackage[noabbrev,nameinlink]{cleveref}
17+
\usepackage{enumitem}
1918
\usepackage{float}
2019
\usepackage{listings}
21-
\usepackage{xcolor}
22-
\usepackage{hyperref}
23-
\usepackage{cleveref}
24-
\usepackage{subcaption}
2520
\usepackage{tabularx}
26-
\usepackage{url}
2721
\usepackage{tikz}
28-
\usetikzlibrary{shapes,shapes.geometric,arrows,positioning,fit,calc,backgrounds,decorations.pathreplacing}
22+
\usepackage{cite}
23+
\usetikzlibrary{shapes,shapes.geometric,arrows,arrows.meta,positioning,fit,calc,backgrounds,decorations.pathreplacing,matrix,shadows,patterns}
2924

3025
% ---------- theorem environments ----------
26+
\theoremstyle{definition}
3127
\newtheorem{definition}{Definition}
28+
\theoremstyle{plain}
3229
\newtheorem{theorem}{Theorem}
3330
\newtheorem{proposition}{Proposition}
3431

3532
% ---------- listing style ----------
3633
\lstset{
3734
basicstyle=\ttfamily\small,
38-
keywordstyle=\color{blue}\bfseries,
39-
commentstyle=\color{gray},
40-
stringstyle=\color{red!70!black},
35+
keywordstyle=\color{metablue}\bfseries,
36+
commentstyle=\color{black!55},
37+
stringstyle=\color{metafg},
4138
breaklines=true,
4239
frame=single,
4340
numbers=left,
44-
numberstyle=\tiny\color{gray},
41+
numberstyle=\tiny\color{black!45},
4542
captionpos=b,
4643
tabsize=2
4744
}
4845

49-
% ---------- hyperref setup ----------
46+
% ---------- hyperref metadata ----------
5047
\hypersetup{
51-
colorlinks=true,
52-
linkcolor=blue!70!black,
53-
citecolor=green!50!black,
54-
urlcolor=blue!60!black,
5548
pdfauthor={vLLM Semantic Router Team},
5649
pdftitle={vLLM Semantic Router: Signal Driven Decision Routing for Mixture-of-Modality Models}
5750
}
@@ -65,39 +58,28 @@
6558
\newcommand{\vsr}{\texttt{vllm-sr}}
6659

6760
\setlength{\emergencystretch}{2em}
68-
\iclrfinalcopy
6961

70-
\title{%
71-
\textbf{vLLM Semantic Router:}\\[-1pt]
72-
{\fontsize{11}{12.5}\selectfont\mbox{Signal Driven Decision Routing for Mixture-of-Modality Models}}%
73-
}
62+
\title{vLLM Semantic Router}
63+
\subtitle{Signal Driven Decision Routing for Mixture-of-Modality Models}
7464

7565
\author{%
76-
\parbox[t]{0.965\textwidth}{\centering\small\normalfont
77-
Xunzhuo Liu, Huamin Chen, Samzong Lu, Yossi Ovadia, Guohong Wen, Hao Wu, \\
78-
Zhengda Tan, Jintao Zhang, Senan Zedan, Yehudit Kerido, Liav Weiss,
79-
Haichen Zhang, Bishen Yu, Asaad Balum, Noa Limoy,
80-
Abdallah Samara, Baofa Fan, Sanjeev Rampal, Brent Salisbury, Ryan Cook, Zhijie Wang,
81-
Qiping Pan, Rehan Khan, Avishek Goswami, Houston H.\ Zhang, Shuyi Wang,
82-
Ziang Tang, Fang Han, Zohaib Hassan, Jianqiao Zheng, Avinash Changrani%
83-
}%
66+
Xunzhuo Liu, Huamin Chen, Samzong Lu, Yossi Ovadia, Guohong Wen, Hao Wu,\\
67+
Zhengda Tan, Jintao Zhang, Senan Zedan, Yehudit Kerido, Liav Weiss, Haichen Zhang,\\
68+
Bishen Yu, Asaad Balum, Noa Limoy, Abdallah Samara, Baofa Fan, Sanjeev Rampal,\\
69+
Brent Salisbury, Ryan Cook, Zhijie Wang, Qiping Pan, Rehan Khan, Avishek Goswami,\\
70+
Houston H.\ Zhang, Shuyi Wang, Ziang Tang, Fang Han, Zohaib Hassan, Jianqiao Zheng,\\
71+
Avinash Changrani%
8472
}
8573

86-
\date{February 2026}
74+
\date{March 2026}
75+
\abstract{\input{sections/abstract}}
8776

8877
% =====================================================================
8978
% DOCUMENT
9079
% =====================================================================
9180
\begin{document}
9281

9382
\maketitle
94-
\begingroup
95-
\renewcommand{\thefootnote}{}
96-
\footnotetext{Corresponding repository: \href{https://github.com/vllm-project/semantic-router}{GitHub repository}}
97-
\endgroup
98-
99-
% --- Abstract ---
100-
\input{sections/abstract}
10183

10284
% --- Introduction ---
10385
\input{sections/introduction}
@@ -147,16 +129,14 @@
147129
% --- Evaluation ---
148130
\input{sections/evaluation}
149131

150-
151-
152132
% --- Related Work ---
153133
\input{sections/related_work}
154134

155135
% --- Conclusion ---
156136
\input{sections/conclusion}
157137

158138
% --- Bibliography ---
159-
\bibliographystyle{iclr2026_conference}
139+
\bibliographystyle{unsrt}
160140
\bibliography{references}
161141

162142
\end{document}

paper/sections/abstract.tex

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,3 @@
1-
% sections/abstract.tex
2-
3-
\begin{abstract}
41
As large language models (LLMs) diversify across modalities, capabilities, and cost profiles, the problem of \emph{intelligent request routing}---selecting the right model for each query at inference time---has become a critical systems challenge.
52
We present \textbf{\sysname{}}, a signal-driven decision routing framework for Mixture-of-Modality (MoM) model deployments.
63

@@ -13,4 +10,3 @@
1310
Matched decisions drive \emph{semantic model routing} via thirteen selection algorithms, while per-decision plugin chains enforce safety constraints including a three-stage \emph{HaluGate} hallucination detection pipeline and a lightweight episodic memory system with \emph{ReflectionGate} for personalized multi-turn context.
1411
A typed neural-symbolic DSL specifies these routing policies and compiles them to multiple deployment targets, enabling configuration-first adaptation without code changes.
1512
Together, these components show that composable signal orchestration enables a single framework to serve diverse deployment scenarios with differentiated cost, privacy, and safety policies.
16-
\end{abstract}

0 commit comments

Comments
 (0)