%PDF-1.7
%
1 0 obj
<< /Metadata 3 0 R /Names 4 0 R /OpenAction 5 0 R /Outlines 6 0 R /PageMode /UseOutlines /Pages 7 0 R /Type /Catalog >>
endobj
2 0 obj
<< /Author (Raja Gond; Aditya K Kamath; Ramachandran Ramjee; Ashish Panwar) /Creator (arXiv GenPDF \(tex2pdf:57610bf\)) /DOI (https://doi.org/10.48550/arXiv.2601.17768) /License (http://creativecommons.org/licenses/by/4.0/) /PTEX.Fullbanner (This is pdfTeX, Version 3.141592653-2.6-1.40.28 \(TeX Live 2025\) kpathsea version 6.4.1) /Producer (pikepdf 8.15.1) /Title (LLM-42: Enabling Determinism in LLM Inference with Verified Speculation) /Trapped /False /arXivID (https://arxiv.org/abs/2601.17768v2) >>
endobj
3 0 obj
<< /Subtype /XML /Type /Metadata /Length 1709 >>
stream
LLM-42: Enabling Determinism in LLM Inference with Verified SpeculationRaja GondAditya K KamathRamachandran RamjeeAshish Panwarhttp://creativecommons.org/licenses/by/4.0/cs.LGcs.AIcs.DC
endstream
endobj
4 0 obj
<< /Dests 8 0 R >>
endobj
5 0 obj
<< /D [ 9 0 R /Fit ] /S /GoTo >>
endobj
6 0 obj
<< /Count 7 /First 10 0 R /Last 11 0 R /Type /Outlines >>
endobj
7 0 obj
<< /Count 15 /Kids [ 12 0 R 13 0 R 14 0 R ] /Type /Pages >>
endobj
8 0 obj
<< /Kids [ 15 0 R 16 0 R 17 0 R 18 0 R ] /Limits [ (Doc-Start) (table.caption.9) ] >>
endobj
9 0 obj
<< /Annots [ 19 0 R 20 0 R 21 0 R 22 0 R 23 0 R 24 0 R 25 0 R 26 0 R 27 0 R 28 0 R 29 0 R 30 0 R 31 0 R 32 0 R 33 0 R 34 0 R 35 0 R 36 0 R 37 0 R ] /Contents [ 38 0 R 39 0 R 40 0 R 41 0 R ] /MediaBox [ 0 0 612 792 ] /Parent 12 0 R /Resources 42 0 R /Type /Page >>
endobj
10 0 obj
<< /A 43 0 R /Next 44 0 R /Parent 6 0 R /Title 45 0 R >>
endobj
11 0 obj
<< /A 46 0 R /Parent 6 0 R /Prev 47 0 R /Title 48 0 R >>
endobj
12 0 obj
<< /Count 6 /Kids [ 9 0 R 49 0 R 50 0 R 51 0 R 52 0 R 53 0 R ] /Parent 7 0 R /Type /Pages >>
endobj
13 0 obj
<< /Count 6 /Kids [ 54 0 R 55 0 R 56 0 R 57 0 R 58 0 R 59 0 R ] /Parent 7 0 R /Type /Pages >>
endobj
14 0 obj
<< /Count 3 /Kids [ 60 0 R 61 0 R 62 0 R ] /Parent 7 0 R /Type /Pages >>
endobj
15 0 obj
<< /Kids [ 63 0 R 64 0 R 65 0 R 66 0 R 67 0 R 68 0 R ] /Limits [ (Doc-Start) (cite.patel2023splitwise) ] >>
endobj
16 0 obj
<< /Kids [ 69 0 R 70 0 R 71 0 R 72 0 R 73 0 R 74 0 R ] /Limits [ (cite.pod-attn) (page.15) ] >>
endobj
17 0 obj
<< /Kids [ 75 0 R 76 0 R 77 0 R 78 0 R 79 0 R 80 0 R ] /Limits [ (page.2) (table.caption.2) ] >>
endobj
18 0 obj
<< /Kids [ 81 0 R ] /Limits [ (table.caption.21) (table.caption.9) ] >>
endobj
19 0 obj
<< /A << /D (Hfootnote.1) /S /GoTo >> /Border [ 0 0 0 ] /C [ 1 0 0 ] /H /I /Rect [ 91.05 353.547 97.227 366.311 ] /Subtype /Link /Type /Annot >>
endobj
20 0 obj
<< /A << /D (cite.kaplan2020scalinglaws) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 263.913 155.249 276.067 166.153 ] /Subtype /Link /Type /Annot >>
endobj
21 0 obj
<< /A << /D (cite.openai2022gpt4techreport) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 278.781 155.249 290.935 166.153 ] /Subtype /Link /Type /Annot >>
endobj
22 0 obj
<< /A << /D (cite.atil2024nondeterminism) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 157.96 131.897 164.993 142.243 ] /Subtype /Link /Type /Annot >>
endobj
23 0 obj
<< /A << /D (cite.he2025nondeterminism) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 166.824 131.897 178.899 142.243 ] /Subtype /Link /Type /Annot >>
endobj
24 0 obj
<< /A << /D (cite.song2024greedy) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 180.73 131.897 192.804 142.243 ] /Subtype /Link /Type /Annot >>
endobj
25 0 obj
<< /A << /D (cite.yuan2025fp32death) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 194.635 131.897 206.71 142.243 ] /Subtype /Link /Type /Annot >>
endobj
26 0 obj
<< /A << /D (cite.zhang2025-deterministic-tp) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 353.216 467.108 365.032 478.012 ] /Subtype /Link /Type /Annot >>
endobj
27 0 obj
<< /A << /D (cite.song2024greedy) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 362.958 443.198 375.112 454.102 ] /Subtype /Link /Type /Annot >>
endobj
28 0 obj
<< /A << /D (cite.rainbird2025deterministic) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 485.425 443.198 492.499 454.102 ] /Subtype /Link /Type /Annot >>
endobj
29 0 obj
<< /A << /D (cite.Anadkat2025consistent) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 458.262 419.288 465.236 430.192 ] /Subtype /Link /Type /Annot >>
endobj
30 0 obj
<< /A << /D (cite.Charlie2025) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 467.029 419.288 478.985 430.192 ] /Subtype /Link /Type /Annot >>
endobj
31 0 obj
<< /A << /D (cite.he2025nondeterminism) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 366.183 407.041 378.158 417.387 ] /Subtype /Link /Type /Annot >>
endobj
32 0 obj
<< /A << /D (Hfootnote.2) /S /GoTo >> /Border [ 0 0 0 ] /C [ 1 0 0 ] /H /I /Rect [ 416.177 382.572 422.353 395.336 ] /Subtype /Link /Type /Annot >>
endobj
33 0 obj
<< /A << /D (cite.SGLangTeam2025) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 465.655 263.021 477.61 273.925 ] /Subtype /Link /Type /Annot >>
endobj
34 0 obj
<< /A << /D (cite.vllm-batch-invariant-2025) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 479.403 263.021 491.358 273.925 ] /Subtype /Link /Type /Annot >>
endobj
35 0 obj
<< /A << /D (cite.tritonfusedkernel-splitk-meta) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 529.535 166.53 541.381 177.433 ] /Subtype /Link /Type /Annot >>
endobj
36 0 obj
<< /A << /D (cite.nvidia_cutlass_blog) /S /GoTo >> /Border [ 0 0 0 ] /C [ 0 1 0 ] /H /I /Rect [ 543.15 166.53 554.995 177.433 ] /Subtype /Link /Type /Annot >>
endobj
37 0 obj
<< /A << /S /URI /URI (https://arxiv.org/abs/2601.17768v2) >> /BS << /W 0 >> /NM (fitz-L0) /Rect [ 12 223.79999 32 568.2 ] /Subtype /Link >>
endobj
38 0 obj
<< /Length 10 /Filter /FlateDecode >>
stream
x+ |
endstream
endobj
39 0 obj
<< /Filter /FlateDecode /Length 4675 >>
stream
xڥ[IwFWmXh䂭}ز7[}u @Z(( Hh6o^E_wʳ$y&ujny|#ݺ7[Q}SUo]ew?rC?凟QYP6OQQ]{rύXC67ϟ~Б(qYefk0)o~6yXIbiTB8/daatpvtNC*z`\{ |v;Od\Qf2`Æ))lKglW:l=ґļqw86Ǻ-QQ0Q cQ{ddɥtƱ+ IS͙fA/g7d=h3tȻv~Z*!1qY B.?J~hTDe
ak(4J<7OB̶wS@BeA; m؆5LoN3Bb6m͔kʁLZ6L/#<(wtŻ::rtח':)F<_b`[EZ#LU!ctOY,JVYٕBO0qYj1!b4*%3}@)ҷ1&6pmr"Xx"oYTXB>zN#9{zũ.q{Nڊ&nvŃ8XarXv.
_3XָY[F^Ǿc|t۞$:GKu[S)n)`݊OUC'^Q[/>`cImI]0nSޱN.cWIDW3\ !{tgp3Tp{mIH)=俏P5}B CƝFb"kJ@:N]=^A;rms@c)eP4ۅi 1m=& $:/Ϝ{x1bSVR:iUlN{LlH{^)8AyQ n7v]pa?^<v^߃DdHv[1|
xFU)Iͨ"J
.zY|9Tևqps$.Kaaolvu &xwrOeXs{v!"yp 3@$/
݁.}WIh[ڏ˸#njށk@`꺄cL-ɟ|{1mNH8n~cCeM1@Yu,f/5F*Lr1hf}և?ON8oW#lTZx|'+ٕ!-92Y4qp?UhGׇjUT>,i*/$ vvEͯ[?܁)] CbGf
!hG;鋁<^Gܑ7?Niو