%PDF-1.7
%
1 0 obj
<< /Metadata 3 0 R /Names 4 0 R /OpenAction 5 0 R /Outlines 6 0 R /PageMode /UseOutlines /Pages 7 0 R /Type /Catalog >>
endobj
2 0 obj
<< /Author (Ali Vosoughi; Dimitra Emmanouilidou; Hannes Gamper) /Creator (arXiv GenPDF \(tex2pdf:4177c2c\)) /DOI (https://doi.org/10.48550/arXiv.2503.09205) /License (http://creativecommons.org/licenses/by/4.0/) /PTEX.Fullbanner (This is pdfTeX, Version 3.141592653-2.6-1.40.28 \(TeX Live 2025\) kpathsea version 6.4.1) /Producer (pikepdf 8.15.1) /Title (Quality Over Quantity? LLM-Based Curation for a Data-Efficient Audio-Video Foundation Model) /Trapped /False /arXivID (https://arxiv.org/abs/2503.09205v4) >>
endobj
3 0 obj
<< /Subtype /XML /Type /Metadata /Length 1748 >>
stream
Quality Over Quantity? LLM-Based Curation for a Data-Efficient Audio-Video Foundation ModelAli VosoughiDimitra EmmanouilidouHannes Gamperhttp://creativecommons.org/licenses/by/4.0/cs.MMcs.CLcs.IRcs.SDeess.AS
endstream
endobj
4 0 obj
<< /Dests 8 0 R >>
endobj
5 0 obj
<< /D [ 9 0 R /Fit ] /S /GoTo >>
endobj
6 0 obj
<< /Count 5 /First 10 0 R /Last 11 0 R /Type /Outlines >>
endobj
7 0 obj
<< /Count 5 /Kids [ 9 0 R 12 0 R 13 0 R 14 0 R 15 0 R ] /Type /Pages >>
endobj
8 0 obj
<< /Kids [ 16 0 R 17 0 R ] /Limits [ (Doc-Start) (table.caption.6) ] >>
endobj
9 0 obj
<< /Annots [ 18 0 R 19 0 R 20 0 R 21 0 R 22 0 R 23 0 R 24 0 R 25 0 R 26 0 R 27 0 R 28 0 R 29 0 R 30 0 R 31 0 R 32 0 R 33 0 R 34 0 R 35 0 R 36 0 R 37 0 R 38 0 R 39 0 R 40 0 R ] /Contents [ 41 0 R 42 0 R 43 0 R 44 0 R ] /Group 45 0 R /MediaBox [ 0 0 612 792 ] /Parent 7 0 R /Resources 46 0 R /Type /Page >>
endobj
10 0 obj
<< /A 47 0 R /Next 48 0 R /Parent 6 0 R /Title 49 0 R >>
endobj
11 0 obj
<< /A 50 0 R /Parent 6 0 R /Prev 51 0 R /Title 52 0 R >>
endobj
12 0 obj
<< /Annots [ 53 0 R 54 0 R 55 0 R 56 0 R 57 0 R 58 0 R 59 0 R 60 0 R 61 0 R 62 0 R 63 0 R 64 0 R 65 0 R 66 0 R 67 0 R 68 0 R 69 0 R 70 0 R 71 0 R 72 0 R 73 0 R 74 0 R 75 0 R 76 0 R 77 0 R 78 0 R ] /Contents 79 0 R /Group 45 0 R /MediaBox [ 0 0 612 792 ] /Parent 7 0 R /Resources 80 0 R /Type /Page >>
endobj
13 0 obj
<< /Annots [ 81 0 R 82 0 R 83 0 R 84 0 R 85 0 R 86 0 R 87 0 R 88 0 R 89 0 R 90 0 R 91 0 R ] /Contents 92 0 R /Group 45 0 R /MediaBox [ 0 0 612 792 ] /Parent 7 0 R /Resources 93 0 R /Type /Page >>
endobj
14 0 obj
<< /Annots [ 94 0 R 95 0 R 96 0 R ] /Contents 97 0 R /Group 45 0 R /MediaBox [ 0 0 612 792 ] /Parent 7 0 R /Resources 98 0 R /Type /Page >>
endobj
15 0 obj
<< /Annots [ 99 0 R 100 0 R 101 0 R 102 0 R 103 0 R 104 0 R 105 0 R 106 0 R ] /Contents 107 0 R /MediaBox [ 0 0 612 792 ] /Parent 7 0 R /Resources 108 0 R /Type /Page >>
endobj
16 0 obj
<< /Kids [ 109 0 R 110 0 R 111 0 R 112 0 R 113 0 R 114 0 R ] /Limits [ (Doc-Start) (cite.tangsalmonn2024iclr-salmon) ] >>
endobj
17 0 obj
<< /Kids [ 115 0 R 116 0 R 117 0 R 118 0 R 119 0 R 120 0 R ] /Limits [ (cite.tian2018ave) (table.caption.6) ] >>
endobj
18 0 obj
<< /A << /D (cite.radford2021learning) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 290.761 292.149 297.714 303.093 ] /Subtype /Link /Type /Annot >>
endobj
19 0 obj
<< /A << /D (cite.elizalde2023clap) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 98.218 280.194 105.202 291.138 ] /Subtype /Link /Type /Annot >>
endobj
20 0 obj
<< /A << /D (cite.li2023blip) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 239.256 280.194 246.24 291.138 ] /Subtype /Link /Type /Annot >>
endobj
21 0 obj
<< /A << /D (cite.chen2023dialogmcf) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 255.887 280.194 262.871 291.138 ] /Subtype /Link /Type /Annot >>
endobj
22 0 obj
<< /A << /D (cite.harwath2016unsupervised) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 67.934 208.415 80.089 219.359 ] /Subtype /Link /Type /Annot >>
endobj
23 0 obj
<< /A << /D (cite.harwath2018jointly) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 89.945 208.415 102.099 219.359 ] /Subtype /Link /Type /Annot >>
endobj
24 0 obj
<< /A << /D (cite.tang2024video) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 149.887 184.505 162.042 195.448 ] /Subtype /Link /Type /Annot >>
endobj
25 0 obj
<< /A << /D (cite.zhu2024languagebind) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 171.898 184.505 184.052 195.448 ] /Subtype /Link /Type /Annot >>
endobj
26 0 obj
<< /A << /D (cite.wu2022wav2clip) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 146.442 172.549 153.317 183.493 ] /Subtype /Link /Type /Annot >>
endobj
27 0 obj
<< /A << /D (cite.guzhov2022audioclip) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 211.83 172.549 218.705 183.493 ] /Subtype /Link /Type /Annot >>
endobj
28 0 obj
<< /A << /D (cite.girdhar2023imagebind) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 289.698 172.549 296.572 183.493 ] /Subtype /Link /Type /Annot >>
endobj
29 0 obj
<< /A << /D (cite.shi2022learning-avhubert) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 51.308 136.684 63.333 147.628 ] /Subtype /Link /Type /Annot >>
endobj
30 0 obj
<< /A << /D (cite.hamilton2024separating) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 131.158 136.684 143.183 147.628 ] /Subtype /Link /Type /Annot >>
endobj
31 0 obj
<< /A << /D (cite.liu2024llavanext) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 364.916 470.458 377.041 481.402 ] /Subtype /Link /Type /Annot >>
endobj
32 0 obj
<< /A << /D (cite.zhang2024llavanextvideo) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 387.804 470.458 399.928 481.402 ] /Subtype /Link /Type /Annot >>
endobj
33 0 obj
<< /A << /D (cite.gong2023joint-ltuas) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 533.414 470.458 545.539 481.402 ] /Subtype /Link /Type /Annot >>
endobj
34 0 obj
<< /A << /D (cite.mistral2023) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 439.639 458.503 451.684 469.447 ] /Subtype /Link /Type /Annot >>
endobj
35 0 obj
<< /A << /D (cite.radford2023whisper) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 430.736 363.623 442.89 374.591 ] /Subtype /Link /Type /Annot >>
endobj
36 0 obj
<< /A << /D (cite.oquab2023dinov2) /S /GoTo >> /Border [ 0 0 1 ] /C [ 0 1 0 ] /H /I /Rect [ 353.233 351.667 365.387 362.611 ] /Subtype /Link /Type /Annot >>
endobj
37 0 obj
<< /A << /D (section.2) /S /GoTo >> /Border [ 0 0 1 ] /C [ 1 0 0 ] /H /I /Rect [ 310.981 147.655 319.476 158.599 ] /Subtype /Link /Type /Annot >>
endobj
38 0 obj
<< /A << /D (section.3) /S /GoTo >> /Border [ 0 0 1 ] /C [ 1 0 0 ] /H /I /Rect [ 344.86 135.7 356.974 146.644 ] /Subtype /Link /Type /Annot >>
endobj
39 0 obj
<< /A << /D (section.4) /S /GoTo >> /Border [ 0 0 1 ] /C [ 1 0 0 ] /H /I /Rect [ 551.709 135.7 564.391 146.644 ] /Subtype /Link /Type /Annot >>
endobj
40 0 obj
<< /A << /S /URI /URI (https://arxiv.org/abs/2503.09205v4) >> /BS << /W 0 >> /NM (fitz-L0) /Rect [ 12 215.46002 32 576.54 ] /Subtype /Link >>
endobj
41 0 obj
<< /Length 10 /Filter /FlateDecode >>
stream
x+ |
endstream
endobj
42 0 obj
<< /Filter /FlateDecode /Length 4904 >>
stream
xڭZ[s۸~ϯRUe3x˙8Imy@KԐT2___@Q4[[*h@F4{E_D'?&g6KųYaCFa>|Qܤ뤇fؿKǪw+瑱n̢,,)̲҆Em%MPɷoZ{4#v _'iL<YI64=ğY ɪrIK`lT7(e2Ksvm%#Goz2ݵ45+\"TvSS7_+1Ƒ|#z1Bg6h4N>4SCQ/L`vqD-ڹT V)
ցǚPI6'N@(U&aۃLwόP(7kRZ*-+u@;/^>GKjǗvQAsҳoqojyrypJ`[MHVssYf :B\U2G0s-
5lH_7?33_`pW