|
1 | 1 | [
|
2 |
| - { |
3 |
| - "title": "EcoAssistant: Using LLM Assistant More Affordably and Accurately", |
4 |
| - "authors": [ |
5 |
| - "Jieyu Zhang", |
6 |
| - "Ranjay Krishna", |
7 |
| - "Ahmed H. Awadallah", |
8 |
| - "Chi Wang" |
9 |
| - ], |
10 |
| - "year": "preprint", |
11 |
| - "venue": null, |
12 |
| - "links": { |
13 |
| - "pdf": "https://arxiv.org/abs/2310.03046", |
14 |
| - "code": "https://github.com/JieyuZ2/EcoAssistant" |
15 |
| - }, |
16 |
| - "thumbnail": "/ecoassistant.png" |
17 |
| - }, |
18 |
| - { |
19 |
| - "title": "Tool Documentation Enables Zero-Shot Tool-Usage with Large Language Models", |
20 |
| - "authors": [ |
21 |
| - "Cheng-Yu Hsieh", |
22 |
| - "Si-An Chen", |
23 |
| - "Chun-Liang Li", |
24 |
| - "Yasuhisa Fujii", |
25 |
| - "Alexander Ratner", |
26 |
| - "Chen-Yu Lee", |
27 |
| - "Ranjay Krishna", |
28 |
| - "Tomas Pfister" |
29 |
| - ], |
30 |
| - "year": "preprint", |
31 |
| - "venue": null, |
32 |
| - "links": { |
33 |
| - "pdf": "https://arxiv.org/abs/2308.00675" |
34 |
| - } |
35 |
| - }, |
36 |
| - { |
37 |
| - "title": "MIMIC: Masked Image Modeling with Image Correspondences", |
38 |
| - "authors": [ |
39 |
| - "Kalyani Marathe", |
40 |
| - "Mahtab Bigverdi", |
41 |
| - "Nishat Khan", |
42 |
| - "Tuhin Kundu", |
43 |
| - "Aniruddha Kembhavi", |
44 |
| - "Linda G. Shapiro", |
45 |
| - "Ranjay Krishna" |
46 |
| - ], |
47 |
| - "year": "preprint", |
48 |
| - "venue": null, |
49 |
| - "links": { |
50 |
| - "pdf": "https://arxiv.org/pdf/2306.15128.pdf", |
51 |
| - "code": "https://github.com/RAIVNLab/MIMIC" |
52 |
| - } |
53 |
| - }, |
54 |
| - { |
55 |
| - "title": "Cultural and Linguistic Diversity Improves Visual Representations", |
56 |
| - "authors": [ |
57 |
| - "Andre Ye", |
58 |
| - "Sebastin Santy", |
59 |
| - "Jena D. Hwang", |
60 |
| - "Amy X. Zhang", |
61 |
| - "Ranjay Krishna" |
62 |
| - ], |
63 |
| - "year": "preprint", |
64 |
| - "venue": null, |
65 |
| - "links": { |
66 |
| - "pdf": "https://arxiv.org/pdf/2310.14356.pdf" |
67 |
| - } |
68 |
| - }, |
69 |
| - { |
70 |
| - "title": "Improving Multimodal Datasets with Image Captioning", |
71 |
| - "authors": [ |
72 |
| - "Thao Nguyen", |
73 |
| - "Samir Yitzhak Gadre", |
74 |
| - "Gabriel Ilharco", |
75 |
| - "Sewoong Oh", |
76 |
| - "Ludwig Schmidt" |
77 |
| - ], |
78 |
| - "year": "2023", |
79 |
| - "venue": "NeurIPS 2023", |
80 |
| - "links": { |
81 |
| - "pdf": "https://arxiv.org/abs/2307.10350" |
82 |
| - } |
83 |
| - }, |
84 |
| - { |
85 |
| - "title": "AdANNS: A Framework for Adaptive Semantic Search", |
86 |
| - "authors": [ |
87 |
| - "Aniket Rege", |
88 |
| - "Aditya Kusupati", |
89 |
| - "Sharan Ranjit S", |
90 |
| - "Alan Fan", |
91 |
| - "Qingqing Cao", |
92 |
| - "Sham Kakade", |
93 |
| - "Prateek Jain", |
94 |
| - "Ali Farhadi" |
95 |
| - ], |
96 |
| - "year": "2023", |
97 |
| - "venue": "NeurIPS 2023", |
98 |
| - "links": { |
99 |
| - "pdf": "https://arxiv.org/abs/2305.19435", |
100 |
| - "code": "https://github.com/RAIVNLab/AdANNS" |
101 |
| - } |
102 |
| - }, |
103 |
| - { |
104 |
| - "title": "Stable and low-precision training for large-scale vision-language models", |
105 |
| - "authors": [ |
106 |
| - "Mitchell Wortsman", |
107 |
| - "Tim Dettmers", |
108 |
| - "Luke Zettlemoyer", |
109 |
| - "Ari Morcos", |
110 |
| - "Ali Farhadi", |
111 |
| - "Ludwig Schmidt" |
112 |
| - ], |
113 |
| - "year": "2023", |
114 |
| - "venue": "NeurIPS 2023", |
115 |
| - "links": { |
116 |
| - "pdf": "https://arxiv.org/abs/2304.13013" |
117 |
| - } |
118 |
| - }, |
119 | 2 | {
|
120 | 3 | "title": "Cola: How to adapt vision-language models to Compose Objects Localized with Attributes?",
|
121 | 4 | "authors": [
|
|
0 commit comments