|
250 | 250 | "code": "https://github.com/wisdomikezogwo/quilt1m"
|
251 | 251 | }
|
252 | 252 | },
|
253 |
| - { |
254 |
| - "title": "EcoAssistant: Using LLM Assistant More Affordably and Accurately", |
255 |
| - "authors": [ |
256 |
| - "Jieyu Zhang", |
257 |
| - "Ranjay Krishna", |
258 |
| - "Ahmed H. Awadallah", |
259 |
| - "Chi Wang" |
260 |
| - ], |
261 |
| - "year": "2023", |
262 |
| - "venue": null, |
263 |
| - "links": { |
264 |
| - "pdf": "https://arxiv.org/abs/2310.03046", |
265 |
| - "code": "https://github.com/JieyuZ2/EcoAssistant" |
266 |
| - }, |
267 |
| - "thumbnail": "/ecoassistant.png" |
268 |
| - }, |
269 |
| - { |
270 |
| - "title": "Tool Documentation Enables Zero-Shot Tool-Usage with Large Language Models", |
271 |
| - "authors": [ |
272 |
| - "Cheng-Yu Hsieh", |
273 |
| - "Si-An Chen", |
274 |
| - "Chun-Liang Li", |
275 |
| - "Yasuhisa Fujii", |
276 |
| - "Alexander Ratner", |
277 |
| - "Chen-Yu Lee", |
278 |
| - "Ranjay Krishna", |
279 |
| - "Tomas Pfister" |
280 |
| - ], |
281 |
| - "year": "2023", |
282 |
| - "venue": null, |
283 |
| - "links": { |
284 |
| - "pdf": "https://arxiv.org/abs/2308.00675" |
285 |
| - } |
286 |
| - }, |
287 |
| - { |
288 |
| - "title": "MIMIC: Masked Image Modeling with Image Correspondences", |
289 |
| - "authors": [ |
290 |
| - "Kalyani Marathe", |
291 |
| - "Mahtab Bigverdi", |
292 |
| - "Nishat Khan", |
293 |
| - "Tuhin Kundu", |
294 |
| - "Aniruddha Kembhavi", |
295 |
| - "Linda G. Shapiro", |
296 |
| - "Ranjay Krishna" |
297 |
| - ], |
298 |
| - "year": "2023", |
299 |
| - "venue": null, |
300 |
| - "links": { |
301 |
| - "pdf": "https://arxiv.org/pdf/2306.15128.pdf", |
302 |
| - "code": "https://github.com/RAIVNLab/MIMIC" |
303 |
| - } |
304 |
| - }, |
305 |
| - { |
306 |
| - "title": "Cultural and Linguistic Diversity Improves Visual Representations", |
307 |
| - "authors": [ |
308 |
| - "Andre Ye", |
309 |
| - "Sebastin Santy", |
310 |
| - "Jena D. Hwang", |
311 |
| - "Amy X. Zhang", |
312 |
| - "Ranjay Krishna" |
313 |
| - ], |
314 |
| - "year": "2023", |
315 |
| - "venue": null, |
316 |
| - "links": { |
317 |
| - "pdf": "https://arxiv.org/pdf/2310.14356.pdf" |
318 |
| - } |
319 |
| - }, |
320 |
| - { |
321 |
| - "title": "Improving Multimodal Datasets with Image Captioning", |
322 |
| - "authors": [ |
323 |
| - "Thao Nguyen", |
324 |
| - "Samir Yitzhak Gadre", |
325 |
| - "Gabriel Ilharco", |
326 |
| - "Sewoong Oh", |
327 |
| - "Ludwig Schmidt" |
328 |
| - ], |
329 |
| - "year": "2023", |
330 |
| - "venue": "NeurIPS 2023", |
331 |
| - "links": { |
332 |
| - "pdf": "https://arxiv.org/abs/2307.10350" |
333 |
| - } |
334 |
| - }, |
335 |
| - { |
336 |
| - "title": "AdANNS: A Framework for Adaptive Semantic Search", |
337 |
| - "authors": [ |
338 |
| - "Aniket Rege", |
339 |
| - "Aditya Kusupati", |
340 |
| - "Sharan Ranjit S", |
341 |
| - "Alan Fan", |
342 |
| - "Qingqing Cao", |
343 |
| - "Sham Kakade", |
344 |
| - "Prateek Jain", |
345 |
| - "Ali Farhadi" |
346 |
| - ], |
347 |
| - "year": "2023", |
348 |
| - "venue": "NeurIPS 2023", |
349 |
| - "links": { |
350 |
| - "pdf": "https://arxiv.org/abs/2305.19435", |
351 |
| - "code": "https://github.com/RAIVNLab/AdANNS" |
352 |
| - } |
353 |
| - }, |
354 |
| - { |
355 |
| - "title": "Stable and low-precision training for large-scale vision-language models", |
356 |
| - "authors": [ |
357 |
| - "Mitchell Wortsman", |
358 |
| - "Tim Dettmers", |
359 |
| - "Luke Zettlemoyer", |
360 |
| - "Ari Morcos", |
361 |
| - "Ali Farhadi", |
362 |
| - "Ludwig Schmidt" |
363 |
| - ], |
364 |
| - "year": "2023", |
365 |
| - "venue": "NeurIPS 2023", |
366 |
| - "links": { |
367 |
| - "pdf": "https://arxiv.org/abs/2304.13013" |
368 |
| - } |
369 |
| - }, |
370 | 253 | {
|
371 | 254 | "title": "Cola: How to adapt vision-language models to Compose Objects Localized with Attributes?",
|
372 | 255 | "authors": [
|
|
0 commit comments