Image-Text-to-Text
Transformers
English
qwen2_vl
conversational
VLM2Vec-Qwen2VL-2B / eval /OK-VQA_pred.txt
memray's picture
Upload 84 files
2fbff2e verified
('drive', '')
('forest', '')
('teddy', '')
('paw', '')
('legal', '')
('poop', '')
('bench', '')
('fun', '')
('seed', '')
('batter', '')
('salt water beach', '')
('artist', '')
('veggies', '')
('platform', '')
('bmx', '')
('boeing', '')
('girl', '')
('thousand of year', '')
('ollie', '')
('homerun', '')
('light', '')
('circle', '')
('500 pounds', '')
('cross country', '')
('wetsuit', '')
('longboard', '')
('polyester', '')
('teeth', '')
('cheesecake', '')
('vase', '')
('scotland', '')
('soup', '')
('fake', '')
('1500', '')
('quilt', '')
('brazil', '')
('pizza hut', '')
('diesel', '')
('becker vineyard', '')
('shatter', '')
("french's", '')
('design', '')
('sushi', '')
('hummingbird', '')
('they are smile', '')
('1000 mph', '')
('cowboy hat', '')
('wood', '')
('nothing', '')
('cement', '')
('railroad', '')
('fisheye', '')
('gazebo', '')
('throw it', '')
('high school', '')
('ottoman', '')
('commercial', '')
('batter', '')
('birkenstock', '')
('joss whedon', '')
('dawn', '')
('expensive', '')
('sylvester', '')
('sink', '')
('hooves', '')
('kuwait airway', '')
('1806', '')
('uber', '')
('mickey mouse', '')
('coconut', '')
('cross country', '')
('long neck', '')
('mammal', '')
('water', '')
('6 feet', '')
('siamese', '')
('veggies', '')
('veggies', '')
('stormy', '')
('convection', '')
('sail', '')
('napkin', '')
('truck', '')
('past', '')
('steer', '')
('polo', '')
('electric blanket', '')
('helium', '')
('both', '')
('many', '')
('no water', '')
('advertise brand', '')
('concert', '')
('to sleep', '')
('oneworld', '')
('curtain', '')
('pig', '')
('knob', '')
('3 feet', '')
('5 tons', '')
('levis', '')
('nocturnal', '')
('contrail', '')
('very', '')
('pizzaria', '')
('mutt', '')
('piano', '')
('cargo', '')
('canine', '')
('pancake', '')
('thanksgiving', '')
('worm', '')
('transport', '')
('herd', '')
('paw', '')
('serrated', '')
('south america', '')
('30 years', '')
('sponsor', '')
('claw', '')
('concert', '')
('drive', '')
('no left turn', '')
('pleasure', '')
('school', '')
('3 minutes', '')
('myna', '')
('swimsuit', '')
('taxi', '')
('flood', '')
('1500', '')
('poop', '')
('skatepark', '')
('hat', '')
('salt and pepper', '')
('simmer', '')
('spatula', '')
('make donuts', '')
('canal', '')
('legal', '')
('florist', '')
('anchor aweigh', '')
('seagull', '')
('microphone', '')
('both', '')
('tempered', '')
('beef', '')
('piano', '')
('thomas', '')
('nylon', '')
('rugby', '')
('race horse', '')
('plumber', '')
('sahara', '')
('pita', '')
('buddhism', '')
('ice', '')
('siamese', '')
('sydney', '')
('carnivore', '')
('honey mustard', '')
('cool', '')
('ski slope', '')
('diesel', '')
('tern', '')
('trash', '')
('disc golf', '')
('cook it', '')
('road work', '')
('farm', '')
('vitamin', '')
('ketchup and pea', '')
('clinton', '')
('metal', '')
('screensaver', '')
('medium rare', '')
('canary', '')
('juice', '')
('political', '')
('north america', '')
('motorcycle license', '')
('chihuahua', '')
('home plate', '')
('teeth', '')
('wind', '')
('crosswalk', '')
('too big', '')
('marathon', '')
('30.7 lbs', '')
('very', '')
('arabian', '')
('natural', '')
('mushroom', '')
('ship', '')
('wood and metal', '')
('tide', '')
('sunlight', '')
('robe', '')
('microwave', '')
('badminton', '')
('50 mph', '')
('wind turbine', '')
('mice', '')
('1801', '')
('hp', '')
('freight', '')
('biplane', '')
('caution', '')
('seattle', '')
('freeway', '')
('mario', '')
('near sighted', '')
('racket', '')
('bamboo', '')
('anger', '')
('fluoride', '')
('heart rate', '')
('both', '')
('feather', '')
('andes', '')
('legal', '')
('lab', '')
('1500', '')
('violin', '')
('rainbow', '')
('very big', '')
('thomas', '')
('1968', '')
('party', '')
('roadster', '')
('jk rowling', '')
('dirt bike', '')
('samsung', '')
('rough', '')
('neoprene', '')
('coke', '')
('lock', '')
('russian', '')
('gull', '')
('anchor', '')
('million', '')
('temperate', '')
('jumped', '')
('middle', '')
('pelican', '')
('chihuahua', '')
('victorian', '')
('equus quagga', '')
('hp', '')
('granite', '')
('leopard', '')
('dry hand', '')
('elephant', '')
('soccer', '')
('overhand', '')
('million', '')
('firemen', '')
('denim', '')
('1847', '')
('north america', '')
('drive', '')
('cowboy hat', '')
('rolex', '')
('25 years', '')
('arabian', '')
('greyhound', '')
('suzuki', '')
('sunlight', '')
('thomas', '')
('sun', '')
('flourescent', '')
('sail', '')
('kickstand', '')
('ceramic', '')
('1930s', '')
('hat', '')
('handstand', '')
('pass', '')
('forest', '')
('turf', '')
('table', '')
('throw', '')
('cell', '')
('culinary', '')
('cubicle', '')
('fly kite', '')
('ice', '')
('samsung', '')
('video', '')
('kohler', '')
('20s', '')
('motorola', '')
('panther', '')
('30 minutes', '')
('kenmore', '')
('communication', '')
('floral', '')
('sausage', '')
('15 years', '')
('tern', '')
('nothing', '')
('bike', '')
('alaska', '')
('hello kitty', '')
('husky', '')
('not cold', '')
('drop', '')
('70 years', '')
('rolex', '')
('salmon', '')
('cumulus', '')
('beach', '')
('tree', '')
('biplane', '')
('yankees', '')
('thousand of year', '')
('toucan', '')
('political', '')
('ferris wheel', '')
('religion', '')
('laundry', '')
('bareback', '')
('pit bull', '')
('grocery', '')
('stainless steel', '')
('thanksgiving', '')
('river', '')
('potato', '')
('north america', '')
('brake', '')
('no leaf on tree', '')
('picture', '')
('evergreen', '')
('wine taster', '')
('hispanic', '')
('no left turn', '')
('school', '')
('women', '')
('pedestrian', '')
('fake', '')
('robe', '')
('right', '')
('match', '')
('ice', '')
('exam room', '')
('exhaust', '')
('cardboard', '')
('shark', '')
('skatepark', '')
('tennis net', '')
('1940s', '')
('forest', '')
('river', '')
('mirror', '')
('fish', '')
('mule', '')
('early 19th century', '')
('boiled', '')
('drown', '')
('moderately', '')
('amtrak', '')
('skyscraper', '')
('tern', '')
('be quiet', '')
('garage', '')
('street name', '')
('chopstick', '')
('hospital', '')
('brazil', '')
('bluejay', '')
('communicating', '')
('sesame', '')
('picket', '')
('bee', '')
('college student', '')
('end aid', '')
('live', '')
('pet store', '')
('cloudy', '')
('half', '')
('nose', '')
('on trip', '')
('headphone', '')
('dine room', '')
('vacation', '')
('miniature', '')
('million', '')
('thomas', '')
('brewed', '')
('sand', '')
('rice', '')
('pleasure', '')
('sail', '')
('goalie', '')
('2 quarts', '')
('doberman', '')
('caution', '')
('75 million', '')
('worm', '')
('child', '')
('artist', '')
('cool', '')
('bandana', '')
('air canada', '')
('grilled', '')
('monitor', '')
('wet suit', '')
('sydney', '')
('bear', '')
('compact', '')
('honey mustard', '')
('play tennis', '')
('safety', '')
('broccoli', '')
('croissant', '')
('pay here', '')
('neck', '')
('pita', '')
('wireless', '')
('1800s', '')
('1903', '')
('festival', '')
('hotel', '')
('honda accord', '')
('sail', '')
('kite', '')
('plaid', '')
('catch fish', '')
('line', '')
('road work', '')
('cactus', '')
('red soil', '')
('million', '')
('blended beverage', '')
('hypothermia', '')
('fondant', '')
('toshiba', '')
('winair', '')
('stallion', '')
('legal', '')
('commercial', '')
('caution', '')
('mexico', '')
('boy', '')
('yamaha', '')
('japanese', '')
('citrus', '')
('canada', '')
('catch', '')
('pine tree', '')
('brush teeth', '')
('ski pole', '')
('ducati', '')
('labrador', '')
('pass', '')
('6 feet', '')
('budweiser', '')
('moo', '')
('strike', '')
('kibble', '')
('dough', '')
('wooden', '')
('kickflip', '')
('log', '')
('selfie', '')
('wooden', '')
('babolat', '')
('siamese', '')
('foal', '')
('talk show', '')
('many', '')
('palm tree', '')
('ice', '')
('farm', '')
('music', '')
('glove', '')
('20 inches', '')
('equestrian', '')
('pull', '')
('california hawaii', '')
('black cat', '')
('graffiti artist', '')
('bench', '')
('yosemite', '')
('bowties', '')
('lay down', '')
('cotton candy', '')
('wicker', '')
('mozzarella', '')
('america', '')
('teeth', '')
('thousand of year', '')
('hp', '')
('crystal', '')
('airplane', '')
('live', '')
('pasture', '')
('dent', '')
('tortoise', '')
('sew', '')
('see better', '')
('babe ruth', '')
('race horse', '')
('medieval', '')
('30 minutes', '')
('mozzarella', '')
('1806', '')
('motocross', '')
('million', '')
('pack material', '')
('clockmaker', '')
('forest', '')
('cotton candy', '')
('compact', '')
('poop', '')
('sticker', '')
('toy store', '')
('throw', '')
('passtime', '')
('tupperware', '')
('log', '')
('merino', '')
('pelican', '')
('navel', '')
('wetsuit', '')
('truck', '')
('child', '')
('hawk', '')
('bluetooth', '')
('coke', '')
('chinese new year', '')
('space', '')
('fish', '')
('harry potter', '')
('even', '')
('16 years', '')
('advertise brand', '')
('military', '')
('toxoplasmosis', '')
('traditional', '')
('leash', '')
('stove', '')
('napkin', '')
('military', '')
('flew', '')
('penny farthing', '')
('frisbee', '')
('kung fu panda', '')
('home plate', '')
('oven', '')
('ship', '')
('ship', '')
('wilson', '')
('sheep', '')
('wine taste', '')
('clean', '')
('furniture store', '')
('sled', '')
('phone', '')
('pirate', '')
('babar', '')
('computer', '')
('time tell', '')
('kickflip', '')
('chicken', '')
('seattle', '')
('150mph', '')
('bok choy', '')
('1885', '')
('move', '')
('jockey', '')
('engineering', '')
('plaid', '')
('firemen', '')
('europe', '')
('electric', '')
('farm', '')
('fruit', '')
('willow', '')
('shark', '')
('texas', '')
('not rain hard', '')
('brewed', '')
('giraffe', '')
('benjamin franklin', '')
('caution', '')
('swim', '')
('vitamin', '')
('ketchup', '')
('very expensive', '')
('leapfrog', '')
('arabian', '')
('pepperoni', '')
('throw it', '')
('tokyo', '')
('8 planks', '')
('furniture store', '')
('harley davidson', '')
('squat', '')
('luggage', '')
('united kingdom', '')
('alp', '')
('biplane', '')
('hamburger', '')
('stew', '')
('extremely', '')
('exam room', '')
('garage', '')
('forklift driver', '')
('50 gallons', '')
('pasture', '')
('jet fuel', '')
('ottoman', '')
('los angeles', '')
('goth', '')
('squat', '')
('motorola', '')
('zoo', '')
('smoke', '')
('practice', '')
('christmas', '')
('strawberry', '')
('formal', '')
('texas', '')
('minaret', '')
('nutrient', '')
('bench', '')
('walkway', '')
('ski slope', '')
('madonna', '')
('samsung', '')
('cool', '')
('herd', '')
('lincoln', '')
('propeller', '')
('marie antoinette', '')
('recliner', '')
('box', '')
('underhand', '')
('pepto bismol', '')
('knee', '')
('$10000', '')
('ketchup', '')
('log', '')
('same team', '')
('alpine', '')
('neoprene', '')
('microwave', '')
('stoplight', '')
('digital camera', '')
('guinness', '')
('world series', '')
('backspace', '')
('strike', '')
('danish', '')
('bath', '')
('field', '')
('wax', '')
('wetsuit', '')
('cross country', '')
('sandwich', '')
('meat', '')
("don't walk", '')
('danish', '')
('windex', '')
('cloudy', '')
('herbivore', '')
('desktop', '')
('log', '')
('sunday', '')
('tomato', '')
('christmas light', '')
('siamese', '')
('siamese', '')
('remote', '')
('shell', '')
('anniversary', '')
('autumn', '')
('himalayas', '')
('best buy', '')
('captain', '')
('troposphere', '')
('stopped', '')
('truck', '')
('goatee', '')
('star alliance', '')
('fender', '')
('penny farthing', '')
('government', '')
('tusk', '')
('yankees', '')
('capris', '')
('birthday', '')
('take picture', '')
('rancher', '')
('topology', '')
('sweet', '')
('steam engine', '')
('rice', '')
('smoothie', '')
('glad', '')
('grizzly', '')
('water ski', '')
('women', '')
('harley davidson', '')
('flock', '')
('route 66', '')
('land', '')
('design', '')
('see better', '')
('bamboo', '')
('london bridge', '')
('see yourself', '')
('canopy', '')
('transportaion', '')
('desert', '')
('bunk bed', '')
('equus quagga', '')
('space', '')
('india', '')
('sideburn', '')
('india', '')
('shark', '')
('commercial', '')
('german', '')
('line', '')
('american airline', '')
('ice', '')
('thousand of year', '')
('log', '')
('carpet', '')
('move', '')
('guinness', '')
('jet fuel', '')
('ferris wheel', '')
('circle', '')
('reflection', '')
('tusk', '')
('college', '')
('shade', '')
('spark plug', '')
('fighter jet', '')
('tuxedo', '')
('rest', '')
('put out fire', '')
('french', '')
('sister', '')
('1000 mph', '')
('moen', '')
('pillow', '')
('north', '')
('15000 feet', '')
('cosmetology', '')
('apartment', '')
('peter fonda', '')
('clydesdale', '')
('sking sled', '')
('brown bear', '')
('communication', '')
('safety', '')
('brush teeth', '')
('pulled pork', '')
('even', '')
('fix traffic light', '')
('eagle', '')
('neoprene', '')
('biscuit', '')
('grizzly', '')
('firemen', '')
('yamaha', '')
('wooden', '')
('circle', '')
('slicer', '')
('tennis match', '')
('million', '')
('glare', '')
('floral', '')
('thomas', '')
('passenger', '')
('log', '')
('black', '')
('harley', '')
('air show', '')
('collie', '')
('thousand', '')
('picture', '')
('be quiet', '')
('1940s', '')
('white shirt', '')
('oil', '')
('striped', '')
('dusk', '')
('time zone', '')
('railroad', '')
('very', '')
('pepsi', '')
('ocean', '')
('cheesecake', '')
('sailboat', '')
('heron', '')
('travel', '')
('cordless', '')
('fast food', '')
('luggage', '')
('collie', '')
('grape and banana', '')
('cooked', '')
('1500', '')
('thick', '')
('1000 mph', '')
('cow milk', '')
('near sighted', '')
('they eat grass', '')
('train station', '')
('leash', '')
('vitamin', '')
('bulb', '')
('gas', '')
('cake', '')
('korean', '')
('spray paint', '')
('gottlieb daimler', '')
('20 inches', '')
('american shorthair', '')
('herbivorous', '')
('mustard', '')
('disorganized', '')
('hitchcock', '')
('steamed', '')
('fine', '')
('broken leg', '')
('brush teeth', '')
('croissant', '')
('2 tons', '')
('french fry', '')
('climate change', '')
('control horse', '')
('tern', '')
('olives', '')
('benjamin franklin', '')
('juice', '')
('picket', '')
('50 cents', '')
('ebay', '')
("2000's", '')
('carrot', '')
('hike', '')
('cafeteria', '')
('log', '')
('phone', '')
('watch tv', '')
('15 years', '')
('steam locomotive', '')
('not safe', '')
('to sleep', '')
('cowboy hat', '')
('goldilocks', '')
('rawlings', '')
('canine', '')
('fedora', '')
('blt', '')
('suitcase', '')
('300', '')
('rosa park', '')
('day', '')
('equestrian', '')
('reuben', '')
('plant', '')
('roll', '')
('heat', '')
('in oven', '')
('mouse', '')
('bake it', '')
('mosquito net', '')
('french door', '')
('anger', '')
('big ben', '')
('donuts', '')
('15000 feet', '')
('sing', '')
('time zone', '')
('thirsty', '')
('pacific ocean', '')
('rugby', '')
('korean air', '')
('pun', '')
('southeast asia', '')
('halloween', '')
('50 years', '')
('1930s', '')
('video game', '')
('australia', '')
('shark', '')
('pacific ocean', '')
('pitbull', '')
('german shepard', '')
('fruit', '')
('butter', '')
('arabian', '')
('downhill', '')
('6 weeks', '')
('cook', '')
('vanilla', '')
('recently', '')
('fiberglass', '')
('spoon', '')
('pajama', '')
('1000 mph', '')
('1936', '')
('messy', '')
('gothic', '')
('medieval', '')
('bowl', '')
('500 pounds', '')
('luggage', '')
('jansport', '')
('monet', '')
('asian', '')
('mahogany', '')
('tabby', '')
('ricotta', '')
('figurine', '')
('wallpaper', '')
('hole', '')
('floral', '')
('carbon monoxide', '')
('pass', '')
('motorcycle license', '')
('vase', '')
("french's", '')
('boeing', '')
('picnic', '')
('clock tower', '')
('wetsuit', '')
('everest', '')
('150mph', '')
('stopped', '')
('marshmellow', '')
('15 years', '')
('boeing', '')
('itali', '')
('fruit', '')
('cruise', '')
('twin', '')
('canine', '')
('tokyo', '')
('baked in oven', '')
('antarctica', '')
('halloween', '')
('not valuable', '')
('lincoln', '')
('museum', '')
('vietnam', '')
('very', '')
('zebra', '')
('lettuce', '')
('daisy', '')
('australia', '')
('office', '')
('serena williams', '')
('orange juice', '')
("valentine's day", '')
('tony hawk', '')
('cumulus', '')
('transport good', '')
('transport good', '')
('flip phone', '')
('coffee table', '')
('cook', '')
('tree', '')
('kohler', '')
('barn', '')
('architect', '')
('europe', '')
('race horse', '')
('shoulder', '')
('volleyball', '')
('gothic', '')
('benjamin franklin', '')
('fire hydrant', '')
('black cat', '')
('fall', '')
('colander', '')
('play video game', '')
('merino', '')
('dry hand', '')
('pilot', '')
('legal', '')
('partly cloudy', '')
('amazon', '')
('20s', '')
('log', '')
('san francisco', '')
('tony hawk', '')
('bang', '')
('roy cawood', '')
('2 16 years', '')
('blanket', '')
('new york city', '')
('brahman', '')