Spaces:
Running
Running
minor c
Browse files- examples/generated_output_captions_en.jsonl +150 -0
- test_1/1.txt +0 -1
examples/generated_output_captions_en.jsonl
ADDED
@@ -0,0 +1,150 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"id": 930, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A baby is crying.", "ground_truth_text": "A baby is crying in distress in short bursts rapidly."}
|
2 |
+
{"id": 8272, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A man speaks as a door slams.", "ground_truth_text": "Men speak followed by a door shutting."}
|
3 |
+
{"id": 1272, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A cat meows and a door slams.", "ground_truth_text": "A cat meows followed by the sounds of items clattering."}
|
4 |
+
{"id": 2733, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nHow would you caption this audio snippet? ", "generated_text": "A dog barks and growls while people speak.", "ground_truth_text": "A dog barking as a man and a woman are talking followed by water splashing and children talking in the background."}
|
5 |
+
{"id": 670, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCreate a caption that summarizes this audio. ", "generated_text": "A loud screeching sound followed by people cheering.", "ground_truth_text": "A loud engine revving, then the crowd claps and cheers."}
|
6 |
+
{"id": 2796, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption would you suggest for this audio? ", "generated_text": "A person is sniffling and sniffing.", "ground_truth_text": "Water trickling followed by a person snickering."}
|
7 |
+
{"id": 8779, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCaption this audio file for me, please. ", "generated_text": "A chainsaw is revving up and then idling.", "ground_truth_text": "A chainsaw revs then idles and eventually stops."}
|
8 |
+
{"id": 7437, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A motor revs up and then a hiss is heard.", "ground_truth_text": "Speedboat with water spraying."}
|
9 |
+
{"id": 1402, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nPlease suggest a caption for the audio I've shared. ", "generated_text": "A dog barks and growls followed by a dog whimpering.", "ground_truth_text": "A dog barks then runs followed by dogs growling."}
|
10 |
+
{"id": 4934, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCraft a caption that encapsulates this audio. ", "generated_text": "A man and a woman are speaking and a baby is making sounds.", "ground_truth_text": "People are talking as a snake hisses."}
|
11 |
+
{"id": 907, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you draft a caption for this audio recording? ", "generated_text": "A helicopter flies overhead.", "ground_truth_text": "A helicopter flies close to the ground overhead and flies off."}
|
12 |
+
{"id": 2187, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A train is moving along the tracks and a bell is ringing.", "ground_truth_text": "Steam train whistle as it approaches on the tracks then recedes."}
|
13 |
+
{"id": 5944, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nHow would you caption this audio snippet? ", "generated_text": "A series of electronic beeps.", "ground_truth_text": "A loud, sharp electronic beep is occurring repetitively."}
|
14 |
+
{"id": 607, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A telephone rings and then stops.", "ground_truth_text": "Phone ringing then the click of being picked up and put back down."}
|
15 |
+
{"id": 8591, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption would you suggest for this audio? ", "generated_text": "A vehicle engine running and a dog barking.", "ground_truth_text": "Water is running and frog croaks."}
|
16 |
+
{"id": 6163, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A horse is trotting and birds are chirping.", "ground_truth_text": "Traffic passing in the distance and birds chirp as a running horse gets closer with louder clip-clops."}
|
17 |
+
{"id": 4560, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you provide a caption for this sound recording? ", "generated_text": "A gentle wind blows and birds chirp.", "ground_truth_text": "Light wind blowing followed by birds chirping as more wind blows."}
|
18 |
+
{"id": 1526, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you come up with a caption for this audio segment? ", "generated_text": "A large bell is being rung.", "ground_truth_text": "Several bells are chimed."}
|
19 |
+
{"id": 2348, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCome up with a fitting caption for this audio track. ", "generated_text": "A train is passing by and a dog barks.", "ground_truth_text": "A bus engine idles followed by faint beeping and people conversing in the distance."}
|
20 |
+
{"id": 366, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCreate a caption that summarizes this audio. ", "generated_text": "A toilet is being flushed and a man speaks.", "ground_truth_text": "Food is frying and being stirred followed by a man talking."}
|
21 |
+
{"id": 9142, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption would you suggest for this audio? ", "generated_text": "A woman speaks while water runs and food sizzles.", "ground_truth_text": "A soft sizzle of food frying and a scraping noise which followed by a woman with a soft voice saying a few words."}
|
22 |
+
{"id": 8405, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A dog barks as music plays.", "ground_truth_text": "A dog barks several times, and then music starts to play in the background."}
|
23 |
+
{"id": 4771, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A woman whistling and tapping on a surface.", "ground_truth_text": "A baby cries and a surface is tapped."}
|
24 |
+
{"id": 2391, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nHow would you caption this audio snippet? ", "generated_text": "A large group of people are clapping followed by a man speaking and laughing.", "ground_truth_text": "An audience applause as a man laughs and then speaks."}
|
25 |
+
{"id": 4317, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nKindly generate a caption for the following audio. ", "generated_text": "A woman speaks followed by a goat bleating.", "ground_truth_text": "A young female voice with goat bleating in the background."}
|
26 |
+
{"id": 5326, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you come up with a caption for this audio segment? ", "generated_text": "A vehicle is driving by and the wind is blowing.", "ground_truth_text": "Thunder booms in the distance as traffic passes by."}
|
27 |
+
{"id": 3420, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you provide a caption for this sound recording? ", "generated_text": "A horn is honking while people are talking.", "ground_truth_text": "A horn sounds while people talk in the background."}
|
28 |
+
{"id": 7749, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nHow would you caption this audio snippet? ", "generated_text": "A dog barks and growls while children talk.", "ground_truth_text": "Dogs yipping and barking over human chatter."}
|
29 |
+
{"id": 7948, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you come up with a caption for this audio segment? ", "generated_text": "A metal object is being dragged across a surface followed by a loud bang.", "ground_truth_text": "Some clicking followed by scraping then a loud bang."}
|
30 |
+
{"id": 5579, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nTranslate the essence of this audio into a caption. ", "generated_text": "A man speaks followed by a metal hit.", "ground_truth_text": "Speaking followed by a bang."}
|
31 |
+
{"id": 9861, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you provide a caption for this sound recording? ", "generated_text": "A truck engine idling followed by a horn.", "ground_truth_text": "Wind blowing with faint humming of engines followed by a distant horn."}
|
32 |
+
{"id": 4150, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A woman speaks while metal clinks.", "ground_truth_text": "A woman speaks, metal clinks."}
|
33 |
+
{"id": 134, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCaption this audio file for me, please. ", "generated_text": "A phone beeps and a man speaks.", "ground_truth_text": "A beep and a tone sounds then an electronic voice talks."}
|
34 |
+
{"id": 10007, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCraft a caption that encapsulates this audio. ", "generated_text": "A bird caws and caws again.", "ground_truth_text": "Wind noises and seagulls whining."}
|
35 |
+
{"id": 3932, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A man speaks while birds chirp.", "ground_truth_text": "Bird tweeting in the background and a man talking."}
|
36 |
+
{"id": 1547, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A horn blares, followed by a man speaking.", "ground_truth_text": "Loud musical horn then vehicle zooming by then male voice."}
|
37 |
+
{"id": 5263, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you provide a caption for this sound recording? ", "generated_text": "A dog barks and growls and a man speaks.", "ground_truth_text": "Dogs bark and whimper then a woman speaks."}
|
38 |
+
{"id": 5052, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nDevise a caption that matches the theme of this audio. ", "generated_text": "A man speaks and ducks quack.", "ground_truth_text": "Ducks quack as a woman speaks followed by flapping wings."}
|
39 |
+
{"id": 3143, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A fly buzzes and then a frog croaks.", "ground_truth_text": "A fly buzzing followed by a gulping sound is repeated, after which a frog croaks."}
|
40 |
+
{"id": 3282, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you draft a caption for this audio recording? ", "generated_text": "A telephone is ringing and then someone is typing on a keyboard.", "ground_truth_text": "A telephone is ringing and beeping."}
|
41 |
+
{"id": 4923, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A sizzle followed by a tap.", "ground_truth_text": "Grease sizzles as a condiment is shaken then put down."}
|
42 |
+
{"id": 4144, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A dog barks followed by a gunshot.", "ground_truth_text": "Pounding hitting sounds followed by a dog barking frantically."}
|
43 |
+
{"id": 6241, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption best describes the content of this audio? ", "generated_text": "A boat motor runs followed by a man speaking.", "ground_truth_text": "An aircraft flies while wind blows and a man talks."}
|
44 |
+
{"id": 2281, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCaption this audio file for me, please. ", "generated_text": "A train is moving along the tracks while people are talking.", "ground_truth_text": "Horses and a child speaking in the background."}
|
45 |
+
{"id": 869, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you draft a caption for this audio recording? ", "generated_text": "A woman laughs and speaks while people laugh in the background.", "ground_truth_text": "A man speaks when someone laughs quickly as the wind blows and ducks are quacking from a distance followed by laughter and a man speaks."}
|
46 |
+
{"id": 6129, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCome up with a fitting caption for this audio track. ", "generated_text": "A dog growling followed by a hiss and a loud engine revving.", "ground_truth_text": "A frog croaks and a whoosh goes off."}
|
47 |
+
{"id": 7864, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nDevise a caption that matches the theme of this audio. ", "generated_text": "A man speaks and a spray can is used.", "ground_truth_text": "A man speaks followed by a loud hiss."}
|
48 |
+
{"id": 3871, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you draft a caption for this audio recording? ", "generated_text": "A cat meows and a man speaks.", "ground_truth_text": "A cat is meowing softly several times then a man speaks."}
|
49 |
+
{"id": 4153, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCome up with a fitting caption for this audio track. ", "generated_text": "A man speaking while water is splashing.", "ground_truth_text": "A man speaks with some sizzling."}
|
50 |
+
{"id": 7242, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption would you suggest for this audio? ", "generated_text": "A man speaks and a baby cries.", "ground_truth_text": "A woman talking with snoring in the background."}
|
51 |
+
{"id": 2458, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A large group of people are cheering and a car is driving by.", "ground_truth_text": "People are talking and cheering then a vehicle speeds off loudly."}
|
52 |
+
{"id": 6881, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption would you suggest for this audio? ", "generated_text": "A telephone rings.", "ground_truth_text": "Telephone is ringing loudly."}
|
53 |
+
{"id": 619, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCome up with a fitting caption for this audio track. ", "generated_text": "A woman laughs and a man speaks while a whistle blows.", "ground_truth_text": "A woman is screaming loudly while duck is quacking in background."}
|
54 |
+
{"id": 2956, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCome up with a fitting caption for this audio track. ", "generated_text": "A woman speaks while a bird chirps and a plate is moved.", "ground_truth_text": "A woman talks while in the background there is the splashing of ducks in the water."}
|
55 |
+
{"id": 9193, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nHow would you caption this audio snippet? ", "generated_text": "A machine gun is fired.", "ground_truth_text": "An automatic gunfire is triggered for a long period."}
|
56 |
+
{"id": 4298, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nKindly generate a caption for the following audio. ", "generated_text": "A man speaks while a bird squawks and a dog barks.", "ground_truth_text": "Rain and hail hit a window while a person speaks."}
|
57 |
+
{"id": 1483, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCaption this audio file for me, please. ", "generated_text": "A bird is chirping and whistling.", "ground_truth_text": "Whistling with birds in the background."}
|
58 |
+
{"id": 5009, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nTranslate the essence of this audio into a caption. ", "generated_text": "A man speaks followed by a whistle.", "ground_truth_text": "A man talks and then whistles."}
|
59 |
+
{"id": 2056, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nKindly generate a caption for the following audio. ", "generated_text": "A bird chirps, then an explosion occurs.", "ground_truth_text": "An explosion take place then birds chirp while an engine runs."}
|
60 |
+
{"id": 1874, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nTranslate the essence of this audio into a caption. ", "generated_text": "A helicopter is flying nearby.", "ground_truth_text": "A motorboat is cruising on the water."}
|
61 |
+
{"id": 9736, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A man speaks while food sizzles.", "ground_truth_text": "A man talking followed by clanking against a metal surface as food and oil sizzle."}
|
62 |
+
{"id": 3712, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A bell rings and a clock ticks.", "ground_truth_text": "An old fashioned bell rings and at the end a click and the ringing stops."}
|
63 |
+
{"id": 4847, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A motor starts up and then stops.", "ground_truth_text": "An engine running followed by revving and then idling with faint beeping in the background."}
|
64 |
+
{"id": 8816, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you provide a caption for this sound recording? ", "generated_text": "A train horn blares and people laugh.", "ground_truth_text": "Loud boat engine passing and then laughing."}
|
65 |
+
{"id": 2389, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you draft a caption for this audio recording? ", "generated_text": "A man is speaking and a bird is chirping.", "ground_truth_text": "Running water with male speech and bird calls."}
|
66 |
+
{"id": 5542, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCraft a caption that encapsulates this audio. ", "generated_text": "A cat meows and growls followed by a woman speaking.", "ground_truth_text": "A cat meows, followed by a person talking, followed by several meows."}
|
67 |
+
{"id": 10045, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCraft a caption that encapsulates this audio. ", "generated_text": "A man speaks followed by a large explosion.", "ground_truth_text": "A man speaks and an object bursts."}
|
68 |
+
{"id": 8153, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A strong wind blows and birds chirp as people talk in the distance.", "ground_truth_text": "Cars pass by as the wind blows heavily and birds chirp followed by multiple people communicating from a distance."}
|
69 |
+
{"id": 2906, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A man speaks and a computer beeps.", "ground_truth_text": "A computer voice is talking and beeps sound then a man talks at the same time as the computer voice, more beeps and the man gets the last word."}
|
70 |
+
{"id": 5355, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nHow would you caption this audio snippet? ", "generated_text": "A man speaking followed by a door closing.", "ground_truth_text": "An adult male speaking followed by a sliding door shutting."}
|
71 |
+
{"id": 8397, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A telephone ringing.", "ground_truth_text": "Different telephone ringings."}
|
72 |
+
{"id": 8122, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption best describes the content of this audio? ", "generated_text": "A motor is running.", "ground_truth_text": "A small engine runs continuously."}
|
73 |
+
{"id": 5103, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCome up with a fitting caption for this audio track. ", "generated_text": "A man speaking followed by a dog barking.", "ground_truth_text": "A woman is speaking and animals barking."}
|
74 |
+
{"id": 6025, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A car horn blares and a child yells.", "ground_truth_text": "A police car accelerates uses its siren briefly and squeals its tires."}
|
75 |
+
{"id": 8576, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A car engine revs up and then a door slams.", "ground_truth_text": "An engine starts up and then revs every second."}
|
76 |
+
{"id": 5884, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCraft a caption that encapsulates this audio. ", "generated_text": "A series of beeps followed by a series of ticking sounds.", "ground_truth_text": "Something is beeping and another object is stomping around."}
|
77 |
+
{"id": 3482, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCreate a caption that summarizes this audio. ", "generated_text": "A sheep bleats and a bird chirps.", "ground_truth_text": "A goat baaing followed by a person softly talking and heavy footsteps on dirt as a bird chirps in the background."}
|
78 |
+
{"id": 9331, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A woman sneezes twice.", "ground_truth_text": "A person sneezing."}
|
79 |
+
{"id": 1917, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nDevise a caption that matches the theme of this audio. ", "generated_text": "A metal clang followed by a man speaking.", "ground_truth_text": "Silverware clinking and man speaking."}
|
80 |
+
{"id": 10088, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A man is speaking while a dog is barking and growling.", "ground_truth_text": "A man shouts as a horse runs with a dog barking in the background."}
|
81 |
+
{"id": 2627, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCreate a caption that summarizes this audio. ", "generated_text": "A bird is chirping while the wind is blowing.", "ground_truth_text": "Wind blowing, birds chirp, some horse footsteps on dirt."}
|
82 |
+
{"id": 1502, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCaption this audio file for me, please. ", "generated_text": "A child speaks while someone types on a keyboard.", "ground_truth_text": "A male child speaks and plastic crumples and crinkles."}
|
83 |
+
{"id": 3740, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nHow would you caption this audio snippet? ", "generated_text": "A man speaking followed by a woman speaking and a goat bleating.", "ground_truth_text": "Children and man with sheep sounds."}
|
84 |
+
{"id": 1857, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you draft a caption for this audio recording? ", "generated_text": "A woman talks and a bird chirps.", "ground_truth_text": "A woman speaks as birds chirp."}
|
85 |
+
{"id": 5327, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A woman yells and then an explosion occurs.", "ground_truth_text": "Yelling followed by a pop and silence."}
|
86 |
+
{"id": 1375, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A man speaks and laughs while a bird chirps.", "ground_truth_text": "Men speaking with distant traffic then sprays and men laughing."}
|
87 |
+
{"id": 3042, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A person burps, then laughs, then burps again.", "ground_truth_text": "A girl burps loudly and other girls laugh, complain and talk."}
|
88 |
+
{"id": 3062, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption would you suggest for this audio? ", "generated_text": "A baby is crying.", "ground_truth_text": "A baby continuously crying."}
|
89 |
+
{"id": 6900, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption would you suggest for this audio? ", "generated_text": "A machine gun is firing rapidly.", "ground_truth_text": "A sequence of sustained machine gun fire followed by shorter bursts of rapid gunfire."}
|
90 |
+
{"id": 7914, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nGenerate an audio caption from this sound file. ", "generated_text": "A train horn blows followed by people talking and laughing.", "ground_truth_text": "A train horn blares loudly several times as people speak and laugh."}
|
91 |
+
{"id": 9641, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A bus passes by and a person yells.", "ground_truth_text": "N engine followed by a hiss and faint honks of a horn as traffic passes."}
|
92 |
+
{"id": 9499, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A dog barks, then a knock is heard, followed by music.", "ground_truth_text": "Pigeon cooing, birds chirping and then drum beats."}
|
93 |
+
{"id": 6537, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCaption this audio file for me, please. ", "generated_text": "A car passes by and then a horn honks followed by speech.", "ground_truth_text": "A vehicle driving by quickly followed by honking and distant murmuring."}
|
94 |
+
{"id": 2500, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCome up with a fitting caption for this audio track. ", "generated_text": "A vehicle revs its engine and then a person yells.", "ground_truth_text": "A motor vehicle engine is running and revving, tires squeal, an adult male yell, a blast occurs, and metal clangs."}
|
95 |
+
{"id": 8862, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A vehicle engine revs up and then a man speaks and laughs.", "ground_truth_text": "Engines are revving followed by an engine idling with people talking and giggling."}
|
96 |
+
{"id": 5050, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nPlease suggest a caption for the audio I've shared. ", "generated_text": "A strong wind blows and water splashes.", "ground_truth_text": "Splashing water accompanied by wind noises."}
|
97 |
+
{"id": 2050, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nDevise a caption that matches the theme of this audio. ", "generated_text": "A man speaks and then sneezes.", "ground_truth_text": "A woman talks and someone belches loudly."}
|
98 |
+
{"id": 10098, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption best describes the content of this audio? ", "generated_text": "A man speaks while a door slams.", "ground_truth_text": "A man is speaking and opens a door."}
|
99 |
+
{"id": 10206, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption would you suggest for this audio? ", "generated_text": "A man speaks followed by beeping.", "ground_truth_text": "A man speaks while electronics beeps."}
|
100 |
+
{"id": 10109, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCaption this audio file for me, please. ", "generated_text": "A man speaking followed by a car horn.", "ground_truth_text": "A man is speaking and a car horn honks."}
|
101 |
+
{"id": 9166, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A woman speaks followed by a man speaking and then a bell ringing.", "ground_truth_text": "A man speaking briefly followed by woman speaking alongside an electronic bell dinging with another man speaking then a seagull squawking."}
|
102 |
+
{"id": 3823, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nKindly generate a caption for the following audio. ", "generated_text": "A woman is speaking over music and a man is speaking over music.", "ground_truth_text": "People loudly talking with a bell ringing."}
|
103 |
+
{"id": 10137, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nGenerate an audio caption from this sound file. ", "generated_text": "A woman speaks and pans are clanged.", "ground_truth_text": "A woman talks while tapping plastic and wood objects."}
|
104 |
+
{"id": 3231, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCaption this audio file for me, please. ", "generated_text": "A crowd is talking and a motorcycle is revving its engine.", "ground_truth_text": "A crowd of people talking with traffic ambiance in the background followed by a vehicle engine revving."}
|
105 |
+
{"id": 10406, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCraft a caption that encapsulates this audio. ", "generated_text": "A bird whistles and then a person whistles.", "ground_truth_text": "A bird whistle, and then a person whistles."}
|
106 |
+
{"id": 10287, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A dog snoring and then barking.", "ground_truth_text": "A soft, breathy snore in the foreground, while a child yells distantly in the background."}
|
107 |
+
{"id": 10514, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A helicopter is flying above.", "ground_truth_text": "Pressured air blowing."}
|
108 |
+
{"id": 11241, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nTranslate the essence of this audio into a caption. ", "generated_text": "A vehicle engine starts up and revs.", "ground_truth_text": "Clanking followed by engine starting and revving."}
|
109 |
+
{"id": 10720, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nKindly generate a caption for the following audio. ", "generated_text": "A wind blowing followed by a metal clank.", "ground_truth_text": "The wind is blowing, rustling is present, and metal is clanging."}
|
110 |
+
{"id": 11082, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCreate a caption that summarizes this audio. ", "generated_text": "A woman speaking followed by a siren.", "ground_truth_text": "White noise an woman speaking followed by whistling."}
|
111 |
+
{"id": 11406, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you come up with a caption for this audio segment? ", "generated_text": "A man speaks as a train passes by.", "ground_truth_text": "Waves splashing, then a woman speaks."}
|
112 |
+
{"id": 11411, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCome up with a fitting caption for this audio track. ", "generated_text": "A man speaking followed by a loud thunder.", "ground_truth_text": "A woman and a men talking into a microphone as the waves are heard coming from the ocean."}
|
113 |
+
{"id": 11673, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A truck engine runs and a horn honks.", "ground_truth_text": "Motorcycle engine runs in idle followed by a horn beeping."}
|
114 |
+
{"id": 10565, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCaption this audio file for me, please. ", "generated_text": "A child laughing and music playing, followed by a child speaking.", "ground_truth_text": "Laughter followed by music and a child speaking."}
|
115 |
+
{"id": 10931, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you come up with a caption for this audio segment? ", "generated_text": "A man speaks followed by an explosion and a fire burning.", "ground_truth_text": "Someone speaks then an explosion occurs."}
|
116 |
+
{"id": 11445, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A toilet is flushed and water is running.", "ground_truth_text": "A toilet flushing followed by a door slamming open."}
|
117 |
+
{"id": 10586, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWhat caption would you suggest for this audio? ", "generated_text": "A helicopter is flying nearby while a man and a woman are talking.", "ground_truth_text": "A man talking in the background as a vehicle horn honks in the distance followed by a faint emergency siren going off and another man talking in the foreground as wind moderately blows into a microphone."}
|
118 |
+
{"id": 11989, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you provide a caption for this sound recording? ", "generated_text": "A man speaks while food is being cooked.", "ground_truth_text": "A man speaks followed by sizzling of food in a pan then he speaks again."}
|
119 |
+
{"id": 12214, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nHow would you caption this audio snippet? ", "generated_text": "A wind blows and a vehicle skids.", "ground_truth_text": "The wind is blowing, an engine runs, and tires squeal."}
|
120 |
+
{"id": 12172, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nTranslate the essence of this audio into a caption. ", "generated_text": "A cat meows and people laugh.", "ground_truth_text": "A cat is caterwauling while several people laugh."}
|
121 |
+
{"id": 12179, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you provide a caption for this sound recording? ", "generated_text": "A train horn blows followed by a train whistle.", "ground_truth_text": "A large horn followed by a chime."}
|
122 |
+
{"id": 12219, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A cat meows and a child speaks.", "ground_truth_text": "An animal groans then a child speaks."}
|
123 |
+
{"id": 12547, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A person burps and then laughs.", "ground_truth_text": "People laughing with something snoring."}
|
124 |
+
{"id": 11984, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you draft a caption for this audio recording? ", "generated_text": "A man speaks followed by a loud explosion and people screaming.", "ground_truth_text": "A man speaks followed by explosions and crashing with others speaking and screaming."}
|
125 |
+
{"id": 12276, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A sheep bleats, then a man speaks.", "ground_truth_text": "Goat bleating followed by a man speaking."}
|
126 |
+
{"id": 12536, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nPlease suggest a caption for the audio I've shared. ", "generated_text": "A woman is wailing and people are cheering.", "ground_truth_text": "A slightly, muffled cat meowing is followed by people laughing and loud applause."}
|
127 |
+
{"id": 12311, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A man speaks followed by a hiss of air.", "ground_truth_text": "A man speaking followed by faucet water flowing and hitting a metallic surface."}
|
128 |
+
{"id": 12989, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nTranslate the essence of this audio into a caption. ", "generated_text": "A horse neighs and people talk.", "ground_truth_text": "Sheep bleat as a man laughs and a woman speaks while people talking in the background."}
|
129 |
+
{"id": 12901, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you provide a caption for this sound recording? ", "generated_text": "A man speaks while a horse neighs.", "ground_truth_text": "Bees are buzzing as a man speaks followed by a woman speaking."}
|
130 |
+
{"id": 13231, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nI need a caption for this piece of audio; can you help? ", "generated_text": "A river is flowing and a man speaks.", "ground_truth_text": "A flowing stream then a man speaks."}
|
131 |
+
{"id": 13085, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCraft a caption that encapsulates this audio. ", "generated_text": "A clock ticking followed by a whistle blowing.", "ground_truth_text": "Opening clatter with soft quite bees buzzing."}
|
132 |
+
{"id": 13354, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nHow would you caption this audio snippet? ", "generated_text": "A train whistle blows followed by people talking.", "ground_truth_text": "Hissing with some rustling and people speaking followed by a train whistle blowing."}
|
133 |
+
{"id": 13228, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nKindly generate a caption for the following audio. ", "generated_text": "A vehicle is moving fast and people are cheering.", "ground_truth_text": "A vehicle is driving by while people are shouting."}
|
134 |
+
{"id": 13431, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nDevise a caption that matches the theme of this audio. ", "generated_text": "A child is crying and a woman is speaking.", "ground_truth_text": "A child cries and yells and an adult speaks in response."}
|
135 |
+
{"id": 13080, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A man speaking followed by a woman speaking and a hissing sound.", "ground_truth_text": "People talk nearby as a sprayer sprays liquid, and then a machine hums in the distance."}
|
136 |
+
{"id": 13378, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A man speaks followed by a large explosion and people laughing.", "ground_truth_text": "A loud burst followed by men speaking and laughing."}
|
137 |
+
{"id": 13473, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A horn honks followed by a man speaking.", "ground_truth_text": "Vehicle horn followed by man talking."}
|
138 |
+
{"id": 13855, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nKindly generate a caption for the following audio. ", "generated_text": "A man talks and whistles.", "ground_truth_text": "A woman is speaking then whistles."}
|
139 |
+
{"id": 13332, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCraft a caption that encapsulates this audio. ", "generated_text": "A car engine revs up, a woman screams, and a man speaks.", "ground_truth_text": "A high pitched whine with animals bleating and a person talking."}
|
140 |
+
{"id": 13951, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCreate a caption that summarizes this audio. ", "generated_text": "A cat meows and a child speaks.", "ground_truth_text": "An animal groans then a child speaks."}
|
141 |
+
{"id": 14057, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nHow would you caption this audio snippet? ", "generated_text": "A baby is crying and laughing.", "ground_truth_text": "Screaming followed by goat noises."}
|
142 |
+
{"id": 13970, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCreate a caption that summarizes this audio. ", "generated_text": "A woman is speaking while a train is moving nearby.", "ground_truth_text": "Steam hisses nearby as many people talk."}
|
143 |
+
{"id": 13591, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCould you come up with a caption for this audio segment? ", "generated_text": "A group of people are talking and laughing while a bird is chirping.", "ground_truth_text": "A crowd is talking and horse neighs a couple of times."}
|
144 |
+
{"id": 14312, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCreate a caption that summarizes this audio. ", "generated_text": "A man talks while a clock ticks.", "ground_truth_text": "A man is speaking while birds chirp in the background."}
|
145 |
+
{"id": 14716, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nGenerate an audio caption from this sound file. ", "generated_text": "A horn honks twice.", "ground_truth_text": "A car horn honks three times as birds chirp in the distance."}
|
146 |
+
{"id": 14556, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nWould you generate a caption based on this audio? ", "generated_text": "A man speaks and a whistle blows.", "ground_truth_text": "A person talking with chime sound and a person whistling."}
|
147 |
+
{"id": 15009, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A train blows its horn and passes by.", "ground_truth_text": "A toy helicopter starting up as wind blows moderately into a microphone."}
|
148 |
+
{"id": 14268, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nCan you formulate a caption for the given audio piece?", "generated_text": "A man speaks and laughs while a baby laughs and a man snores.", "ground_truth_text": "A man singing before laughing followed by a goat baaing then snorting a few times as a dog barks in the background."}
|
149 |
+
{"id": 14657, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nListen and generate a caption for the provided audio. ", "generated_text": "A woman speaks and a child speaks while paper crinkles.", "ground_truth_text": "A woman talks nearby, and then a child speaks as paper crinkles."}
|
150 |
+
{"id": 14989, "lang_q": "en", "lang_g": "en", "lang_o": "en", "original_question": "<audio>\nDevise a caption that matches the theme of this audio. ", "generated_text": "A large engine is running and then a small engine starts up.", "ground_truth_text": "A soft whirring sound."}
|
test_1/1.txt
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
qweqw
|
|
|
|