{
  "Y0SSy52rc1BM.wav": {
    "caption": "A female singer performs a melodic song accompanied by music while a crowd joyfully sings along in a lively environment.",
    "timestamp_events": "['(Choir-0.0-1.932)', '(Music-0.0-10.0)', '(Hubbub, speech noise, speech babble-0.0-10.0)', '(Choir-3.092-10.0)']"
  },
  "YbkG4M4TiXZg.wav": {
    "caption": "A man speaks while a power tool revs up, indicating a speech event followed by the sound of a chainsaw.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.268)', '(Chainsaw-0.0-10.0)', '(Male speech, man speaking-1.772-4.425)', '(Male speech, man speaking-5.008-8.118)', '(Bird vocalization, bird call, bird song-5.362-7.512)', '(Bird vocalization, bird call, bird song-8.244-8.709)', '(Bird vocalization, bird call, bird song-8.937-9.283)', '(Male speech, man speaking-9.661-10.0)']"
  },
  "Y6fRYeClf5U4.wav": {
    "caption": "A woman delivers a speech while a crowd of people engage in conversation in an urban setting.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Wind-0.008-10.0)', '(Female speech, woman speaking-0.074-1.65)', '(Female speech, woman speaking-2.879-5.427)', '(Female speech, woman speaking-5.604-6.083)', '(Female speech, woman speaking-6.9-10.0)']"
  },
  "YAjOUP6RJMZw.wav": {
    "caption": "A man delivers a speech while a crowd cheers, with children shouting intermittently, creating a lively atmosphere.",
    "timestamp_events": "['(Laughter-0.0-10.0)', '(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Male speech, man speaking-0.0-10.0)']"
  },
  "YCoBAR5Mbjys.wav": {
    "caption": "The clock ticks steadily as soft music plays in the background, creating a calming atmosphere in a cozy living room.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Alarm clock-0.008-10.0)', '(Tick-0.386-0.583)', '(Tick-1.071-1.22)', '(Tick-1.764-1.906)', '(Tick-2.465-2.638)', '(Tick-3.197-3.331)', '(Tick-3.772-3.976)', '(Tick-4.346-4.48)', '(Tick-4.646-4.787)', '(Tick-5.087-5.22)', '(Tick-5.669-5.795)', '(Tick-6.031-6.15)', '(Tick-6.37-6.528)', '(Tick-6.724-6.795)', '(Tick-6.969-7.118)', '(Tick-7.386-7.614)', '(Tick-8.134-8.354)', '(Tick-8.882-9.094)', '(Tick-9.315-9.425)', '(Tick-9.575-9.685)']"
  },
  "Y3IbsuhsbHs8.wav": {
    "caption": "People laughing and talking in a large room or hall, with occasional snickers and speech heard.",
    "timestamp_events": "['(Human sounds-0.0-0.436)', '(Background noise-0.0-10.0)', '(Laughter-0.309-1.053)', '(Female speech, woman speaking-0.971-3.913)', '(Laughter-1.934-3.461)', '(Laughter-3.943-4.936)', '(Female speech, woman speaking-4.695-6.862)', '(Breathing-5.315-5.619)', '(Laughter-6.464-8.894)', '(Female speech, woman speaking-7.165-8.63)', '(Female speech, woman speaking-8.894-10.0)']"
  },
  "Y1AH6zC7l3bA.wav": {
    "caption": "Metal clanks as a man speaks in the background, suggesting a workshop environment with ongoing hammering and train passing by.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Female speech, woman speaking-0.016-0.535)', '(Generic impact sounds-0.228-0.709)', '(Generic impact sounds-0.898-0.969)', '(Female speech, woman speaking-0.913-1.449)', '(Generic impact sounds-1.693-2.213)', '(Generic impact sounds-2.732-3.283)', '(Generic impact sounds-3.535-4.189)', '(Generic impact sounds-4.362-4.465)', '(Female speech, woman speaking-4.669-5.354)', '(Generic impact sounds-4.976-5.173)', '(Female speech, woman speaking-5.457-6.102)', '(Generic impact sounds-5.764-6.213)', '(Thump, thud-6.307-6.48)', '(Generic impact sounds-6.906-7.118)', '(Generic impact sounds-7.756-8.11)', '(Generic impact sounds-8.378-8.575)', '(Female speech, woman speaking-8.858-10.0)', '(Generic impact sounds-8.937-9.26)']"
  },
  "Y9SFitaVFvAA.wav": {
    "caption": "Rapid gunfire echoes through a large indoor space, followed by a man speaking in the midst of music playing.",
    "timestamp_events": "['(Video game sound-0.0-10.0)', '(Fusillade-0.15-0.312)', '(Fusillade-0.555-0.752)', '(Fusillade-0.816-1.845)', '(Fusillade-1.995-2.661)', '(Fusillade-2.846-3.684)', '(Fusillade-3.881-4.743)', '(Fusillade-4.997-6.339)', '(Male speech, man speaking-6.298-8.699)', '(Fusillade-6.576-6.738)', '(Fusillade-6.883-7.079)', '(Fusillade-7.195-7.357)', '(Fusillade-7.49-7.617)', '(Fusillade-7.75-7.929)', '(Fusillade-8.045-8.196)', '(Fusillade-8.323-8.45)', '(Fusillade-8.595-8.757)', '(Fusillade-8.907-9.051)', '(Fusillade-9.167-10.0)']"
  },
  "Y6SvDRiIG2NY.wav": {
    "caption": "A group of people sing and harmonize, creating vocal music with occasional beatboxing, in a room with a piano.",
    "timestamp_events": "['(Male singing-0.0-6.594)', '(Music-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Breathing-7.064-8.314)', '(Breathing-8.911-10.0)', '(Male singing-9.713-10.0)']"
  },
  "Y2YV1ueymy4Y.wav": {
    "caption": "A jingle bell tinkles softly as a man sings and music plays in a room.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Jingle, tinkle-0.0-10.0)', '(Male singing-0.582-1.492)', '(Male singing-2.849-3.531)', '(Male singing-5.196-6.139)', '(Male singing-7.503-8.316)', '(Male singing-8.633-10.0)']"
  },
  "YbEhD9zFO8BE.wav": {
    "caption": "A flock of pigeons coo and flap their wings, creating a soothing ambiance in a serene outdoor environment.",
    "timestamp_events": "['(Tick-0.0-0.214)', '(Rustle-0.0-10.0)', '(Tick-0.418-0.612)', '(Coo-0.827-2.031)', '(Generic impact sounds-2.149-2.536)', '(Coo-2.708-7.16)', '(Generic impact sounds-3.44-4.042)', '(Generic impact sounds-4.295-4.555)', '(Generic impact sounds-4.815-5.066)', '(Generic impact sounds-5.591-5.859)', '(Coo-7.622-9.999)', '(Generic impact sounds-7.762-7.977)', '(Generic impact sounds-9.835-10.0)']"
  },
  "Y-c2GLPjL6Sg.wav": {
    "caption": "A man speaks while running, amidst the energetic cheers of a crowd, in a stadium during a race.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Shout-0.0-10.0)', '(Background noise-0.0-10.0)', '(Clapping-0.275-3.358)', '(Human voice-3.304-4.636)', '(Clapping-4.457-10.0)', '(Human voice-6.933-8.925)']"
  },
  "Y6N3CTf5fqYI.wav": {
    "caption": "A man confidently delivers a speech, eliciting applause from the crowd gathered in an indoor theater.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Male speech, man speaking-0.395-1.756)', '(Male speech, man speaking-2.217-3.591)', '(Male speech, man speaking-3.928-4.258)', '(Male speech, man speaking-4.416-5.22)', '(Male speech, man speaking-5.433-7.241)', '(Clapping-7.261-7.412)', '(Clapping-7.55-7.722)', '(Clapping-7.825-10.0)']"
  },
  "Y0HW0akGNCLk.wav": {
    "caption": "A man speaks followed by a door opening as a cash register rings, indicating a transaction in a store.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.718)', '(Background noise-0.0-10.0)', '(Male speech, man speaking-2.097-3.502)', '(Tap-3.358-3.461)', '(Tap-3.771-3.915)', '(Male speech, man speaking-4.287-5.362)', '(Tap-4.735-4.824)', '(Cash register-4.859-5.341)', '(Cash register-5.458-7.077)', '(Tap-6.677-6.767)', '(Tap-6.911-7.049)', '(Male speech, man speaking-6.966-9.012)', '(Tap-9.329-9.487)']"
  },
  "YCBibl5506Lw.wav": {
    "caption": "A boat engine idles while people converse in the background, creating a bustling atmosphere.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.827)', '(Boat, Water vehicle-0.0-10.0)', '(Idling-0.0-10.0)', '(Conversation-0.079-8.976)', '(Female speech, woman speaking-1.575-1.858)', '(Male speech, man speaking-1.937-2.252)', '(Male speech, man speaking-3.575-4.598)', '(Male speech, man speaking-5.134-5.764)', '(Male speech, man speaking-6.22-7.11)', '(Male speech, man speaking-8.157-8.858)']"
  },
  "YbJvOp4gmHBg.wav": {
    "caption": "Gunshots and artillery fire echo through the air as music plays during a military parade at a raceway.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Generic impact sounds-0.166-0.307)', '(Artillery fire-0.32-0.704)', '(Generic impact sounds-0.781-0.948)', '(Generic impact sounds-1.063-1.165)', '(Generic impact sounds-1.524-1.677)', '(Generic impact sounds-2.625-2.881)', '(Artillery fire-3.035-3.521)', '(Generic impact sounds-3.611-3.777)', '(Generic impact sounds-4.213-4.43)', '(Generic impact sounds-5.096-5.262)', '(Artillery fire-5.288-5.762)', '(Generic impact sounds-5.89-6.095)', '(Generic impact sounds-6.479-6.812)', '(Generic impact sounds-6.94-7.106)', '(Artillery fire-7.222-7.606)', '(Generic impact sounds-8.207-8.425)', '(Artillery fire-8.476-8.988)', '(Generic impact sounds-9.206-9.385)', '(Generic impact sounds-9.654-9.795)']"
  },
  "Y4nw3UiN65Y8.wav": {
    "caption": "The train hisses as a man speaks in the background, indicating a subway or metro station environment.",
    "timestamp_events": "['(Subway, metro, underground-0.0-10.0)', '(Male speech, man speaking-0.852-1.983)', '(Radio-0.894-2.011)', '(Radio-2.709-3.631)', '(Male speech, man speaking-2.751-3.631)']"
  },
  "YAaeemnJDijQ.wav": {
    "caption": "A man speaks while using an electric shaver, creating a buzzing sound in a small room.",
    "timestamp_events": "['(Electric shaver, electric razor-0.0-0.647)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.623-2.629)', '(Male speech, man speaking-1.364-1.849)', '(Male speech, man speaking-2.662-4.701)', '(Generic impact sounds-2.8-2.962)', '(Electric shaver, electric razor-3.921-10.0)', '(Male speech, man speaking-5.521-7.057)', '(Surface contact-7.284-9.819)']"
  },
  "Y0pcV5rYkDHI.wav": {
    "caption": "A man speaks while an industrial cage whirrs in the background, possibly in a open lot.",
    "timestamp_events": "['(Male speech, man speaking-0.0-5.309)', '(Wind-0.0-10.0)', '(Water-0.0-10.0)', '(Boiling-0.0-10.0)', '(Male speech, man speaking-6.251-8.588)', '(Male speech, man speaking-9.385-10.0)']"
  },
  "Y0x6Zy66NEMc.wav": {
    "caption": "A crowd erupts with cheers and applause as a thumping sound fills the television studio, indicating an exciting event.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Human sounds-0.959-1.653)', '(Hubbub, speech noise, speech babble-2.107-3.309)', '(Breathing-4.601-5.117)', '(Glass chink, clink-5.9-6.21)', '(Hubbub, speech noise, speech babble-6.505-8.251)', '(Male singing-8.217-10.0)', '(Tap dance-9.392-10.0)']"
  },
  "YAdovQEX-Jco.wav": {
    "caption": "An aircraft engine roars with a high-pitched whine as an adult male speaks in the background, indicating the presence of a fixed-wing airplane.",
    "timestamp_events": "['(Aircraft engine-0.0-10.0)', '(Wind-0.0-10.0)', '(Video game sound-0.0-10.0)']"
  },
  "YAegX3TR1uJE.wav": {
    "caption": "Water splashes and gurgles as a pig, a domestic pet, enjoys itself in a watery environment, possibly a farm.",
    "timestamp_events": "['(Pig-0.0-10.0)', '(Rustle-0.0-10.0)', '(Mechanisms-0.0-10.0)']"
  },
  "Ya2TTI6qSzfE.wav": {
    "caption": "A man sings passionately as a crowd erupts in cheers and applause, creating a lively atmosphere in an entertainment center.",
    "timestamp_events": "['(Male singing-0.0-1.193)', '(Music-0.0-10.0)', '(Choir-1.386-2.542)', '(Male singing-2.708-4.741)', '(Choir-5.218-10.0)', '(Whoop-5.692-10.0)', '(Clapping-6.518-6.622)', '(Clapping-6.975-7.064)', '(Clapping-7.21-7.306)', '(Clapping-7.459-7.604)', '(Clapping-7.929-8.081)', '(Clapping-8.454-8.537)', '(Clapping-8.987-9.07)']"
  },
  "Y03nQvlxML6U.wav": {
    "caption": "A punk rock band performs on stage at a concert while loud rock music blares and someone screams.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Male singing-1.362-3.724)', '(Bellow-1.409-3.724)', '(Male singing-4.11-6.283)', '(Bellow-4.189-6.268)', '(Male singing-6.701-8.898)', '(Bellow-6.764-8.874)', '(Bellow-9.213-10.0)', '(Male singing-9.213-10.0)']"
  },
  "Y4vFHOgUKYvM.wav": {
    "caption": "A crowd gathers while music plays in the background, accompanied by people talking and shouting in excitement.",
    "timestamp_events": "['(Crowd-0.087-10.0)', '(Female speech, woman speaking-0.103-0.98)', '(Speech-1.061-1.728)', '(Music-1.728-10.0)', '(Female speech, woman speaking-2.467-3.019)', '(Speech-4.62-5.741)', '(Shout-5.724-9.258)']"
  },
  "YBshHvq-mgRA.wav": {
    "caption": "The crowd erupts in cheers as a man comments, accompanied by background music and occasional slamming sounds, in a wrestling ring.",
    "timestamp_events": "['(Whistling-0.0-1.031)', '(Crowd-0.0-10.0)', '(Cheering-0.0-10.0)', '(Shout-0.0-10.0)', '(Generic impact sounds-0.376-0.527)', '(Generic impact sounds-0.76-0.971)', '(Generic impact sounds-1.625-1.859)', '(Whistling-2.378-3.19)', '(Generic impact sounds-3.01-3.16)', '(Whack, thwack-3.725-4.041)', '(Whack, thwack-4.432-4.74)', '(Male speech, man speaking-4.868-5.418)', '(Whack, thwack-5.049-5.282)', '(Whack, thwack-5.568-5.801)', '(Male speech, man speaking-5.606-7.901)', '(Whack, thwack-6.102-6.328)', '(Generic impact sounds-8.277-8.397)', '(Generic impact sounds-8.623-8.796)', '(Whack, thwack-9.518-9.857)']"
  },
  "Y1zCIzIPLVec.wav": {
    "caption": "An remote controlled boat moving in circles while distant traffic noise fills the air near a lake along a busy road.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Traffic noise, roadway noise-0.0-10.0)', '(Mechanisms-2.753-6.773)', '(Mechanisms-8.284-10.0)']"
  },
  "YaZsaM0PNRns.wav": {
    "caption": "A crowd cheers and sings along to the music in a large hall, creating an energetic and lively atmosphere.",
    "timestamp_events": "['(Music-0.107-10.0)', '(Shout-0.168-1.096)', '(Shout-1.619-3.021)', '(Human voice-3.021-3.165)', '(Male singing-3.062-3.529)', '(Shout-3.412-4.691)', '(Male singing-3.756-4.56)', '(Male singing-5.158-6.107)', '(Screaming-6.519-7.034)', '(Male singing-7.323-8.045)', '(Screaming-7.619-8.375)', '(Male singing-8.354-10.0)', '(Human voice-8.588-9.199)']"
  },
  "Y1478ZIPwttc.wav": {
    "caption": "Raindrops hitting a car roof or window as the car accelerates.",
    "timestamp_events": "['(Sound effect-0.0-10.0)', '(Car-0.0-10.0)', '(Rain on surface-0.0-10.0)', '(Tick-1.495-1.617)', '(Tick-2.38-2.559)', '(Accelerating, revving, vroom-3.03-4.444)', '(Tick-3.615-3.769)', '(Tick-6.531-6.669)', '(Tick-6.978-7.124)', '(Tick-8.026-8.164)', '(Tick-9.838-9.935)']"
  },
  "Y4HfHRvLxQ8M.wav": {
    "caption": "A male singer performs a melodic tune accompanied by the sound of a bird whistling and singing in the background.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Bird vocalization, bird call, bird song-0.086-2.237)', '(Male singing-0.684-2.196)', '(Bird vocalization, bird call, bird song-2.588-3.392)', '(Male singing-2.938-6.746)', '(Bird vocalization, bird call, bird song-3.681-5.756)', '(Bird vocalization, bird call, bird song-5.9-6.979)', '(Bird vocalization, bird call, bird song-7.096-8.581)', '(Male singing-7.536-10.0)', '(Bird vocalization, bird call, bird song-8.849-9.736)']"
  },
  "Y3BTTvj5U8I8.wav": {
    "caption": "The crowd erupts in cheers as music plays and someone sings passionately on an urban outdoor stage.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Shout-6.646-10.0)', '(Female singing-0.0-10.0)']"
  },
  "Y0RB4tYbyU8k.wav": {
    "caption": "A car revs its tires and the sound of a choir singing can be heard in the background at a music event.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Background noise-0.0-10.0)', '(Choir-0.0-10.0)']"
  },
  "YaYjhl2nIB-A.wav": {
    "caption": "A crowd of people talking and a horse trotting can be heard at a football field where a group of people play brass instruments.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Walk, footsteps-0.0-10.0)', '(Hubbub, speech noise, speech babble-0.0-10.0)']"
  },
  "Yax4-MpbbMtc.wav": {
    "caption": "Clanking cutlery and dishes can be heard as a man speaks, suggesting a busy kitchen environment.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Male speech, man speaking-0.015-0.958)', '(Generic impact sounds-1.143-1.24)', '(Generic impact sounds-1.614-1.744)', '(Male speech, man speaking-2.283-4.072)', '(Generic impact sounds-4.278-4.392)', '(Male speech, man speaking-5.206-6.304)', '(Generic impact sounds-6.943-7.373)', '(Generic impact sounds-7.471-7.512)', '(Generic impact sounds-7.609-7.69)', '(Generic impact sounds-7.836-9.022)', '(Male speech, man speaking-9.021-10.0)']"
  },
  "Y6XFQxLLEYvg.wav": {
    "caption": "Violin music fills the air as a crowd gathers in a plaza, creating a lively and musical atmosphere.",
    "timestamp_events": "['(Male singing-0.0-1.844)', '(Wind-0.0-10.0)', '(Music-0.0-10.0)', '(Male singing-2.304-9.483)']"
  },
  "Ya6QXF6WhVEY.wav": {
    "caption": "A man speaks amidst the buzzing of bees indicating a conversation in an apiary.",
    "timestamp_events": "['(Buzz-0.0-10.0)', '(Male speech, man speaking-0.094-2.496)', '(Cricket-0.504-0.701)', '(Cricket-2.134-3.094)', '(Male speech, man speaking-3.291-4.803)', '(Cricket-3.299-4.22)', '(Tick-4.181-4.307)', '(Cricket-4.339-4.709)', '(Tick-4.795-4.882)', '(Cricket-5.039-5.197)', '(Cricket-5.346-5.528)', '(Cricket-5.638-5.803)', '(Cricket-5.937-6.748)', '(Cricket-6.937-7.094)', '(Male speech, man speaking-7.197-8.78)', '(Cricket-7.244-8.339)', '(Cricket-8.598-8.992)', '(Male speech, man speaking-8.913-9.299)', '(Cricket-9.693-9.89)']"
  },
  "Y0poMyUX8Jvk.wav": {
    "caption": "The sounds of fireworks bursting and people chatting and celebrating.",
    "timestamp_events": "['(Firecracker-0.0-10.0)', '(Wind-0.0-10.0)', '(Crowd-0.0-10.0)']"
  },
  "Y993A2y5lv-s.wav": {
    "caption": "A bird chirps and tweets in the background as it vocalizes its song in a natural outdoor environment.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Television-0.0-10.0)', '(Chirp, tweet-0.253-0.688)', '(Chirp, tweet-0.875-1.124)', '(Chirp, tweet-1.228-1.815)', '(Chirp, tweet-2.161-2.493)', '(Chirp, tweet-2.583-2.853)', '(Chirp, tweet-3.053-3.925)', '(Chirp, tweet-4.091-4.506)', '(Chirp, tweet-4.679-4.948)', '(Chirp, tweet-5.488-6.456)', '(Chirp, tweet-6.56-6.836)', '(Chirp, tweet-6.981-7.68)', '(Chirp, tweet-7.908-8.904)', '(Chirp, tweet-9.713-10.0)']"
  },
  "Y2p0Qerx4CXs.wav": {
    "caption": "A woman engages with a baby in a room, eliciting joyful laughter from the baby, while a man's voice emanates from the television in the background, adding to the cheerful ambiance.",
    "timestamp_events": "['(Baby laughter-0.0-0.418)', '(Male speech, man speaking-0.0-4.096)', '(Television-0.0-9.412)', '(Mechanisms-0.0-9.412)', '(Breathing-0.455-0.837)', '(Baby laughter-0.673-2.51)', '(Laughter-2.537-2.946)', '(Breathing-3.001-3.419)', '(Baby laughter-3.31-5.329)', '(Human sounds-3.392-3.904)', '(Male speech, man speaking-4.374-6.957)', '(Human sounds-4.501-4.822)', '(Breathing-5.356-5.729)', '(Human sounds-5.801-6.29)', '(Baby laughter-5.829-7.502)', '(Human sounds-6.909-7.299)', '(Breathing-6.909-7.391)', '(Male speech, man speaking-7.566-9.412)', '(Breathing-7.584-8.539)', '(Baby laughter-8.675-9.412)', '(Human sounds-8.748-9.195)']"
  },
  "Y5U-ynroFS5c.wav": {
    "caption": "Water splashes as a child's voice is heard, accompanied by a soothing melody, creating a serene ambiance by a stream.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Water-0.0-10.0)', '(Female speech, woman speaking-0.89-1.48)', '(Conversation-0.968-9.492)', '(Female speech, woman speaking-2.654-3.433)', '(Female speech, woman speaking-3.583-4.425)', '(Female speech, woman speaking-5.213-5.772)', '(Female speech, woman speaking-6.339-6.858)', '(Female speech, woman speaking-7.693-9.575)']"
  },
  "YBeuw9qGEm1Y.wav": {
    "caption": "Quick succession of \"boing\" sounds followed by thunder and rain falling on a hard surface as a musical chime rings out, creating a peaceful ambiance in an outdoor setting.",
    "timestamp_events": "['(Sound effect-0.09-3.496)', '(Boing-0.464-0.691)', '(Boing-1.591-2.251)', '(Rain-2.996-7.222)', '(Thunder-4.648-5.98)', '(Sound effect-7.209-7.836)', '(Music-7.209-10.0)', '(Sound effect-8.271-8.886)', '(Sound effect-9.334-10.0)']"
  },
  "Y84Ti19rdxwQ.wav": {
    "caption": "Birds chirp as a cricket hums softly, creating a peaceful ambiance in a natural outdoor setting.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.903)', '(Cricket-0.0-7.431)', '(Male speech, man speaking-1.082-2.244)', '(Music-1.919-10.0)', '(Male speech, man speaking-4.651-5.674)', '(Male speech, man speaking-5.986-7.376)']"
  },
  "Y9GzIjpH58gw.wav": {
    "caption": "A group of people singing with music playing in the background, while children shout in a crowded place and firecrackers burst.",
    "timestamp_events": "['(Firecracker-0.0-10.0)', '(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Shout-0.0-10.0)']"
  },
  "Y64AHuTLREwA.wav": {
    "caption": "Several different beeps go off as a smoke detector and fire alarm sound in a room.",
    "timestamp_events": "['(Background noise-0.0-3.186)', '(Fire alarm-0.022-0.808)', '(Door-0.434-0.733)', '(Door-0.823-1.085)', '(Fire alarm-1.047-1.892)', '(Walk, footsteps-1.122-1.436)', '(Walk, footsteps-1.653-1.803)', '(Walk, footsteps-1.87-2.027)', '(Fire alarm-2.042-2.984)', '(Walk, footsteps-2.094-2.311)', '(Walk, footsteps-2.603-2.767)', '(Walk, footsteps-3.029-3.179)', '(Background noise-3.964-6.971)', '(Walk, footsteps-4.039-4.271)', '(Fire alarm-4.069-5.004)', '(Walk, footsteps-4.338-4.488)', '(Walk, footsteps-4.577-4.929)', '(Walk, footsteps-5.019-5.161)', '(Fire alarm-5.079-5.999)', '(Walk, footsteps-5.916-6.215)', '(Fire alarm-6.103-6.926)', '(Door-6.806-6.993)', '(Door-7.652-7.816)', '(Background noise-7.681-10.0)', '(Walk, footsteps-7.952-8.029)', '(Fire alarm-8.085-9.065)', '(Walk, footsteps-8.309-8.473)', '(Fire alarm-9.132-10.0)']"
  },
  "Y0TyHc67BhZo.wav": {
    "caption": "The whistle sound after the man's speech adds a playful and light tone to the atmosphere.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Male speech, man speaking-0.955-1.875)', '(Breathing-2.06-2.562)', '(Whistle-2.699-6.016)', '(Male speech, man speaking-6.944-8.132)', '(Breathing-8.132-8.812)', '(Whistle-8.88-10.0)']"
  },
  "Y0npckTh3OiE.wav": {
    "caption": "A man speaks on stage as a crowd applauds in a discotheque, creating a lively and energetic atmosphere.",
    "timestamp_events": "['(Hubbub, speech noise, speech babble-0.0-10.0)', '(Male speech, man speaking-0.0-2.348)', '(Applause-0.012-2.267)', '(Applause-2.371-2.568)', '(Female speech, woman speaking-2.47-3.181)', '(Applause-2.689-2.886)', '(Male speech, man speaking-3.123-4.014)', '(Male speech, man speaking-4.135-6.021)', '(Applause-4.245-4.332)', '(Applause-4.407-4.864)', '(Applause-5.934-6.027)', '(Applause-6.113-6.246)', '(Male speech, man speaking-6.137-6.836)', '(Applause-6.298-6.414)', '(Applause-6.478-10.0)', '(Male speech, man speaking-6.917-7.183)', '(Male speech, man speaking-7.618-7.843)', '(Male speech, man speaking-8.3-8.525)', '(Male speech, man speaking-8.901-9.433)', '(Male speech, man speaking-9.607-10.0)']"
  },
  "Y9FfGXUqa4K4.wav": {
    "caption": "A man speaks through a loudspeaker as a crowd cheers in the background at a raceway.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Background noise-0.0-10.0)', '(Male speech, man speaking-0.008-1.497)', '(Male speech, man speaking-1.798-4.944)', '(Male speech, man speaking-5.335-6.072)', '(Shout-5.372-6.065)', '(Male speech, man speaking-6.351-7.065)', '(Shout-6.373-7.028)', '(Shout-7.276-7.953)', '(Male speech, man speaking-7.306-7.878)', '(Male speech, man speaking-8.202-8.849)', '(Shout-8.284-8.894)', '(Shout-9.157-9.744)', '(Male speech, man speaking-9.157-9.759)']"
  },
  "Y6CMZKs7K1xU.wav": {
    "caption": "A horse neighs as a man speaks, creating a mix of music, shuffle, and speech in a countryside setting.",
    "timestamp_events": "['(Shuffle-0.0-10.0)', '(Background noise-0.0-10.0)', '(Male speech, man speaking-5.887-6.217)', '(Male speech, man speaking-6.938-7.88)', '(Male speech, man speaking-8.21-8.608)', '(Male speech, man speaking-9.138-9.639)']"
  },
  "Y1dOxolAu32w.wav": {
    "caption": "A man speaks while music plays in the background, accompanied by the sound of a barking dog.",
    "timestamp_events": "['(Male singing-0.0-3.09)', '(Music-0.0-10.0)', '(Howl-0.574-1.656)', '(Male speech, man speaking-2.099-3.364)', '(Male singing-3.585-5.267)', '(Howl-3.729-5.515)', '(Male speech, man speaking-5.815-6.949)', '(Male singing-5.815-7.718)', '(Howl-7.679-8.983)', '(Male singing-8.123-10.0)']"
  },
  "Y3Xmm3QTRrfw.wav": {
    "caption": "A car speeds by as the sound of a vehicle passing on a race track can be heard.",
    "timestamp_events": "['(Tire squeal, skidding-0.0-0.485)', '(Accelerating, revving, vroom-0.0-0.582)', '(Car-0.0-10.0)', '(Accelerating, revving, vroom-0.883-1.906)', '(Accelerating, revving, vroom-2.491-3.921)', '(Tire squeal, skidding-2.792-4.376)', '(Accelerating, revving, vroom-5.326-6.033)', '(Accelerating, revving, vroom-7.243-10.0)']"
  },
  "Y5pHPou2UR28.wav": {
    "caption": "A man speaks while a car engine runs, creating a background noise in the car interior.",
    "timestamp_events": "['(Generic impact sounds-0.0-0.258)', '(Mechanisms-0.0-10.0)', '(Male speech, man speaking-1.55-2.952)', '(Generic impact sounds-2.897-6.278)', '(Male speech, man speaking-7.014-9.062)']"
  },
  "Y7lRn3df0hiU.wav": {
    "caption": "A dog growls and barks while a man speaks in a domestic setting.",
    "timestamp_events": "['(Growling-0.0-1.818)', '(Mechanisms-0.0-10.0)', '(Growling-2.572-4.277)', '(Growling-4.443-4.789)', '(Human voice-4.969-5.562)', '(Growling-5.684-6.342)', '(Yip-6.312-7.029)', '(Yip-7.708-8.259)', '(Human voice-7.763-8.291)', '(Growling-8.143-9.193)', '(Laughter-8.454-8.73)', '(Yip-9.181-9.898)', '(Human voice-9.217-9.884)']"
  },
  "Y18PPxEB6Cb4.wav": {
    "caption": "A boat motor roars as waves crash and the ocean gurgles, indicating the audio event of a motorboat speeding on water.",
    "timestamp_events": "['(Motorboat, speedboat-0.0-10.0)', '(Accelerating, revving, vroom-0.0-10.0)', '(Water-0.0-10.0)', '(Generic impact sounds-2.164-2.387)', '(Generic impact sounds-3.478-3.662)', '(Tick-4.696-4.831)', '(Generic impact sounds-6.85-7.14)', '(Generic impact sounds-7.353-8.841)', '(Generic impact sounds-9.217-9.459)']"
  },
  "Y057il3kuCBs.wav": {
    "caption": "Water runs from a faucet as a man speaks, creating a soothing audio in a bathroom.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.642)', '(Washing machine-0.0-10.0)', '(Water-0.0-10.0)', '(Male speech, man speaking-1.271-5.447)', '(Male speech, man speaking-6.006-7.696)', '(Male speech, man speaking-8.045-10.0)']"
  },
  "Y91WlRTPwZ-U.wav": {
    "caption": "A woman delivers a speech on stage, her voice clear and confident, captivating the audience's attention.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-0.582)', '(Wind-0.0-10.0)', '(Hubbub, speech noise, speech babble-0.0-10.0)', '(Female speech, woman speaking-1.061-2.491)', '(Female speech, woman speaking-2.832-5.562)', '(Female speech, woman speaking-5.936-7.154)', '(Female speech, woman speaking-8.186-9.421)', '(Female speech, woman speaking-9.68-10.0)']"
  },
  "Y9lICP7L-TGc.wav": {
    "caption": "A man yells, followed by an explosion, and another man screams in a museum, creating a whack and thwack audio event.",
    "timestamp_events": "['(Human voice-0.0-0.149)', '(Video game sound-0.0-3.219)', '(Sound effect-0.0-3.219)', '(Human voice-0.46-2.106)', '(Human voice-2.431-2.763)', '(Video game sound-4.174-8.302)', '(Human voice-4.181-4.43)', '(Sound effect-4.381-8.302)', '(Human voice-4.927-5.377)', '(Human voice-5.944-7.037)']"
  },
  "Y9svHQT4uKYQ.wav": {
    "caption": "A train horn blares repeatedly as a train passes by, indicating the presence of rail transport in the audio.",
    "timestamp_events": "['(Train-0.107-3.825)', '(Train horn-0.258-3.165)', '(Background noise-3.887-10.0)', '(Generic impact sounds-4.065-4.354)', '(Generic impact sounds-4.498-5.186)', '(Train horn-5.144-6.107)', '(Generic impact sounds-6.313-6.815)', '(Generic impact sounds-7.014-7.323)', '(Train horn-7.323-8.272)', '(Generic impact sounds-8.505-8.897)', '(Train horn-8.959-9.928)']"
  },
  "Y4Av-qsIIncg.wav": {
    "caption": "The sound of a vehicle starting up is followed by a door closing, suggesting that someone is getting into a car.",
    "timestamp_events": "['(Sliding door-0.0-1.708)', '(Wind-0.0-10.0)', '(Generic impact sounds-0.715-1.016)', '(Sliding door-1.949-3.055)', '(Generic impact sounds-3.356-4.169)', '(Sliding door-3.356-5.508)', '(Generic impact sounds-5.26-5.508)', '(Generic impact sounds-5.643-5.869)', '(Sliding door-5.658-8.503)', '(Generic impact sounds-7.028-7.276)', '(Generic impact sounds-7.72-8.367)', '(Generic impact sounds-9.406-9.669)', '(Generic impact sounds-9.925-10.0)']"
  },
  "Y7L1XpYRlyN0.wav": {
    "caption": "Dogs bark and people laugh as music plays in the background, creating a lively atmosphere at a gathering.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Bark-0.217-0.428)', '(Bark-0.509-0.706)', '(Bark-1.12-1.317)', '(Bark-1.419-1.636)', '(Bark-1.738-1.921)', '(Laughter-2.003-3.401)', '(Bark-2.111-2.315)', '(Bark-2.451-2.655)', '(Bark-3.157-3.347)', '(Bark-3.442-3.659)', '(Laughter-3.632-5.031)', '(Bark-3.802-4.012)', '(Bark-4.121-4.325)', '(Laughter-5.194-10.0)', '(Bark-7.882-8.079)', '(Bark-8.344-8.486)', '(Bark-8.629-8.805)', '(Bark-9.199-10.0)']"
  },
  "Y9a8eza-EovA.wav": {
    "caption": "A group of people in a crowded room shout battle cries, creating a lively and energetic atmosphere.",
    "timestamp_events": "['(Battle cry-0.0-1.096)', '(Background noise-0.0-10.0)', '(Crowd-0.0-10.0)', '(Battle cry-1.241-4.313)', '(Battle cry-4.505-5.165)', '(Battle cry-5.344-7.467)', '(Battle cry-7.66-10.0)']"
  },
  "Y3si70GDTyOs.wav": {
    "caption": "Music plays as a male singer performs while a crowd talks in the background in a lecture room.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Children shouting-1.646-4.685)', '(Children shouting-4.847-10.0)', '(Male singing-7.341-10.0)']"
  },
  "Ynf3jIDNiDcM.wav": {
    "caption": "A steam train engine chugs along the railroad tracks, followed by a loud train whistle blowing in a rural setting.",
    "timestamp_events": "['(Steam-0.0-10.0)', '(Train-0.0-10.0)', '(Steam whistle-6.204-8.348)']"
  },
  "Y6jUhJzJ7nes.wav": {
    "caption": "Emergency sirens blare as an ambulance and police car rush by, indicating a chaotic scene on the streets.",
    "timestamp_events": "['(Male singing-0.0-3.893)', '(Music-0.0-5.21)', '(Crowd-0.0-10.0)', '(Siren-5.013-10.0)', '(Male speech, man speaking-5.921-6.835)', '(Female speech, woman speaking-7.971-9.087)', '(Male speech, man speaking-9.299-10.0)']"
  },
  "Y253YvMHwUoc.wav": {
    "caption": "A man's speech is heard over rushing water, indicating that he is speaking while on a rowboat in a stream.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.903)', '(Wind-0.0-10.0)', '(Water-0.0-10.0)', '(Male speech, man speaking-2.29-4.068)', '(Male speech, man speaking-4.541-5.256)', '(Tick-5.691-5.797)', '(Male speech, man speaking-5.903-8.377)']"
  },
  "Y2S0b5wQu7Aw.wav": {
    "caption": "A man raps with music playing in the background, creating an energetic atmosphere in an urban setting.",
    "timestamp_events": "['(Female singing-0.0-0.338)', '(Music-0.0-10.0)', '(Female singing-1.488-4.077)', '(Male speech, man speaking-4.242-10.0)', '(Female singing-4.734-7.198)', '(Female singing-8.638-10.0)']"
  },
  "Y6w7s49SIVEs.wav": {
    "caption": "A woman sings while music plays in the background in a museum, creating a harmonious atmosphere.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Female singing-1.055-3.85)', '(Female singing-4.339-8.055)', '(Female singing-8.614-10.0)']"
  },
  "YCpZSkQqTxoI.wav": {
    "caption": "A man speaks while playing the guitar with music in the background inside a small room.",
    "timestamp_events": "['(Music-0.0-9.063)', '(Background noise-0.0-10.0)', '(Male speech, man speaking-1.181-2.543)', '(Male speech, man speaking-3.449-3.78)', '(Male speech, man speaking-4.205-5.291)', '(Male speech, man speaking-9.598-9.882)']"
  },
  "YnEahTzq1wQY.wav": {
    "caption": "A man passionately speaks as a crowd erupts in cheers, creating an electrifying atmosphere in a lively event.",
    "timestamp_events": "['(Clapping-0.0-0.128)', '(Male speech, man speaking-0.0-1.05)', '(Crowd-0.0-10.0)', '(Clapping-0.384-0.691)', '(Laughter-0.832-1.78)', '(Clapping-1.178-8.924)', '(Male speech, man speaking-1.216-2.945)', '(Whoop-2.843-4.187)', '(Whoop-4.392-5.48)', '(Whoop-5.659-6.722)', '(Human voice-6.825-7.426)', '(Male speech, man speaking-7.542-8.323)', '(Battle cry-8.207-8.656)', '(Male speech, man speaking-8.771-9.347)', '(Battle cry-9.245-10.0)']"
  },
  "Y4gCzqnMDAiY.wav": {
    "caption": "A man passionately delivers a speech while a crowd cheers in the background, creating an energetic atmosphere.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.744)', '(Background noise-0.0-10.0)', '(Clapping-1.947-6.732)', '(Male speech, man speaking-3.531-3.84)', '(Male speech, man speaking-4.392-5.789)', '(Male speech, man speaking-6.691-8.275)', '(Male speech, man speaking-8.698-10.0)']"
  },
  "YATJ15VUJy7A.wav": {
    "caption": "A crowd erupts in cheers and applause as someone delivers a speech in a lively event.",
    "timestamp_events": "['(Whistling-0.0-1.061)', '(Applause-0.0-10.0)', '(Crowd-0.0-10.0)', '(Run-0.0-10.0)', '(Shout-0.008-10.0)', '(Male speech, man speaking-0.655-2.287)', '(Whistling-1.385-1.61)', '(Whistling-2.461-2.686)', '(Male speech, man speaking-3.363-4.078)', '(Whistling-3.552-4.47)', '(Male speech, man speaking-4.457-4.831)', '(Male speech, man speaking-5.773-6.569)', '(Female speech, woman speaking-7.344-7.901)', '(Male speech, man speaking-8.202-8.548)', '(Whistling-8.486-9.031)', '(Whistling-9.356-9.737)']"
  },
  "Y94Bq4SKq5ik.wav": {
    "caption": "A bell rings softly as music plays in the background, creating a serene atmosphere in an orchestra pit.",
    "timestamp_events": "['(Choir-0.0-2.583)', '(Music-0.0-10.0)', '(Chime-1.726-7.044)']"
  },
  "YaFVdCDUdjqw.wav": {
    "caption": "A man narrates while a volcano erupts in the background.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.799)', '(Fire-0.0-10.0)', '(Wind-0.0-10.0)', '(Male speech, man speaking-1.54-2.182)', '(Male speech, man speaking-2.355-3.116)', '(Male speech, man speaking-4.575-5.052)', '(Male speech, man speaking-6.663-7.645)', '(Male speech, man speaking-7.832-8.994)', '(Male speech, man speaking-9.16-10.0)']"
  },
  "YBA4qayqjvGk.wav": {
    "caption": "Pigeons coo and flap their wings as bird vocalizations fill the air in an urban setting.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Vehicle-0.0-10.0)', '(Coo-0.094-0.638)', '(Rustle-0.244-0.717)', '(Bird vocalization, bird call, bird song-0.669-1.402)', '(Rustle-0.89-1.094)', '(Coo-1.126-2.488)', '(Bird vocalization, bird call, bird song-1.724-2.417)', '(Rustle-1.953-2.079)', '(Rustle-2.378-2.748)', '(Coo-2.626-2.935)', '(Vehicle horn, car horn, honking, toot-2.78-3.26)', '(Rustle-3.496-4.339)', '(Coo-3.661-10.0)', '(Bird vocalization, bird call, bird song-4.236-4.882)', '(Rustle-5.173-7.038)', '(Bird vocalization, bird call, bird song-6.63-7.252)', '(Rustle-7.22-7.646)', '(Rustle-7.858-8.031)', '(Bird vocalization, bird call, bird song-7.874-8.693)', '(Bird vocalization, bird call, bird song-9.488-10.0)']"
  },
  "Y-9wo95HMngI.wav": {
    "caption": "A male voice sings while a male voice joins in briefly, creating a harmonious melody in a dressing room.",
    "timestamp_events": "['(Male singing-0.0-1.342)', '(Background noise-0.0-10.0)', '(Breathing-1.376-2.179)', '(Male singing-1.858-4.541)', '(Breathing-3.005-3.876)', '(Breathing-4.14-4.931)', '(Male singing-4.759-6.571)', '(Male singing-6.686-7.592)', '(Breathing-6.812-7.5)', '(Breathing-7.706-7.97)', '(Male singing-7.97-10.0)']"
  },
  "Y0-lu3JkALFM.wav": {
    "caption": "A melodic tune with a woman singing softly accompanies the sound of a meowing cat in a playroom.",
    "timestamp_events": "['(Music-0.0-9.421)', '(Synthetic singing-0.0-9.421)', '(Mechanisms-0.0-9.421)']"
  },
  "YccHK041hfTw.wav": {
    "caption": "The sound of a door opening and closing is accompanied by faint squeaks, suggesting the presence of rodents, possibly in a veterinarian's office.",
    "timestamp_events": "['(Generic impact sounds-0.0-0.875)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-1.549-1.663)', '(Cat-2.329-5.716)', '(Generic impact sounds-3.109-3.247)', '(Generic impact sounds-5.814-6.78)', '(Cat-5.919-6.049)', '(Cat-7.024-7.471)', '(Cat-7.625-7.698)', '(Cat-7.95-8.275)', '(Cat-8.413-8.836)', '(Cat-8.998-9.104)', '(Cat-9.364-9.429)', '(Cat-9.575-10.0)']"
  },
  "YAUOcgHcIXFw.wav": {
    "caption": "A printing machine stops abruptly in a room followed by paper rustling.",
    "timestamp_events": "['(Printer-0.0-5.315)', '(Mechanisms-0.0-10.0)', '(Paper rustling-5.755-8.149)', '(Paper rustling-8.434-8.849)', '(Surface contact-8.89-9.346)', '(Surface contact-9.802-10.0)']"
  },
  "YCBYbC4rL5LQ.wav": {
    "caption": "An animal rustles through the undergrowth, capturing the essence of a wild animal's natural habitat.",
    "timestamp_events": "['(Rustle-0.0-2.764)', '(Rumble-0.0-10.0)', '(Animal-0.409-0.512)', '(Animal-0.717-0.929)', '(Animal-1.079-1.472)', '(Animal-2.543-2.677)', '(Animal-2.835-2.945)', '(Animal-3.079-3.228)', '(Animal-3.37-3.48)', '(Rustle-3.976-5.772)', '(Animal-4.094-4.252)', '(Animal-4.646-5.063)', '(Animal-5.276-5.575)', '(Animal-5.709-6.346)', '(Animal-6.52-7.039)', '(Rustle-6.63-10.0)', '(Animal-7.205-7.291)', '(Animal-7.496-7.591)', '(Animal-7.732-7.898)', '(Animal-8.213-8.378)', '(Animal-8.591-8.677)', '(Animal-9.142-9.228)', '(Animal-9.512-9.622)', '(Animal-9.803-9.882)']"
  },
  "Y8NNEbcu6tlw.wav": {
    "caption": "Water splashes and gurgles while a baby laughs in the background, suggesting washing in a bathtub.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Human voice-0.118-0.299)', '(Generic impact sounds-0.591-0.709)', '(Breathing-0.693-0.929)', '(Breathing-1.378-1.835)', '(Splash, splatter-2.094-7.165)', '(Generic impact sounds-2.102-3.016)', '(Generic impact sounds-3.213-3.465)', '(Generic impact sounds-4.409-4.614)', '(Generic impact sounds-4.835-5.669)', '(Human voice-5.898-6.37)', '(Generic impact sounds-6.465-6.85)', '(Baby laughter-6.827-7.213)', '(Breathing-7.252-7.48)', '(Baby laughter-7.472-8.433)', '(Water-7.866-9.346)', '(Generic impact sounds-8.142-8.299)', '(Human voice-8.606-9.244)', '(Generic impact sounds-8.953-9.315)', '(Generic impact sounds-9.898-9.984)']"
  },
  "YbPL19UIq0iA.wav": {
    "caption": "The sound of rattling and laughter fills the air as people speak, indicating a lively atmosphere, possibly in a social gathering or party.",
    "timestamp_events": "['(Music-0.0-9.157)', '(Hubbub, speech noise, speech babble-0.0-9.157)', '(Generic impact sounds-0.048-0.248)', '(Generic impact sounds-0.517-0.765)', '(Generic impact sounds-1.001-1.116)', '(Generic impact sounds-1.44-1.633)', '(Generic impact sounds-2.715-3.162)', '(Generic impact sounds-3.555-3.693)', '(Generic impact sounds-4.403-4.589)', '(Generic impact sounds-5.96-6.097)', '(Generic impact sounds-7.372-7.551)', '(Shout-7.827-9.122)', '(Generic impact sounds-8.867-9.053)']"
  },
  "Y1Qik4gI3Xlw.wav": {
    "caption": "A woman softly whispers while speaking in a hushed tone, possibly in a quiet room or intimate setting.",
    "timestamp_events": "['(Whispering-0.0-0.286)', '(Background noise-0.0-10.0)', '(Whispering-0.403-0.823)', '(Whispering-0.939-1.454)', '(Breathing-1.521-2.594)', '(Human sounds-2.639-3.149)', '(Breathing-3.104-3.578)', '(Breathing-3.766-4.07)', '(Whispering-4.119-7.487)', '(Whispering-7.737-9.886)']"
  },
  "Y0qlMC4f7vVo.wav": {
    "caption": "A baby cries while a woman speaks in a hospital room, accompanied by background music.",
    "timestamp_events": "['(Music-0.0-9.13)', '(Male singing-0.0-9.13)', '(Baby cry, infant cry-0.392-1.484)', '(Baby cry, infant cry-1.724-2.659)', '(Baby cry, infant cry-3.03-5.915)', '(Baby cry, infant cry-6.121-9.13)']"
  },
  "Y4te1v86pSn0.wav": {
    "caption": "Birds chirp and sing as a squawking sound is heard, indicating the presence of domestic animals or pets in an outdoor environment.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.307)', '(Bird vocalization, bird call, bird song-0.0-0.526)', '(Wind-0.0-10.0)', '(Bird vocalization, bird call, bird song-0.691-3.488)', '(Male speech, man speaking-0.838-1.732)', '(Male speech, man speaking-2.458-10.0)', '(Bird vocalization, bird call, bird song-3.639-4.175)', '(Bird vocalization, bird call, bird song-4.34-5.062)', '(Bird vocalization, bird call, bird song-5.241-6.705)', '(Bird vocalization, bird call, bird song-6.89-9.062)', '(Bird vocalization, bird call, bird song-9.186-9.241)', '(Bird vocalization, bird call, bird song-9.371-10.0)']"
  },
  "Y4Csr25pn41Q.wav": {
    "caption": "People yell and laugh in a small room while music plays, creating a lively atmosphere.",
    "timestamp_events": "['(Human sounds-0.0-1.268)', '(Background noise-0.0-10.0)', '(Human sounds-1.364-1.804)', '(Human sounds-1.907-2.217)', '(Human sounds-2.313-2.691)', '(Human sounds-2.808-2.993)', '(Male speech, man speaking-2.959-5.309)', '(Laughter-5.138-6.031)', '(Male speech, man speaking-5.818-10.0)']"
  },
  "Y43RFHuMSFIY.wav": {
    "caption": "A guitar strums softly as electronic music plays in the background at a lively discotheque.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Male singing-0.0-10.0)', '(Male speech, man speaking-7.105-9.789)']"
  },
  "Y7YkMNtI7NvI.wav": {
    "caption": "A group of people engage in conversation while wind blows in the background at a busy social gathering.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Hubbub, speech noise, speech babble-0.0-10.0)', '(Male speech, man speaking-0.541-2.232)', '(Male speech, man speaking-9.411-10.0)']"
  },
  "Ybi0yeSSgMX0.wav": {
    "caption": "A choir sings harmoniously on stage, creating a beautiful a cappella performance.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Choir-0.0-10.0)', '(Male singing-0.579-1.889)', '(Male singing-3.078-4.567)', '(Male singing-5.568-7.111)']"
  },
  "Y8S7zOYPESi8.wav": {
    "caption": "A small dog barks while a woman speaks in a domestic environment, possibly indicating the presence of pets.",
    "timestamp_events": "['(Yip-0.0-0.309)', '(Mechanisms-0.0-9.283)', '(Yip-0.487-1.319)', '(Yip-1.593-2.734)', '(Yip-2.912-4.089)', '(Female speech, woman speaking-4.22-6.229)', '(Yip-4.874-5.242)', '(Yip-5.979-7.096)', '(Female speech, woman speaking-6.466-6.918)', '(Female speech, woman speaking-7.191-7.595)', '(Yip-7.239-7.631)', '(Yip-7.857-9.046)']"
  },
  "Y14RrzOGATv8.wav": {
    "caption": "A group of people engage in conversation as they walk and a wind blows in an urban setting.",
    "timestamp_events": "['(Child speech, kid speaking-0.0-3.664)', '(Wind-0.0-10.0)', '(Walk, footsteps-1.618-1.723)', '(Walk, footsteps-2.333-2.491)', '(Walk, footsteps-2.762-2.927)', '(Walk, footsteps-3.318-3.574)', '(Walk, footsteps-3.792-4.108)', '(Walk, footsteps-4.409-4.59)', '(Child speech, kid speaking-4.59-5.011)', '(Walk, footsteps-4.981-5.109)', '(Child speech, kid speaking-5.267-5.463)', '(Walk, footsteps-5.448-5.636)', '(Child speech, kid speaking-5.771-8.442)', '(Walk, footsteps-5.989-6.102)', '(Walk, footsteps-6.275-6.388)', '(Walk, footsteps-6.576-6.817)', '(Walk, footsteps-6.923-7.028)', '(Walk, footsteps-7.224-7.517)', '(Walk, footsteps-7.705-7.878)', '(Walk, footsteps-8.277-8.623)', '(Child speech, kid speaking-8.661-10.0)', '(Walk, footsteps-8.721-8.879)', '(Walk, footsteps-9.082-9.255)', '(Walk, footsteps-9.496-9.676)', '(Walk, footsteps-9.789-10.0)']"
  },
  "Y7ikvVbnualY.wav": {
    "caption": "People laugh and talk in a music studio as a man with glasses and a red glove holds a red object.",
    "timestamp_events": "['(Laughter-0.0-1.279)', '(Mechanisms-0.0-10.0)', '(Male speech, man speaking-1.437-5.004)', '(Conversation-1.475-9.526)', '(Laughter-2.047-2.22)', '(Laughter-2.551-2.799)', '(Breathing-5.26-5.531)', '(Male speech, man speaking-5.576-9.15)', '(Laughter-6.9-7.938)', '(Laughter-8.766-9.293)', '(Breathing-9.285-9.752)', '(Male speech, man speaking-9.857-10.0)']"
  },
  "Y4Gw8jFlJyLI.wav": {
    "caption": "A man sings on stage while a crowd cheers and claps in a large hall, accompanied by music and occasional whoops.",
    "timestamp_events": "['(Male singing-0.0-2.915)', '(Music-0.0-10.0)', '(Screaming-0.052-0.82)', '(Whoop-3.434-5.986)', '(Male singing-4.174-4.734)', '(Male singing-6.006-10.0)', '(Whoop-6.691-7.742)', '(Human voice-8.966-9.72)']"
  },
  "Y446RTbt3Vao.wav": {
    "caption": "An adult male speaks while a group of people chuckle and chortle in a large room or hall.",
    "timestamp_events": "['(Male speech, man speaking-0.0-2.065)', '(Conversation-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Giggle-1.859-5.165)', '(Male speech, man speaking-4.711-5.509)', '(Giggle-5.495-7.062)', '(Breathing-5.577-6.093)', '(Male speech, man speaking-6.031-6.725)', '(Breathing-6.663-7.0)', '(Male speech, man speaking-7.014-10.0)', '(Giggle-8.189-8.766)']"
  },
  "Y703tZ8sFF6k.wav": {
    "caption": "A dog whimpers while a man laughs in a music studio, accompanied by domestic animal sounds and music.",
    "timestamp_events": "['(Dog-0.0-0.29)', '(Male singing-0.0-0.802)', '(Music-0.0-10.0)', '(Dog-0.485-1.045)', '(Male singing-1.175-5.099)', '(Dog-1.395-1.988)', '(Dog-3.044-3.247)', '(Dog-3.409-3.767)', '(Dog-3.929-4.295)', '(Dog-5.846-6.049)', '(Male singing-5.911-8.909)', '(Dog-6.399-7.203)', '(Howl-7.203-9.152)', '(Male singing-9.185-10.0)', '(Howl-9.51-10.0)']"
  },
  "Ya8oPAcGtj6Q.wav": {
    "caption": "A man speaks followed by a duck quacking, creating a unique audio event of human-animal interaction in a natural setting.",
    "timestamp_events": "['(Background noise-0.015-4.256)', '(Male speech, man speaking-4.256-5.641)', '(Crow-4.47-5.604)', '(Crow-5.796-6.223)', '(Crow-5.929-5.976)', '(Crow-6.48-7.349)', '(Crow-7.769-8.321)', '(Male speech, man speaking-8.645-10.0)', '(Crow-9.028-9.374)']"
  },
  "YBGH3pmm6-JY.wav": {
    "caption": "People are talking and laughing while a dog barks in the background, creating a lively atmosphere.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.651)', '(Music-0.0-10.0)', '(Laughter-0.692-0.913)', '(Female speech, woman speaking-1.395-1.808)', '(Mouse-1.925-2.483)', '(Female speech, woman speaking-2.669-3.247)', '(Laughter-3.061-6.987)', '(Breathing-3.867-4.363)', '(Female speech, woman speaking-4.384-5.355)', '(Mouse-5.334-5.816)', '(Mouse-6.209-7.035)', '(Speech-7.097-7.986)', '(Mouse-7.69-8.399)', '(Speech-8.543-9.515)', '(Mouse-8.661-9.68)']"
  },
  "YCaoTyzMbMiE.wav": {
    "caption": "Water splashes and gurgles as a rowboat, canoe, or kayak glides through the peaceful environment of a waterway.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Rowboat, canoe, kayak-0.0-10.0)', '(Stream, river-0.0-10.0)', '(Surface contact-0.093-0.384)', '(Surface contact-0.543-1.089)', '(Surface contact-3.074-3.614)', '(Surface contact-5.004-5.488)', '(Surface contact-6.145-6.525)', '(Surface contact-6.961-7.389)', '(Surface contact-7.721-8.074)']"
  },
  "Y5ZV5NcgFMck.wav": {
    "caption": "A man sings accompanied by music as a crowd cheers in the orchestra pit. (Audio event: Singing)",
    "timestamp_events": "['(Male singing-0.0-1.293)', '(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Male singing-1.533-2.399)', '(Whoop-2.2-2.973)', '(Male singing-2.674-3.024)', '(Male singing-3.307-6.777)', '(Whistling-5.746-6.11)', '(Whoop-6.6-7.573)', '(Male singing-7.933-10.0)', '(Whistling-7.993-8.282)', '(Whistling-8.987-9.44)', '(Whoop-9.267-10.0)']"
  },
  "Y0xaEqnvDJgY.wav": {
    "caption": "A group of women in black dresses sing a cappella in a large ballroom, accompanied by music.",
    "timestamp_events": "['(Female singing-0.0-2.591)', '(Music-0.0-10.0)', '(Choir-0.0-10.0)', '(Female singing-3.197-10.0)']"
  },
  "Y3wV80XZI2yI.wav": {
    "caption": "A frog croaks while people talk in the background, creating a lively atmosphere in a serene pond.",
    "timestamp_events": "['(Pig-0.0-2.077)', '(Music-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Pig-2.257-2.634)', '(Female speech, woman speaking-3.853-5.049)', '(Speech-5.546-5.968)', '(Pig-5.997-7.878)', '(Female speech, woman speaking-7.555-8.059)', '(Pig-8.051-9.12)', '(Female speech, woman speaking-9.029-10.0)']"
  },
  "Y-6sNhZq681c.wav": {
    "caption": "A man speaks while music plays in the background in an indoor setting.",
    "timestamp_events": "['(Male speech, man speaking-0.0-3.496)', '(Music-0.0-10.0)', '(Background noise-0.0-10.0)', '(Male speech, man speaking-4.035-10.0)']"
  },
  "Y6ZBYrFpQt6w.wav": {
    "caption": "A loud car horn honks in an urban environment, followed by the sound of rustling in the background.",
    "timestamp_events": "['(Wind-0.075-6.595)', '(Run-0.129-0.306)', '(Run-0.415-0.578)', '(Run-0.755-0.931)', '(Run-1.081-1.489)', '(Run-1.584-2.182)', '(Vehicle horn, car horn, honking, toot-2.332-3.361)', '(Air horn, truck horn-3.311-4.53)', '(Run-4.943-5.106)', '(Run-5.346-6.595)']"
  },
  "Y2-4EJZwsBrc.wav": {
    "caption": "A man speaks with a speech synthesizer as music plays in the background in a home theater.",
    "timestamp_events": "['(Music-0.391-10.0)', '(Conversation-1.174-10.0)', '(Male speech, man speaking-1.196-2.611)', '(Male speech, man speaking-3.341-4.327)', '(Male speech, man speaking-4.703-6.072)', '(Male speech, man speaking-6.448-7.976)', '(Male speech, man speaking-8.269-8.879)', '(Male speech, man speaking-9.044-10.0)']"
  },
  "Y9QXJJl3YzDU.wav": {
    "caption": "A man speaks as music plays in the background, accompanied by the sound of a skateboard rolling.",
    "timestamp_events": "['(Male speech, man speaking-0.0-2.513)', '(Music-0.0-9.594)', '(Skateboard-0.903-3.236)', '(Male speech, man speaking-3.078-3.883)', '(Female singing-6.027-9.248)']"
  },
  "Y1rmhTDK7qAg.wav": {
    "caption": "A man speaks while music plays in a playroom.",
    "timestamp_events": "['(Male speech, man speaking-0.0-2.622)', '(Music-0.0-10.0)', '(Generic impact sounds-1.175-1.273)', '(Generic impact sounds-2.938-3.199)', '(Generic impact sounds-3.509-3.9)', '(Generic impact sounds-4.237-4.766)', '(Generic impact sounds-5.144-5.371)', '(Generic impact sounds-5.692-5.773)', '(Generic impact sounds-6.196-6.334)', '(Generic impact sounds-7.373-7.512)', '(Generic impact sounds-8.535-8.608)', '(Generic impact sounds-8.836-8.957)', '(Generic impact sounds-9.778-10.0)']"
  },
  "Ya6VitvO4tgE.wav": {
    "caption": "A crowd erupts in cheers as an adult female delivers a speech, creating an atmosphere of excitement and celebration.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-3.427)', '(Background noise-0.0-10.0)', '(Breathing-3.427-3.733)', '(Female speech, woman speaking-3.785-4.554)', '(Whoop-4.545-7.727)', '(Applause-5.806-10.0)']"
  },
  "Y3r8zgkmCGxQ.wav": {
    "caption": "People are talking and laughing while water splashes and splatters in a water park pool.",
    "timestamp_events": "['(Water-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Human voice-0.048-0.157)', '(Tick-0.048-0.254)', '(Human voice-0.331-0.457)', '(Child speech, kid speaking-0.734-1.627)', '(Laughter-1.668-2.135)', '(Human voice-2.162-2.491)', '(Human voice-2.704-2.848)', '(Human voice-3.095-3.48)', '(Laughter-3.679-4.949)', '(Cough-4.221-4.468)', '(Male speech, man speaking-4.811-5.656)', '(Sniff-5.016-5.216)', '(Laughter-5.916-6.651)', '(Female speech, woman speaking-6.822-9.122)', '(Laughter-9.575-10.0)']"
  },
  "Y0IuJ1tiJb-g.wav": {
    "caption": "Water trickles down inside a small room, creating a soothing sound reminiscent of a peaceful indoor fountain.",
    "timestamp_events": "['(Trickle, dribble-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-3.562-3.667)', '(Generic impact sounds-4.529-4.668)', '(Generic impact sounds-6.112-6.624)', '(Generic impact sounds-7.392-7.52)', '(Generic impact sounds-8.463-10.0)']"
  },
  "Y5nOBC7ctGbY.wav": {
    "caption": "A camera clicks as a woman speaks in the background followed by a man asking questions in a calm and productive atmosphere in a small room.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-2.213)', '(Conversation-0.0-10.0)', '(Walk, footsteps-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Male speech, man speaking-1.498-3.159)', '(Camera-3.208-5.266)', '(Male speech, man speaking-3.643-4.889)', '(Female speech, woman speaking-4.502-5.015)', '(Male speech, man speaking-5.43-6.812)', '(Camera-5.459-6.203)', '(Female speech, woman speaking-5.459-7.527)', '(Male speech, man speaking-7.092-8.203)', '(Female speech, woman speaking-8.85-10.0)']"
  },
  "Y3ccXywmials.wav": {
    "caption": "Swing music fills the ballroom as a man delivers a speech, igniting cheers from the crowd.",
    "timestamp_events": "['(Male singing-0.0-2.215)', '(Human voice-1.687-2.467)', '(Music-2.264-10.0)', '(Male singing-2.719-6.464)', '(Human voice-3.247-3.563)', '(Human voice-3.742-4.798)', '(Male singing-6.756-8.308)', '(Male singing-8.478-10.0)']"
  },
  "Y3clQa02xoi8.wav": {
    "caption": "A vehicle engine is running and vibrating while music plays in the background, suggesting a lively atmosphere.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Car-0.0-10.0)', '(Accelerating, revving, vroom-6.004-10.0)']"
  },
  "Y5QgmnPM42Kg.wav": {
    "caption": "A man sings passionately in an indoor setting like a home or studio.",
    "timestamp_events": "['(Music-0.183-5.247)', '(Hubbub, speech noise, speech babble-0.187-5.247)', '(Male speech, man speaking-0.24-1.296)', '(Male singing-0.33-1.319)', '(Male singing-1.406-2.145)', '(Male speech, man speaking-2.436-2.836)', '(Male speech, man speaking-3.345-4.123)', '(Male singing-4.33-4.919)']"
  },
  "YBQaFuod-ueg.wav": {
    "caption": "An adult female delivers a speech while a crowd cheers in an outdoor location near a chainlink fence.",
    "timestamp_events": "['(Conversation-0.0-4.02)', '(Background noise-0.0-9.351)', '(Child speech, kid speaking-0.003-1.854)', '(Giggle-1.314-2.42)', '(Male speech, man speaking-2.381-3.686)', '(Child speech, kid speaking-3.133-4.001)', '(Shout-3.59-9.351)', '(Child speech, kid speaking-7.35-7.877)', '(Child speech, kid speaking-8.024-8.609)', '(Child speech, kid speaking-8.706-9.351)']"
  },
  "Y-9MfiQzh99c.wav": {
    "caption": "A power tool motor is running and vibrating while metal whirring occurs, accompanied by background music, in a woodworking workshop.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.324-0.415)', '(Generic impact sounds-0.869-1.077)', '(Generic impact sounds-1.492-2.374)', '(Surface contact-4.06-4.682)', '(Generic impact sounds-5.214-5.642)', '(Surface contact-6.485-6.9)', '(Generic impact sounds-7.328-7.549)', '(Generic impact sounds-8.093-8.301)']"
  },
  "Y710INRXyTus.wav": {
    "caption": "A man speaks as a car speeds by, creating a high-energy atmosphere, possibly in an urban setting.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.307)', '(Accelerating, revving, vroom-0.0-5.293)', '(Race car, auto racing-0.0-10.0)', '(Male speech, man speaking-5.908-9.888)']"
  },
  "Y-bOmOinDpPo.wav": {
    "caption": "Music plays as a crowd claps, creating a lively atmosphere in a stadium during a football game.",
    "timestamp_events": "['(Clapping-0.0-0.088)', '(Whistle-0.0-0.426)', '(Music-0.0-0.965)', '(Cheering-0.0-9.791)', '(Clapping-0.251-0.338)', '(Clapping-0.483-0.578)', '(Clapping-0.74-1.066)', '(Battle cry-1.078-1.718)', '(Music-1.655-7.848)', '(Clapping-1.855-1.993)', '(Clapping-2.194-2.332)', '(Clapping-2.645-2.783)', '(Clapping-3.059-3.184)', '(Clapping-3.423-3.586)', '(Clapping-3.849-4.049)', '(Clapping-4.25-4.388)', '(Clapping-4.676-4.864)', '(Clapping-5.077-5.253)', '(Clapping-5.466-5.604)', '(Clapping-5.917-6.08)', '(Clapping-6.319-6.544)', '(Clapping-6.807-6.995)', '(Clapping-7.209-7.397)', '(Clapping-7.61-7.798)', '(Battle cry-8.036-9.077)', '(Hubbub, speech noise, speech babble-8.732-9.721)']"
  },
  "Y8tt5tDwAYQs.wav": {
    "caption": "People talking and a baby crying can be heard in a large room or hall, creating a hubbub of speech noise and babble.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.571)', '(Background noise-0.0-10.0)', '(Laughter-0.477-2.328)', '(Shout-0.803-2.375)', '(Male speech, man speaking-2.41-3.912)', '(Shout-2.643-4.191)', '(Breathing-4.005-4.238)', '(Male speech, man speaking-4.261-4.494)', '(Breathing-4.68-4.901)', '(Male speech, man speaking-4.855-10.0)', '(Shout-4.89-6.077)', '(Laughter-8.906-10.0)']"
  },
  "YBlMgnV76g8w.wav": {
    "caption": "The engine of a car revs up and down, creating a medium frequency rumble in the vehicle.",
    "timestamp_events": "['(Car-0.0-10.0)', '(Generic impact sounds-0.138-0.39)', '(Generic impact sounds-0.516-1.388)', '(Generic impact sounds-1.456-1.846)', '(Generic impact sounds-1.927-2.374)', '(Generic impact sounds-2.523-3.039)', '(Generic impact sounds-3.154-3.234)', '(Generic impact sounds-3.406-5.734)', '(Accelerating, revving, vroom-4.002-10.0)', '(Generic impact sounds-5.929-6.044)', '(Generic impact sounds-6.216-7.03)', '(Generic impact sounds-7.213-7.775)', '(Generic impact sounds-8.349-8.555)', '(Generic impact sounds-9.369-9.817)']"
  },
  "Y25TL-KzwiVA.wav": {
    "caption": "A car engine revs as it traverses through streets driven by a man.",
    "timestamp_events": "['(Generic impact sounds-0.0-0.375)', '(Car-0.0-10.0)', '(Accelerating, revving, vroom-0.485-2.597)', '(Generic impact sounds-0.629-4.375)', '(Accelerating, revving, vroom-3.149-4.116)', '(Generic impact sounds-4.519-5.818)', '(Generic impact sounds-5.949-6.024)', '(Generic impact sounds-6.354-6.979)', '(Generic impact sounds-7.227-7.66)', '(Generic impact sounds-7.839-8.382)', '(Accelerating, revving, vroom-8.153-10.0)', '(Generic impact sounds-9.076-9.536)', '(Generic impact sounds-9.742-9.9)']"
  },
  "YaQfXbZo8UZI.wav": {
    "caption": "A group of people sing and clap along to music as a woman in a black dress performs on stage in an orchestra pit.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Clapping-0.315-0.769)', '(Clapping-1.189-1.302)', '(Female singing-1.189-1.827)', '(Clapping-1.757-2.334)', '(Female singing-2.168-3.226)', '(Clapping-3.156-3.61)', '(Female singing-3.61-4.344)', '(Clapping-4.406-4.834)', '(Female singing-4.476-5.691)', '(Clapping-5.83-6.259)', '(Female singing-5.865-7.098)', '(Clapping-7.168-7.649)', '(Female singing-7.413-9.432)', '(Clapping-8.593-9.012)', '(Female singing-9.729-10.0)']"
  },
  "Y9Botkvq32u0.wav": {
    "caption": "Emergency sirens blare as a car alarm rings out, indicating a chaotic scene on the road.",
    "timestamp_events": "['(Car alarm-0.0-8.668)', '(Mechanisms-0.0-10.0)', '(Vehicle horn, car horn, honking, toot-1.383-2.241)', '(Vehicle horn, car horn, honking, toot-2.548-3.022)', '(Vehicle horn, car horn, honking, toot-3.252-3.483)', '(Vehicle horn, car horn, honking, toot-3.598-4.2)', '(Vehicle horn, car horn, honking, toot-8.656-8.848)', '(Vehicle horn, car horn, honking, toot-8.976-9.718)']"
  },
  "Y8wjCtXtSuQE.wav": {
    "caption": "A large crowd erupts in cheers and applause as music plays in an indoor basketball court.",
    "timestamp_events": "['(Shout-0.0-1.914)', '(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Whoop-2.304-3.092)', '(Shout-3.19-6.293)']"
  },
  "Y8u2v1db6Hx4.wav": {
    "caption": "A child babbles while speaking to a female while playing inside a house.",
    "timestamp_events": "['(Conversation-0.0-9.626)', '(Female speech, woman speaking-9.122-9.626)', '(Background noise-0.0-10.0)', '(Child speech, kid speaking-6.63-8.838)']"
  },
  "Y6zbkVL8ZxcU.wav": {
    "caption": "Multiple people are laughing and talking while a car horn blares in the background, indicating a chaotic and noisy environment.",
    "timestamp_events": "['(Car alarm-0.0-10.0)', '(Wind-0.0-10.0)', '(Giggle-1.02-2.5)', '(Giggle-2.77-3.807)', '(Giggle-4.077-5.861)', '(Breathing-6.497-6.94)', '(Human voice-7.037-7.825)', '(Giggle-8.199-8.427)', '(Breathing-9.077-9.513)', '(Giggle-9.492-9.858)']"
  },
  "Y3qDzHyrsWeg.wav": {
    "caption": "The motorboat speeds through the water, creating splashes, as it moves along near some houses.",
    "timestamp_events": "['(Accelerating, revving, vroom-0.0-1.648)', '(Wind-0.0-4.497)', '(Water-0.0-4.497)', '(Motorboat, speedboat-0.0-4.511)', '(Motorboat, speedboat-4.623-10.0)', '(Wind-4.623-10.0)', '(Water-4.623-10.0)', '(Accelerating, revving, vroom-4.623-10.0)']"
  },
  "YxNJxsEWLfh0.wav": {
    "caption": "A woman speaks while a child cries, creating a whimpering and sobbing sound in a room.",
    "timestamp_events": "['(Human voice-0.0-0.23)', '(Background noise-0.0-10.0)', '(Crying, sobbing-0.189-4.485)', '(Female speech, woman speaking-0.196-1.701)', '(Conversation-0.196-10.0)', '(Human voice-1.078-1.24)', '(Human voice-1.793-1.939)', '(Female speech, woman speaking-2.382-3.949)', '(Breathing-4.725-4.993)', '(Crying, sobbing-5.0-5.983)', '(Male speech, man speaking-5.969-7.825)', '(Crying, sobbing-8.155-10.0)', '(Breathing-8.161-8.438)', '(Female speech, woman speaking-8.437-10.0)']"
  },
  "Ywf57lUIx8ME.wav": {
    "caption": "Fireworks explode in the urban setting as a firecracker sound dominates the audio, creating a lively atmosphere.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Firecracker-0.293-1.543)', '(Speech-0.668-2.446)', '(Firecracker-2.19-2.664)', '(Firecracker-2.927-3.687)', '(Speech-3.492-4.689)', '(Firecracker-4.695-5.388)', '(Firecracker-6.148-6.704)', '(Firecracker-7.382-8.458)', '(Firecracker-8.879-9.293)', '(Firecracker-9.819-10.0)']"
  },
  "YZub0gYFPmY8.wav": {
    "caption": "A digital beeping sound is heard repeatedly, indicating a fire alarm going off in a child's room.",
    "timestamp_events": "['(Generic impact sounds-0.0-0.126)', '(Background noise-0.0-10.0)', '(Generic impact sounds-0.31-0.401)', '(Generic impact sounds-0.505-0.929)', '(Generic impact sounds-1.032-1.135)', '(Fire alarm-1.101-1.399)', '(Fire alarm-1.571-2.03)', '(Generic impact sounds-2.225-2.408)', '(Fire alarm-2.443-3.016)', '(Generic impact sounds-3.234-3.36)', '(Fire alarm-3.44-4.094)', '(Generic impact sounds-4.266-4.415)', '(Generic impact sounds-4.908-5.115)', '(Fire alarm-5.447-6.067)', '(Generic impact sounds-6.055-6.399)', '(Fire alarm-6.399-7.018)', '(Generic impact sounds-7.03-7.397)', '(Fire alarm-7.397-8.016)', '(Generic impact sounds-7.982-8.131)', '(Generic impact sounds-8.245-8.429)', '(Generic impact sounds-8.922-9.14)', '(Generic impact sounds-9.255-9.392)', '(Fire alarm-9.392-10.0)']"
  },
  "YXYQyoNGpMk0.wav": {
    "caption": "People are talking, arguing and clapping while music and speech can be heard in the television studio.",
    "timestamp_events": "['(Male speech, man speaking-0.0-3.047)', '(Conversation-0.0-10.0)', '(Music-0.0-10.0)', '(Male speech, man speaking-3.514-4.898)', '(Male speech, man speaking-5.801-10.0)']"
  },
  "YZbGL9ItQZeI.wav": {
    "caption": "A sheep bleats as a man speaks, indicating the presence of livestock on a farm.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Moo-0.012-2.435)', '(Moo-3.008-6.634)', '(Walk, footsteps-6.663-6.779)', '(Conversation-6.709-10.0)', '(Male speech, man speaking-6.709-10.0)', '(Walk, footsteps-6.877-6.946)', '(Walk, footsteps-7.287-7.444)', '(Walk, footsteps-7.513-7.663)']"
  },
  "Yr-5NCjm4GlQ.wav": {
    "caption": "A guitar strums while a keyboard is tapped intermittently, creating melodic music in a discotheque.",
    "timestamp_events": "['(Tap dance-0.0-0.078)', '(Music-0.0-10.0)', '(Background noise-0.0-10.0)', '(Tap dance-0.391-0.552)', '(Tap dance-0.99-3.751)', '(Tap dance-3.903-8.318)', '(Tap dance-8.461-8.899)', '(Tap dance-9.042-9.211)', '(Tap dance-9.336-9.417)', '(Tap dance-9.533-9.703)', '(Tap dance-9.837-10.0)']"
  },
  "YSFD6nFXY1jw.wav": {
    "caption": "A man speaks with music playing in the background while a vehicle passes by, creating a lively atmosphere on a bustling street.",
    "timestamp_events": "['(Music-0.0-7.158)', '(Bicycle, tricycle-0.144-4.293)', '(Male speech, man speaking-0.801-7.173)']"
  },
  "Yvaq0LbYJjsk.wav": {
    "caption": "Music plays as an eruption occurs, followed by a booming sound, creating a lively atmosphere in a burial chamber.",
    "timestamp_events": "['(Sound effect-0.0-0.582)', '(Music-0.0-10.0)', '(Video game sound-0.0-10.0)', '(Sound effect-0.98-1.942)', '(Sound effect-2.459-3.084)', '(Sound effect-3.45-3.905)', '(Fire-4.425-10.0)']"
  },
  "YRprKnpcWaP4.wav": {
    "caption": "A crowd of people cheer and chant while a group of girls dance on stage with fiery energy.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Hubbub, speech noise, speech babble-0.315-1.767)', '(Cheering-1.56-5.073)', '(Hubbub, speech noise, speech babble-2.417-3.06)', '(Male speech, man speaking-5.01-5.937)', '(Conversation-5.024-8.641)', '(Hubbub, speech noise, speech babble-6.373-7.064)', '(Male speech, man speaking-6.892-7.369)', '(Female speech, woman speaking-7.791-8.634)', '(Hubbub, speech noise, speech babble-8.634-10.0)']"
  },
  "YUdDgy6nuxyM.wav": {
    "caption": "The sound of scraping and a woman's voice can be heard as sanding and rubbing occur in a workshop.",
    "timestamp_events": "['(Sanding-0.0-0.181)', '(Female speech, woman speaking-0.0-0.78)', '(Music-0.0-10.0)', '(Sanding-0.307-2.74)', '(Female speech, woman speaking-1.638-3.11)', '(Sanding-2.929-4.866)', '(Female speech, woman speaking-5.094-5.323)', '(Female speech, woman speaking-5.488-6.969)', '(Female speech, woman speaking-7.189-10.0)']"
  },
  "YZFfTfUWPwhY.wav": {
    "caption": "A chainsaw roars as a man starts it up, accompanied by the sound of power tools and occasional speech in a wooded area.",
    "timestamp_events": "['(Wind-0.008-10.0)', '(Sawing-0.03-1.495)', '(Male speech, man speaking-2.106-2.754)', '(Sawing-3.064-4.028)', '(Sawing-4.536-5.641)', '(Sawing-5.884-10.0)', '(Male speech, man speaking-8.542-10.0)']"
  },
  "YVpi3hCbu9Ow.wav": {
    "caption": "A cat growls repeatedly in a domestic setting, indicating the presence of a pet in a home environment.",
    "timestamp_events": "['(Breathing-0.0-0.614)', '(Mechanisms-0.0-10.0)', '(Laughter-0.573-1.617)', '(Growling-0.929-3.349)', '(Breathing-1.848-2.312)', '(Breathing-2.866-3.188)', '(Breathing-3.805-4.207)', '(Growling-4.209-6.709)', '(Breathing-7.317-8.041)', '(Laughter-8.819-9.622)', '(Growling-9.507-10.0)']"
  },
  "YNWkDQE9RrDc.wav": {
    "caption": "A train approaches a subway station as it gets closer, with the sound of rail transport and train wagons.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Train-0.0-10.0)', '(Railroad car, train wagon-0.179-0.551)', '(Generic impact sounds-1.37-1.588)', '(Generic impact sounds-1.754-1.895)', '(Generic impact sounds-4.02-4.277)', '(Generic impact sounds-5.199-5.442)', '(Generic impact sounds-6.172-6.466)', '(Generic impact sounds-7.183-7.503)', '(Railroad car, train wagon-7.618-8.259)', '(Generic impact sounds-8.732-9.052)', '(Generic impact sounds-9.347-9.59)']"
  },
  "YUvDH9LfN0D8.wav": {
    "caption": "The sound of clicking accompanies a man's speech in a small room, suggesting a conversation or presentation.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.61)', '(Background noise-0.0-10.0)', '(Computer keyboard-0.579-0.858)', '(Male speech, man speaking-0.941-2.069)', '(Computer keyboard-2.4-3.379)', '(Clicking-3.792-3.958)', '(Clicking-5.162-5.245)', '(Clicking-5.493-5.598)', '(Male speech, man speaking-5.862-6.652)', '(Clicking-5.884-5.944)', '(Clicking-7.637-7.75)', '(Computer keyboard-8.217-8.698)', '(Computer keyboard-9.714-9.962)']"
  },
  "YUYeiSU4AWj4.wav": {
    "caption": "Music plays softly as water splashes in a large room, resembling the sound of a bathtub filling or being washed.",
    "timestamp_events": "['(Music-0.0-6.029)', '(Water-0.0-7.15)', '(Mechanisms-5.14-10.0)', '(Generic impact sounds-7.159-7.488)', '(Generic impact sounds-7.652-9.034)', '(Generic impact sounds-9.295-9.73)']"
  },
  "Yrl09PeW40dw.wav": {
    "caption": "The engine roars to life as music fills the air, with occasional scratching sounds, in a music studio.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Male speech, man speaking-1.165-1.591)', '(Male speech, man speaking-1.804-3.426)', '(Shout-3.433-4.23)', '(Male speech, man speaking-3.653-3.969)', '(Male speech, man speaking-5.591-5.777)', '(Shout-6.423-7.887)', '(Male speech, man speaking-6.457-7.928)']"
  },
  "Yto2RF7hOTFw.wav": {
    "caption": "Dishes clang together as a woman laughs, accompanied by the sound of cutlery and silverware in a kitchen.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Dishes, pots, and pans-0.184-3.469)', '(Dishes, pots, and pans-3.662-5.701)', '(Breathing-4.966-5.546)', '(Human sounds-5.768-6.184)', '(Breathing-6.174-6.58)', '(Human sounds-6.58-7.121)', '(Dishes, pots, and pans-7.092-7.208)', '(Breathing-7.14-7.498)', '(Human sounds-7.701-8.638)', '(Dishes, pots, and pans-8.657-9.845)']"
  },
  "YX4GVaDr0BBo.wav": {
    "caption": "A boat motor roars as an adult male speaks in the background, indicating a lively environment on a motorboat.",
    "timestamp_events": "['(Motorboat, speedboat-0.0-10.0)', '(Accelerating, revving, vroom-5.805-10.0)', '(Water-0.0-10.0)']"
  },
  "YqjlPexB2uVI.wav": {
    "caption": "A man speaks amidst the chirping of birds in a small room, creating an insect-like ambiance.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Bird vocalization, bird call, bird song-0.321-0.475)', '(Female speech, woman speaking-0.796-2.402)', '(Bird vocalization, bird call, bird song-1.285-1.508)', '(Bird vocalization, bird call, bird song-1.941-2.109)', '(Bird vocalization, bird call, bird song-2.486-2.723)', '(Bird vocalization, bird call, bird song-2.863-3.031)', '(Bird vocalization, bird call, bird song-3.268-3.464)', '(Bird vocalization, bird call, bird song-3.631-3.869)', '(Female speech, woman speaking-4.204-4.749)', '(Bird vocalization, bird call, bird song-5.279-5.908)', '(Bird vocalization, bird call, bird song-6.466-6.634)', '(Female speech, woman speaking-6.508-7.444)', '(Bird vocalization, bird call, bird song-7.835-8.296)', '(Bird vocalization, bird call, bird song-8.547-8.939)', '(Female speech, woman speaking-9.036-10.0)']"
  },
  "YRjogI2AWTwc.wav": {
    "caption": "Shoes squeak as a man speaks in the background while a basketball bounces in a large indoor room.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.408)', '(Basketball bounce-0.0-7.286)', '(Mechanisms-0.0-10.0)', '(Squeal-0.359-1.703)', '(Male speech, man speaking-1.857-2.971)', '(Squeal-2.061-4.417)', '(Male speech, man speaking-3.534-4.686)', '(Squeal-4.75-5.698)', '(Squeal-5.928-6.684)', '(Squeal-7.055-7.337)', '(Male speech, man speaking-7.465-9.334)', '(Basketball bounce-8.297-8.54)', '(Basketball bounce-9.181-9.347)', '(Male speech, man speaking-9.641-10.0)']"
  },
  "YvZRbl0XpjvA.wav": {
    "caption": "The sound of music fills the air as a car races by, its tires squealing on the raceway.",
    "timestamp_events": "['(Race car, auto racing-0.0-0.796)', '(Music-0.0-10.0)', '(Accelerating, revving, vroom-1.201-8.841)', '(Race car, auto racing-1.229-8.757)']"
  },
  "YO5WhPro-vNQ.wav": {
    "caption": "A man speaks while chewing inside a small room, creating a mastication sound in the audio.",
    "timestamp_events": "['(Male speech, man speaking-0.0-4.861)', '(Background noise-0.0-10.0)', '(Chewing, mastication-4.959-5.914)', '(Chewing, mastication-6.132-6.336)', '(Male speech, man speaking-6.313-6.501)', '(Chewing, mastication-6.546-7.013)', '(Chewing, mastication-7.254-8.194)', '(Male speech, man speaking-8.059-8.992)', '(Chewing, mastication-9.12-9.782)']"
  },
  "YTf4ewOEp0f0.wav": {
    "caption": "Water runs as a woman's voice speaks in a rural setting, likely outside, surrounded by nature.",
    "timestamp_events": "['(Water-0.0-10.0)', '(Background noise-0.0-10.0)', '(Female speech, woman speaking-1.619-5.529)', '(Child speech, kid speaking-3.392-3.839)', '(Human sounds-5.083-8.093)', '(Female speech, woman speaking-9.282-10.0)']"
  },
  "YUoBN57zrTKs.wav": {
    "caption": "A woman speaks while a motor vehicle engine runs, creating an eruption of sound in the background.",
    "timestamp_events": "['(Female speech, woman speaking-0.11-2.346)', '(Jet engine-0.0-10.0)', '(Male speech, man speaking-9.228-10.0)', '(Background noise-0.0-10.0)']"
  },
  "YywDib8jp4Yo.wav": {
    "caption": "Birds chirp and sing while music plays in the background with a man speaking, creating a tense atmosphere in a natural environment.",
    "timestamp_events": "['(Sound effect-0.068-0.873)', '(Water-0.805-10.0)', '(Chirp, tweet-0.82-2.363)', '(Wind-0.842-10.0)', '(Chirp, tweet-3.236-3.416)', '(Music-4.229-10.0)', '(Chirp, tweet-4.304-4.545)', '(Chirp, tweet-5.5-5.696)', '(Chirp, tweet-6.734-7.035)', '(Chirp, tweet-7.457-7.645)', '(Chirp, tweet-7.968-8.706)']"
  },
  "YWwwwbUrBLbQ.wav": {
    "caption": "A man speaks while an electric shaver hums in the background inside a large room.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.701)', '(Conversation-0.0-9.586)', '(Electric shaver, electric razor-0.0-10.0)', '(Television-0.0-10.0)', '(Male speech, man speaking-0.828-2.294)', '(Male speech, man speaking-3.186-4.376)', '(Male speech, man speaking-5.072-6.394)', '(Male speech, man speaking-6.548-9.786)']"
  },
  "YU13QD1WjOLY.wav": {
    "caption": "A man's voice is heard speaking as a group of people talk in the background in an urban environment.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Hubbub, speech noise, speech babble-0.0-10.0)', '(Male speech, man speaking-0.105-10.0)', '(Conversation-0.12-10.0)']"
  },
  "YPbbFSX52Coo.wav": {
    "caption": "A man is sawing wood with occasional rubbing sounds in a woodworking workshop.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.284)', '(Background noise-0.0-10.0)', '(Sawing-0.123-5.529)', '(Male speech, man speaking-6.03-7.96)', '(Sawing-7.21-10.0)']"
  },
  "Yy7G-meRcLlY.wav": {
    "caption": "A woman speaks while a child is crying, creating a tense atmosphere in a living room.",
    "timestamp_events": "['(Crumpling, crinkling-0.07-0.936)', '(Mechanisms-0.07-10.0)', '(Baby laughter-0.74-2.668)', '(Human sounds-1.047-3.478)', '(Crumpling, crinkling-2.458-4.246)', '(Speech-3.883-6.229)', '(Baby laughter-4.246-5.209)', '(Crumpling, crinkling-5.559-6.215)', '(Baby laughter-6.257-10.0)', '(Crumpling, crinkling-7.123-10.0)', '(Speech-9.623-10.0)']"
  },
  "Yu9laZiHd8kI.wav": {
    "caption": "A crowd cheers as people talk in the background while music plays, creating a lively atmosphere in a gymnasium.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Cheering-0.0-10.0)', '(Male singing-0.004-5.309)', '(Giggle-0.622-1.268)', '(Giggle-3.206-4.23)', '(Whoop-6.835-8.622)', '(Applause-8.629-10.0)', '(Laughter-9.034-10.0)']"
  },
  "YQJQYCFL4JXo.wav": {
    "caption": "An infant cries and sobs in a hospital room, accompanied by the sound of a baby crying.",
    "timestamp_events": "['(Baby cry, infant cry-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Female speech, woman speaking-0.536-1.362)', '(Female speech, woman speaking-2.945-3.597)', '(Female speech, woman speaking-6.24-7.346)', '(Female speech, woman speaking-7.94-10.0)']"
  },
  "YTbFyJs4zslc.wav": {
    "caption": "A man sings pop music while music plays in the background at a performance in an arena.",
    "timestamp_events": "['(Male singing-0.0-3.052)', '(Music-0.0-10.0)', '(Male singing-3.255-10.0)', '(Cheering-6.659-10.0)']"
  },
  "YoJ8r0hglNZ4.wav": {
    "caption": "A frog croaks nearby while birds chirp in the distance, creating a serene ambiance in a bamboo forest.",
    "timestamp_events": "['(Frog-0.0-0.341)', '(Background noise-0.0-9.389)', '(Frog-0.705-2.75)', '(Chirp, tweet-0.938-1.86)', '(Chirp, tweet-3.178-4.256)', '(Frog-4.737-5.535)', '(Frog-5.776-6.646)', '(Chirp, tweet-5.925-6.217)', '(Chirp, tweet-6.457-6.626)', '(Chirp, tweet-6.782-6.983)', '(Frog-6.964-7.509)', '(Chirp, tweet-7.139-7.327)', '(Frog-7.607-8.21)', '(Chirp, tweet-9.009-9.119)']"
  },
  "YPWBkhLhDFxE.wav": {
    "caption": "A loud thump followed by a series of speech suggests people talking and a possible collision in an indoor environment.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-2.573)', '(Music-0.0-10.0)', '(Tap dance-0.0-10.0)', '(Conversation-0.015-10.0)', '(Male speech, man speaking-4.063-4.432)', '(Female speech, woman speaking-4.605-5.455)', '(Female speech, woman speaking-6.163-6.524)', '(Female speech, woman speaking-9.549-10.0)']"
  },
  "YRVJcpsJ7lsQ.wav": {
    "caption": "A man sings passionately accompanied by lively pop music, occasionally shouting, in a large hall.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Distortion-0.0-10.0)', '(Male singing-1.598-10.0)']"
  },
  "Yw9AleaPf7iM.wav": {
    "caption": "The sound of an engine humming with the wind blowing suggests a bus driving on a mountain road, accompanied by the sound of air brakes.",
    "timestamp_events": "['(Bus-0.0-10.0)', '(Video game sound-0.0-10.0)', '(Air brake-2.148-2.416)', '(Chirp, tweet-3.818-4.23)', '(Chirp, tweet-6.979-8.354)', '(Chirp, tweet-9.488-10.0)']"
  },
  "YqXlsRC3Gsfw.wav": {
    "caption": "A man speaks while a group of people sings in the background at an outdoor athletic field.",
    "timestamp_events": "['(Male speech, man speaking-0.0-2.671)', '(Conversation-0.0-6.862)', '(Electric rotor drone, quadcopter-0.0-10.0)', '(Male speech, man speaking-3.13-4.116)', '(Male speech, man speaking-4.409-6.847)', '(Male singing-7.118-10.0)']"
  },
  "YSR6aKHtJzqk.wav": {
    "caption": "Electronic music plays as drums join in, creating a rhythmic and energetic atmosphere in the entertainment center.",
    "timestamp_events": "['(Whistling-0.0-0.849)', '(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Whoop-1.103-5.722)', '(Whistling-3.619-4.375)', '(Whoop-6.114-8.072)']"
  },
  "YrHjCq6n-BDI.wav": {
    "caption": "A baby cries while a woman speaks, accompanied by laughter and music, suggesting a lively and joyful atmosphere.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Television-0.0-10.0)', '(Female speech, woman speaking-0.055-0.425)', '(Baby laughter-0.496-1.787)', '(Female speech, woman speaking-1.654-2.244)', '(Female speech, woman speaking-3.677-4.512)', '(Baby laughter-4.307-6.984)', '(Female speech, woman speaking-6.638-7.693)', '(Baby laughter-7.606-8.197)', '(Female speech, woman speaking-8.283-8.756)', '(Baby laughter-9.425-10.0)', '(Female speech, woman speaking-9.85-10.0)']"
  },
  "YSpGt2BvnyPw.wav": {
    "caption": "The sound of a keyboard being typed on can be heard, accompanied by the faint sound of a spray.",
    "timestamp_events": "['(Rattle-0.0-1.22)', '(Mechanisms-0.0-10.0)', '(Rattle-1.495-2.333)', '(Rattle-2.464-2.608)', '(Breathing-2.519-3.839)', '(Rattle-2.828-4.457)', '(Rattle-4.622-7.206)', '(Breathing-7.351-10.0)', '(Rattle-7.536-10.0)']"
  },
  "YZXXzggUwPGI.wav": {
    "caption": "Music plays as a crowd cheers in a discotheque, creating a lively atmosphere.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Whoop-3.726-6.634)', '(Clapping-4.733-4.871)', '(Clapping-5.139-5.302)', '(Clapping-5.546-5.757)', '(Clapping-5.944-6.423)', '(Clapping-6.594-6.894)', '(Whoop-6.886-9.347)', '(Clapping-7.057-7.317)', '(Clapping-7.544-7.658)', '(Clapping-7.983-8.145)', '(Clapping-8.373-8.568)', '(Clapping-9.185-9.323)', '(Music-9.315-9.323)', '(Clapping-9.551-9.672)']"
  },
  "YSNz88gWKE2o.wav": {
    "caption": "The sound of a saw cutting through wood fills the air in an art studio, accompanied by faint speech in the background.",
    "timestamp_events": "['(Background noise-0.03-10.0)', '(Sawing-0.037-2.416)', '(Male speech, man speaking-1.024-2.511)', '(Male speech, man speaking-3.167-6.105)', '(Sawing-6.525-10.0)']"
  },
  "YTMEOrTGMymU.wav": {
    "caption": "People talk in the distance while music plays faintly, suggesting a social gathering or event. (Speech: 0.75, Music: 0.15)",
    "timestamp_events": "['(Water-0.118-10.0)', '(Hubbub, speech noise, speech babble-0.192-10.0)', '(Bird-5.928-9.993)']"
  },
  "YPr45BZooyBw.wav": {
    "caption": "A person snores loudly while soft music plays, occasionally interrupted by the sound of sonar in an art gallery.",
    "timestamp_events": "['(Sine wave-0.0-2.791)', '(Background noise-0.0-10.0)', '(Chant-1.825-9.222)']"
  },
  "YSDczdpkmaNM.wav": {
    "caption": "A loud explosion followed by another explosion shakes the ground as a thump and thud resonate in the forest.",
    "timestamp_events": "['(Sound effect-0.0-3.157)', '(Sound effect-3.344-4.546)', '(Sound effect-4.798-5.944)', '(Sound effect-6.106-7.308)', '(Wind-7.284-10.0)', '(Bird vocalization, bird call, bird song-7.463-7.698)', '(Bird vocalization, bird call, bird song-7.918-10.0)']"
  },
  "YokfsYhLADq0.wav": {
    "caption": "A man speaks followed by the sound of a door opening in a small room with pots, pans, and dishes.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.535)', '(Rustle-0.0-10.0)', '(Generic impact sounds-0.169-0.287)', '(Generic impact sounds-0.73-0.821)', '(Male speech, man speaking-1.108-2.425)', '(Generic impact sounds-1.186-1.356)', '(Generic impact sounds-2.503-2.621)', '(Generic impact sounds-3.051-3.207)', '(Generic impact sounds-3.598-3.703)', '(Male speech, man speaking-3.716-4.042)', '(Male speech, man speaking-4.316-5.711)', '(Generic impact sounds-4.902-5.059)', '(Generic impact sounds-6.141-6.284)', '(Male speech, man speaking-6.545-7.119)', '(Generic impact sounds-6.584-6.701)', '(Generic impact sounds-7.562-7.653)', '(Generic impact sounds-7.888-8.214)', '(Generic impact sounds-8.383-8.501)', '(Generic impact sounds-8.657-9.022)', '(Generic impact sounds-9.505-9.948)']"
  },
  "YUFVVOXkRw98.wav": {
    "caption": "People are talking while a typewriter is being used intermittently in a sauna.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-1.287)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.143-0.519)', '(Insect-1.249-1.768)', '(Female speech, woman speaking-1.58-3.687)', '(Insect-1.934-2.852)', '(Generic impact sounds-4.793-6.93)', '(Insect-6.96-7.803)', '(Insect-8.059-8.202)', '(Insect-8.427-8.584)', '(Generic impact sounds-8.698-8.924)', '(Insect-8.984-9.594)', '(Generic impact sounds-9.721-9.81)']"
  },
  "YU08Cnvf96G0.wav": {
    "caption": "A man speaks while music plays in the background, as the sound of a guitar accompanies them.",
    "timestamp_events": "['(Generic impact sounds-0.0-0.976)', '(Music-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Male speech, man speaking-1.134-1.906)', '(Generic impact sounds-2.189-3.0)', '(Male speech, man speaking-2.26-3.953)', '(Generic impact sounds-3.567-5.016)', '(Male speech, man speaking-5.307-7.843)', '(Generic impact sounds-6.504-7.118)', '(Generic impact sounds-7.811-8.244)', '(Male speech, man speaking-8.425-10.0)', '(Generic impact sounds-8.661-9.047)', '(Generic impact sounds-9.37-9.48)', '(Generic impact sounds-9.701-9.835)']"
  },
  "YRsyFCVt-eAk.wav": {
    "caption": "Insects buzz loudly as a man speaks outside in a rural area, possibly near a beehive or apiary.",
    "timestamp_events": "['(Bird vocalization, bird call, bird song-0.0-1.676)', '(Buzz-0.0-10.0)', '(Male speech, man speaking-1.299-1.676)', '(Conversation-1.327-9.036)', '(Male speech, man speaking-2.193-4.749)', '(Bird vocalization, bird call, bird song-4.372-5.14)', '(Male speech, man speaking-4.902-6.257)', '(Bird vocalization, bird call, bird song-5.95-6.453)', '(Male speech, man speaking-7.514-9.022)', '(Tick-7.612-7.723)', '(Bird vocalization, bird call, bird song-7.723-8.673)', '(Tick-8.017-8.156)', '(Bird vocalization, bird call, bird song-9.469-10.0)']"
  },
  "YyNhVXCMz4bg.wav": {
    "caption": "A large motor vehicle engine roars while people converse in the background, possibly in a busy street.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.608-0.815)', '(Generic impact sounds-1.454-1.632)', '(Generic impact sounds-2.134-2.375)', '(Generic impact sounds-3.454-3.632)', '(Generic impact sounds-4.416-4.601)', '(Generic impact sounds-5.488-5.839)', '(Hubbub, speech noise, speech babble-7.117-10.0)', '(Generic impact sounds-7.165-7.371)', '(Generic impact sounds-7.591-7.736)', '(Generic impact sounds-8.127-8.34)', '(Generic impact sounds-8.828-9.041)', '(Generic impact sounds-9.241-9.433)']"
  },
  "YT395i9eMaUE.wav": {
    "caption": "People talking and laughing while a slap and smack sound can be heard in a veterinarian's office.",
    "timestamp_events": "['(Shout-0.0-1.075)', '(Male speech, man speaking-0.0-1.131)', '(Background noise-0.0-10.0)', '(Laughter-0.517-2.402)', '(Shout-2.444-5.112)', '(Male speech, man speaking-2.486-3.31)', '(Laughter-4.218-6.732)', '(Male speech, man speaking-5.056-6.732)', '(Laughter-7.626-7.947)', '(Male speech, man speaking-8.059-8.436)', '(Male speech, man speaking-8.561-10.0)']"
  },
  "YXHzSL1ZUQmo.wav": {
    "caption": "A lively crowd erupts in applause and cheers as a catchy tune plays in an arena/performance setting. (Audio-visual label: Music; Tap)",
    "timestamp_events": "['(Music-0.0-10.0)', '(Tap dance-0.0-10.0)', '(Human voice-1.691-2.078)', '(Whoop-2.147-3.406)', '(Cheering-4.9-10.0)', '(Whoop-4.907-7.313)']"
  },
  "YZE5XnFfq4fc.wav": {
    "caption": "A group of people are talking and singing in the background while music plays in a discotheque.",
    "timestamp_events": "['(Male singing-0.0-0.395)', '(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Male singing-0.704-1.451)', '(Male singing-1.76-3.092)', '(Male singing-3.531-5.846)', '(Male singing-6.277-8.811)', '(Male singing-9.087-10.0)']"
  },
  "YSam83Obq6lI.wav": {
    "caption": "Sheep bleat while people talk in a veterinarian's office.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.191)', '(Conversation-0.0-8.481)', '(Background noise-0.0-9.11)', '(Child speech, kid speaking-0.438-0.69)', '(Bleat-0.554-0.961)', '(Male speech, man speaking-1.149-2.445)', '(Female speech, woman speaking-1.96-2.391)', '(Child speech, kid speaking-2.579-2.856)', '(Bleat-2.708-3.334)', '(Male speech, man speaking-3.278-3.873)', '(Bleat-3.898-4.086)', '(Bleat-4.292-4.925)', '(Male speech, man speaking-4.856-5.325)', '(Female speech, woman speaking-5.231-6.452)', '(Male speech, man speaking-6.484-7.391)', '(Child speech, kid speaking-7.748-8.033)', '(Male speech, man speaking-8.061-8.5)', '(Animal-8.662-9.11)']"
  },
  "Yv-6Vr68LqaQ.wav": {
    "caption": "A dog growls and roars, indicating the presence of an animal, possibly in a zoo or wildlife sanctuary.",
    "timestamp_events": "['(Animal-1.196-10.0)', '(Pant-2.152-4.146)', '(Noise-2.491-7.637)', '(Pant-5.922-7.487)']"
  },
  "YsxiVIGK5AEc.wav": {
    "caption": "A man passionately yells while music plays loudly in a crowded room, creating a lively atmosphere.",
    "timestamp_events": "['(Singing-0.0-10.0)', '(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Shout-0.0-10.0)']"
  },
  "YTpwYCxG7KVY.wav": {
    "caption": "Pigeons coo and flap their wings inside a small room, creating a soothing ambiance of bird sounds.",
    "timestamp_events": "['(Coo-0.0-9.588)', '(Background noise-0.0-9.588)', '(Generic impact sounds-0.061-0.285)', '(Generic impact sounds-0.382-0.718)', '(Generic impact sounds-0.794-1.054)', '(Generic impact sounds-1.146-1.344)', '(Generic impact sounds-1.441-1.869)', '(Generic impact sounds-1.955-2.078)', '(Generic impact sounds-2.2-2.342)', '(Generic impact sounds-2.48-2.673)', '(Generic impact sounds-2.755-2.969)', '(Generic impact sounds-3.132-3.386)', '(Generic impact sounds-3.498-3.727)', '(Generic impact sounds-3.804-4.16)', '(Generic impact sounds-4.277-4.71)', '(Generic impact sounds-4.832-5.118)', '(Generic impact sounds-5.189-5.291)', '(Generic impact sounds-5.362-5.79)', '(Generic impact sounds-5.866-6.034)', '(Generic impact sounds-6.207-6.375)', '(Generic impact sounds-6.518-6.803)', '(Generic impact sounds-6.9-6.991)', '(Generic impact sounds-7.093-7.328)', '(Generic impact sounds-7.409-7.745)', '(Generic impact sounds-7.862-8.183)', '(Generic impact sounds-8.295-9.212)', '(Generic impact sounds-9.334-9.553)']"
  },
  "YwaXgPy1lcVc.wav": {
    "caption": "A revving sound can be heard in a small room as music plays in the background.",
    "timestamp_events": "['(Effects unit-0.0-10.0)', '(Music-0.0-10.0)', '(Background noise-0.0-10.0)']"
  },
  "YVbNrg0CKeLs.wav": {
    "caption": "A woman speaks while food sizzles in a small room, creating a frying sound in a restaurant kitchen.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-0.666)', '(Music-0.0-10.0)', '(Sizzle-0.0-10.0)', '(Female speech, woman speaking-0.883-2.074)', '(Female speech, woman speaking-2.586-3.547)']"
  },
  "YVFWYrsLbPrQ.wav": {
    "caption": "People laugh and a door slams as someone gives a speech in a home theater.",
    "timestamp_events": "['(Laughter-0.0-0.379)', '(Background noise-0.0-10.0)', '(Laughter-0.567-1.433)', '(Laughter-1.639-4.34)', '(Conversation-2.052-10.0)', '(Male speech, man speaking-2.093-3.736)', '(Male speech, man speaking-3.928-4.333)', '(Shout-5.303-6.114)', '(Laughter-5.611-7.076)', '(Laughter-7.199-8.437)', '(Female speech, woman speaking-8.416-10.0)', '(Male speech, man speaking-8.808-10.0)', '(Laughter-9.289-10.0)']"
  },
  "YtnDk4oW36yA.wav": {
    "caption": "A man speaks as dishes, pots, and pans clank in a small room, suggesting a bustling kitchen environment.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.744)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.038-0.217)', '(Generic impact sounds-1.013-1.167)', '(Generic impact sounds-2.036-2.499)', '(Generic impact sounds-2.751-3.157)', '(Male speech, man speaking-2.784-3.596)', '(Generic impact sounds-3.304-3.474)', '(Generic impact sounds-3.669-4.051)', '(Male speech, man speaking-4.035-7.138)', '(Generic impact sounds-4.49-4.969)', '(Surface contact-4.863-5.229)', '(Generic impact sounds-6.439-6.553)', '(Generic impact sounds-6.951-7.739)', '(Surface contact-7.893-8.08)', '(Generic impact sounds-8.405-8.633)', '(Generic impact sounds-8.86-9.453)', '(Generic impact sounds-9.713-10.0)']"
  },
  "Yr70z9eOy7HQ.wav": {
    "caption": "Dishes clatter, pots and pans clang, and cutlery clinks as people engage in lively conversation in a bustling kitchen.",
    "timestamp_events": "['(Background noise-0.015-10.0)', '(Mechanisms-0.03-2.636)', '(Male speech, man speaking-1.274-1.731)', '(Male speech, man speaking-2.114-2.644)', '(Male speech, man speaking-3.211-4.801)', '(Male speech, man speaking-7.828-8.498)', '(Male speech, man speaking-8.586-10.0)']"
  },
  "YvcUpgcfbD9I.wav": {
    "caption": "A man speaks while water splashes and splatters in a natural outdoor setting, possibly near a stream or river.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.525)', '(Conversation-0.0-10.0)', '(Wind-0.0-10.0)', '(Water-0.0-10.0)', '(Male speech, man speaking-0.842-2.434)', '(Male speech, man speaking-4.067-4.579)', '(Male speech, man speaking-4.904-5.651)', '(Slosh-5.806-7.382)', '(Male speech, man speaking-5.871-6.585)', '(Male speech, man speaking-7.503-8.73)', '(Slosh-7.983-9.234)', '(Male speech, man speaking-9.518-10.0)']"
  },
  "YRu0GDcId1i8.wav": {
    "caption": "A truck engine roars loudly while an adult female voice is heard in the background, possibly near a road.",
    "timestamp_events": "['(Wind-2.093-10.0)', '(Bus-2.107-10.0)', '(Video game sound-2.107-10.0)', '(Accelerating, revving, vroom-3.591-4.725)', '(Accelerating, revving, vroom-5.248-6.278)', '(Air brake-5.55-5.715)', '(Accelerating, revving, vroom-6.746-7.983)', '(Air brake-7.138-7.447)', '(Air brake-8.65-8.828)']"
  },
  "YZVaAtQUvJqk.wav": {
    "caption": "A woman delivers a speech inside a small room, with the sound of writing in the background.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-1.202)', '(Background noise-0.0-10.0)', '(Writing-1.367-1.512)', '(Writing-1.601-2.758)', '(Female speech, woman speaking-1.643-4.053)', '(Writing-2.875-4.115)', '(Female speech, woman speaking-4.487-5.134)', '(Writing-4.515-6.064)', '(Female speech, woman speaking-5.32-6.105)', '(Writing-6.202-6.539)', '(Writing-6.718-9.384)', '(Female speech, woman speaking-9.735-10.0)']"
  },
  "YxpHVSUkczKU.wav": {
    "caption": "The machine with a lot of gears is constantly running.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Bell-0.008-1.738)', '(Generic impact sounds-0.677-1.196)', '(Generic impact sounds-1.52-1.896)', '(Generic impact sounds-2.122-2.777)', '(Gears-2.476-10.0)', '(Bell-2.558-5.154)', '(Generic impact sounds-5.154-5.5)', '(Generic impact sounds-6.204-6.504)', '(Generic impact sounds-7.398-7.69)', '(Generic impact sounds-8.382-8.781)', '(Generic impact sounds-9.609-10.0)']"
  },
  "YP2yp7rhU3wM.wav": {
    "caption": "A basketball bounces as the crowd erupts in cheers and applause, creating an electric atmosphere in a sports arena.",
    "timestamp_events": "['(Male speech, man speaking-0.128-2.062)', '(Shout-0.143-2.114)', '(Crowd-0.151-10.0)', '(Clapping-1.535-2.566)', '(Shout-2.453-3.213)', '(Basketball bounce-3.491-3.958)', '(Shout-3.996-10.0)', '(Whistling-5.132-6.358)', '(Clapping-6.275-7.675)', '(Child speech, kid speaking-9.406-10.0)']"
  },
  "YujFf8dufwBc.wav": {
    "caption": "A wild animal growls repeatedly, resembling the roaring sound of lions and tigers, indicating a presence of wild animals in their natural habitat.",
    "timestamp_events": "['(Roar-0.0-0.613)', '(Background noise-0.0-10.0)', '(Bird vocalization, bird call, bird song-0.029-0.532)', '(Roar-0.694-1.486)', '(Roar-1.591-3.366)', '(Bird vocalization, bird call, bird song-3.283-3.772)', '(Roar-3.472-10.0)', '(Bird vocalization, bird call, bird song-6.0-6.811)', '(Bird vocalization, bird call, bird song-7.323-8.622)']"
  },
  "YOs3XxJputFw.wav": {
    "caption": "A man's speech is accompanied by the sizzling sound of food frying in a pan, suggesting a kitchen environment.",
    "timestamp_events": "['(Sizzle-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Brief tone-0.745-1.947)', '(Male speech, man speaking-1.094-2.995)', '(Male speech, man speaking-3.149-4.522)', '(Male speech, man speaking-6.293-6.789)', '(Male speech, man speaking-8.243-10.0)']"
  },
  "YP5bQMKcpfWY.wav": {
    "caption": "The sound of a skateboard rattling and rattling can be heard, indicating a skateboarder performing tricks in a playground.",
    "timestamp_events": "['(Mechanisms-0.0-0.81)', '(Wind-0.0-10.0)', '(Skateboard-0.0-10.0)', '(Squeal-1.817-2.402)', '(Squeal-4.311-4.652)', '(Squeal-6.212-7.203)']"
  },
  "YX7hjqG1Hxp8.wav": {
    "caption": "A man's voice is heard speaking while crumpling paper in a small room, creating a distinct sound.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.292)', '(Crumpling, crinkling-0.0-0.691)', '(Background noise-0.0-10.0)', '(Crumpling, crinkling-1.103-2.918)', '(Male speech, man speaking-2.952-4.67)', '(Crumpling, crinkling-3.282-3.557)', '(Male speech, man speaking-4.897-6.952)', '(Crumpling, crinkling-5.344-8.031)', '(Male speech, man speaking-8.34-9.467)', '(Crumpling, crinkling-9.0-9.509)', '(Crumpling, crinkling-9.66-10.0)']"
  },
  "YRcFfWvrIyI4.wav": {
    "caption": "A whistle blows as people converse and a horse neighs in the countryside.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Male speech, man speaking-0.039-3.024)', '(Bird vocalization, bird call, bird song-0.465-1.362)', '(Music-1.402-7.913)', '(Bird vocalization, bird call, bird song-1.63-2.906)', '(Male speech, man speaking-3.236-3.449)', '(Female speech, woman speaking-3.457-3.89)', '(Bird vocalization, bird call, bird song-4.11-4.268)', '(Male speech, man speaking-4.409-5.78)', '(Bird vocalization, bird call, bird song-5.299-5.386)', '(Bird vocalization, bird call, bird song-6.11-6.992)', '(Bird vocalization, bird call, bird song-7.283-7.913)', '(Male speech, man speaking-7.528-8.638)', '(Music-8.157-9.118)', '(Male speech, man speaking-8.74-9.165)', '(Male speech, man speaking-9.362-10.0)', '(Music-9.409-10.0)']"
  },
  "YoQt7cyDuBHY.wav": {
    "caption": "A man speaks followed by light banging sounds as music, keyboard, and synthesizer play in a music studio.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.98)', '(Background noise-0.0-7.938)', '(Male speech, man speaking-1.804-2.327)', '(Male speech, man speaking-2.681-3.55)', '(Male speech, man speaking-3.829-5.759)', '(Mechanisms-7.85-10.0)']"
  },
  "YTpEUM7UxS6k.wav": {
    "caption": "A man speaks while a crowd talks in the background, with the sound of a basketball bouncing, indicating a basketball game.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.674)', '(Crowd-0.0-10.0)', '(Basketball bounce-0.505-0.665)', '(Basketball bounce-1.124-1.411)', '(Basketball bounce-1.797-2.099)', '(Male speech, man speaking-1.881-5.115)', '(Basketball bounce-3.117-3.589)', '(Basketball bounce-4.22-4.484)', '(Male speech, man speaking-5.31-6.181)', '(Basketball bounce-5.424-5.631)', '(Male speech, man speaking-6.342-10.0)', '(Basketball bounce-6.423-7.064)', '(Basketball bounce-7.649-7.867)', '(Basketball bounce-8.096-8.36)', '(Basketball bounce-8.761-8.911)', '(Basketball bounce-9.094-9.278)', '(Basketball bounce-9.484-9.679)']"
  },
  "YU6jdeOMpxZQ.wav": {
    "caption": "People are talking and music is playing as a man on a microphone rapping to a group of people on stage with flags.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Male speech, man speaking-2.931-3.859)', '(Male speech, man speaking-4.175-6.313)', '(Male speech, man speaking-9.406-10.0)']"
  },
  "YUyD8DnQdA4I.wav": {
    "caption": "A man speaks while a dog growls and barks in a veterinarians_office, creating a Bark; Domestic animals, pets; Speech; Dog; Growling; Animal audio event.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Growling-0.127-0.876)', '(Bark-0.711-0.89)', '(Bark-1.701-1.845)', '(Human voice-1.87-2.795)', '(Bark-2.808-2.973)', '(Male speech, man speaking-3.323-4.278)', '(Bark-4.608-4.828)', '(Growling-4.643-5.804)', '(Male speech, man speaking-5.426-6.835)', '(Human voice-5.547-7.128)', '(Growling-6.546-10.0)', '(Bark-8.931-9.103)']"
  },
  "YxQfUoZ4qDsk.wav": {
    "caption": "A man passionately delivers a speech while a cheering crowd energizes the atmosphere in a television studio.",
    "timestamp_events": "['(Shout-0.0-1.287)', '(Crowd-0.0-10.0)', '(Male speech, man speaking-0.534-3.273)', '(Female speech, woman speaking-3.266-3.792)', '(Male speech, man speaking-3.943-4.695)', '(Male speech, man speaking-5.117-7.412)', '(Shout-7.464-10.0)', '(Male speech, man speaking-9.142-10.0)']"
  },
  "YZ9XF-0Xfma4.wav": {
    "caption": "A man speaks over a radio amidst the sound of an aircraft engine running in the background during a rainstorm.",
    "timestamp_events": "['(Video game sound-0.0-10.0)', '(Car-0.0-10.0)', '(Male speech, man speaking-0.241-0.677)', '(Accelerating, revving, vroom-1.261-10.0)', '(Male speech, man speaking-2.076-2.821)', '(Male speech, man speaking-3.417-4.255)', '(Male speech, man speaking-5.183-5.975)', '(Male speech, man speaking-6.17-7.706)', '(Male speech, man speaking-9.484-10.0)']"
  },
  "YquOLJIEI3Po.wav": {
    "caption": "People cheer and scream as fireworks explode in the sky, creating a thrilling atmosphere of entertainment and celebration.",
    "timestamp_events": "['(Shout-0.0-1.175)', '(Crowd-0.0-2.995)', '(Wind-0.0-3.021)', '(Fireworks-0.062-2.995)', '(Shout-1.403-3.011)', '(Wind-3.096-10.0)', '(Crowd-3.117-10.0)', '(Fireworks-3.117-10.0)']"
  },
  "Yrj7xnzNtnf0.wav": {
    "caption": "A woman speaks and laughs as the audio event, while two women sit together in a conference center.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Conversation-0.148-10.0)', '(Female speech, woman speaking-0.175-1.323)', '(Breathing-1.426-1.962)', '(Female speech, woman speaking-1.433-6.856)', '(Laughter-4.086-6.835)', '(Laughter-7.165-7.639)', '(Female speech, woman speaking-7.261-7.454)', '(Breathing-7.756-8.065)', '(Female speech, woman speaking-8.052-10.0)']"
  },
  "Yu8ifKT-skCQ.wav": {
    "caption": "A guitar is strummed while music plays in the background, creating a musical ambiance in an orchestra pit.",
    "timestamp_events": "['(Male singing-0.0-0.33)', '(Music-0.0-10.0)', '(Background noise-0.0-10.0)', '(Male singing-0.477-1.208)', '(Male singing-4.538-9.161)']"
  },
  "YsiEO1iky8Rs.wav": {
    "caption": "A man delivers a speech while the audience chuckles and chortles in a conference center.",
    "timestamp_events": "['(Male speech, man speaking-0.0-5.026)', '(Background noise-0.008-10.0)', '(Laughter-4.978-7.077)', '(Male speech, man speaking-5.553-10.0)']"
  },
  "YshS4pI9IT8Y.wav": {
    "caption": "Rock and roll music blares as people yell and sing in a discotheque, creating a lively and energetic atmosphere.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Shout-0.37-1.064)', '(Male singing-1.082-2.313)', '(Male singing-2.643-4.766)', '(Shout-2.713-3.25)', '(Male singing-6.663-9.451)', '(Shout-7.958-9.497)']"
  },
  "YUTfe2x4OL7k.wav": {
    "caption": "A hair dryer hums as a woman works, creating a soothing ambiance in a bathroom.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-2.155)', '(Hair dryer-0.0-5.268)', '(Female speech, woman speaking-2.663-4.34)', '(Female speech, woman speaking-5.261-6.526)', '(Music-5.268-10.0)', '(Television-5.289-10.0)', '(Female speech, woman speaking-7.33-7.715)', '(Male speech, man speaking-8.21-10.0)', '(Female speech, woman speaking-8.663-8.911)']"
  },
  "Ythno6oZ6Glo.wav": {
    "caption": "A woman speaks followed by a beep, as rodents scurry and patter in the background in a rodent-infested environment.",
    "timestamp_events": "['(Generic impact sounds-0.0-0.198)', '(Female speech, woman speaking-0.0-4.727)', '(Background noise-0.0-10.0)', '(Generic impact sounds-1.874-4.249)', '(Mechanisms-2.91-3.26)', '(Mechanisms-3.632-3.97)', '(Mechanisms-4.249-4.645)', '(Generic impact sounds-5.25-5.413)', '(Generic impact sounds-6.205-6.356)', '(Female speech, woman speaking-6.589-7.602)', '(Generic impact sounds-7.264-7.451)', '(Mechanisms-7.52-8.103)', '(Generic impact sounds-7.975-8.137)', '(Generic impact sounds-8.638-9.15)', '(Female speech, woman speaking-9.255-10.0)', '(Mechanisms-9.267-9.686)']"
  },
  "YNhyaVMoGrdI.wav": {
    "caption": "A woman laughs and talks while ducks quack in the background, creating a cheerful atmosphere near a pond.",
    "timestamp_events": "['(Laughter-0.0-2.637)', '(Background noise-0.0-10.0)', '(Baby laughter-1.135-3.856)', '(Female speech, woman speaking-3.726-4.733)', '(Conversation-3.767-8.015)', '(Female speech, woman speaking-4.977-6.171)', '(Laughter-6.009-10.0)', '(Female speech, woman speaking-6.951-8.015)', '(Baby laughter-9.152-10.0)']"
  },
  "YwIB2TkDwAMo.wav": {
    "caption": "A dance performance is happening, followed by a crowd erupting in applause and cheers at a rock and roll concert.",
    "timestamp_events": "['(Music-0.015-10.0)', '(Female singing-0.059-1.318)', '(Female singing-1.782-3.881)', '(Female singing-4.337-6.201)', '(Female singing-6.635-7.416)', '(Clapping-7.349-10.0)']"
  },
  "YUHnsf6RRY5Q.wav": {
    "caption": "A woman delivers a speech while a crowd cheers, accompanied by music, in a lively event.",
    "timestamp_events": "['(Music-0.0-1.554)', '(Male speech, man speaking-0.295-1.539)', '(Crowd-1.687-10.0)', '(Music-1.694-10.0)', '(Female speech, woman speaking-2.821-3.94)', '(Male speech, man speaking-2.887-3.896)', '(Female speech, woman speaking-4.124-6.223)', '(Male speech, man speaking-6.414-6.863)', '(Female speech, woman speaking-6.944-8.321)', '(Male speech, man speaking-6.952-8.321)', '(Female speech, woman speaking-8.542-10.0)']"
  },
  "YViE5OmQVP1c.wav": {
    "caption": "A man confidently delivers a narration, while engaging in a conversation in an academic reception.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.406)', '(Conversation-0.0-10.0)', '(Background noise-0.0-10.0)', '(Female speech, woman speaking-1.467-3.165)', '(Female speech, woman speaking-3.509-6.072)', '(Female speech, woman speaking-6.416-10.0)']"
  },
  "YycFchFdtQrE.wav": {
    "caption": "A lively crowd erupts in cheers and applause as energetic music fills the large auditorium during a performance.",
    "timestamp_events": "['(Singing-0.0-1.498)', '(Music-0.0-10.0)', '(Cheering-1.932-8.164)', '(Singing-7.913-10.0)']"
  },
  "YQpJX3DpjuMo.wav": {
    "caption": "A woman speaks while birds chirp in the background, creating a serene atmosphere in a canyon.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-0.929)', '(Wind-0.0-10.0)', '(Background noise-0.0-10.0)', '(Chirp, tweet-1.009-2.053)', '(Chirp, tweet-2.351-2.5)', '(Female speech, woman speaking-2.351-3.349)', '(Female speech, woman speaking-4.576-5.585)', '(Chirp, tweet-4.633-5.929)', '(Chirp, tweet-6.342-7.351)', '(Female speech, woman speaking-7.156-8.555)', '(Female speech, woman speaking-9.048-9.805)']"
  },
  "Yt6rBv6zp5Fo.wav": {
    "caption": "A car engine revs up and down, emitting a heavy, low-frequency sound in a home theater environment.",
    "timestamp_events": "['(Accelerating, revving, vroom-0.0-0.591)', '(Background noise-0.0-10.0)', '(Car-0.0-10.0)', '(Accelerating, revving, vroom-1.017-1.406)', '(Accelerating, revving, vroom-1.87-3.568)', '(Tire squeal, skidding-3.702-5.228)', '(Tire squeal, skidding-6.156-7.532)', '(Accelerating, revving, vroom-7.831-10.0)']"
  },
  "YRtO-PZ9-d-c.wav": {
    "caption": "A man delivers a speech as the crowd applauds in a theater, accompanied by music and occasional percussion.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.309)', '(Mechanisms-0.0-10.0)', '(Male speech, man speaking-1.474-3.529)', '(Male speech, man speaking-3.845-6.808)', '(Music-5.694-10.0)', '(Clapping-5.736-10.0)']"
  },
  "YwEPKRycf-8Q.wav": {
    "caption": "A woman speaks while repeatedly tapping on a hard surface in a small room.",
    "timestamp_events": "['(Background noise-0.008-10.0)', '(Male speech, man speaking-0.847-3.439)', '(Male speech, man speaking-3.653-4.455)', '(Tap-4.809-5.243)', '(Tap-5.464-6.922)', '(Tap-7.305-10.0)']"
  },
  "Yw7B6VroMY4k.wav": {
    "caption": "A distorted guitar plays accompanied by music in a television studio as a man speaks through an effects unit.",
    "timestamp_events": "['(Music-0.0-7.937)', '(Effects unit-0.0-7.969)', '(Mechanisms-0.902-1.226)', '(Mechanisms-5.633-10.0)', '(Male speech, man speaking-6.512-7.669)', '(Male speech, man speaking-7.882-8.764)', '(Male speech, man speaking-8.89-9.948)']"
  },
  "YRX4D5HJBj5E.wav": {
    "caption": "The sound of a power tool motor running and vibrating, accompanied by metal scraping, suggests a construction site.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Tap-0.093-0.355)', '(Tap-1.202-1.491)', '(Tap-2.235-2.586)', '(Tap-2.751-2.903)', '(Tap-4.535-4.673)', '(Tap-4.886-4.983)', '(Tap-5.548-5.665)', '(Tap-5.899-6.037)', '(Tap-6.367-6.539)', '(Tap-7.318-7.841)', '(Tap-8.475-8.564)', '(Tap-8.785-8.97)', '(Tap-9.515-9.673)']"
  },
  "YuYwvfxWF460.wav": {
    "caption": "The sound of food sizzling in a pan can be heard as a man speaks, indicating that someone is frying food in a kitchen.",
    "timestamp_events": "['(Male speech, man speaking-0.0-3.537)', '(Frying (food)-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Dishes, pots, and pans-4.485-4.775)', '(Male speech, man speaking-4.838-6.255)', '(Dishes, pots, and pans-7.161-7.583)', '(Male speech, man speaking-7.77-8.558)']"
  },
  "Yj1rMLzpK-AY.wav": {
    "caption": "Gunshots ring out followed by a man speaking, amidst background music and speech, implying a scene of intense action.",
    "timestamp_events": "['(Gunshot, gunfire-0.0-0.619)', '(Gunshot, gunfire-0.837-1.72)', '(Generic impact sounds-1.411-1.56)', '(Gunshot, gunfire-1.938-3.635)', '(Music-3.577-6.299)', '(Male speech, man speaking-4.989-7.856)', '(Clapping-5.0-5.229)', '(Clapping-5.344-5.585)', '(Clapping-5.665-5.929)', '(Clapping-6.307-6.502)', '(Whoosh, swoosh, swish-6.835-7.42)', '(Generic impact sounds-7.936-8.085)', '(Male speech, man speaking-7.982-10.0)', '(Generic impact sounds-9.335-9.461)']"
  },
  "YpaejR6Xspm0.wav": {
    "caption": "A vehicle engine hums while a group of people talk and laugh in an urban setting.",
    "timestamp_events": "['(Cheering-0.0-1.642)', '(Music-0.0-6.439)', '(Crowd-0.0-6.484)', '(Male speech, man speaking-1.232-2.077)', '(Single-lens reflex camera-2.345-2.564)', '(Human voice-2.572-2.824)', '(Male speech, man speaking-2.8-5.518)', '(Laughter-5.541-6.624)', '(Brief tone-6.423-6.983)', '(Male speech, man speaking-6.706-8.754)', '(Motor vehicle (road)-6.951-10.0)', '(Human voice-9.779-10.0)']"
  },
  "YWA74G58qF04.wav": {
    "caption": "A man chuckles and gives a speech in a small room, creating an atmosphere of introspection and focus.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.253)', '(Background noise-0.0-10.0)', '(Humming-0.273-0.591)', '(Breathing-0.28-0.688)', '(Male speech, man speaking-0.709-2.825)', '(Male speech, man speaking-2.97-3.869)', '(Male speech, man speaking-4.07-6.608)', '(Human voice-5.979-6.248)', '(Breathing-6.643-6.961)', '(Male speech, man speaking-6.954-10.0)', '(Giggle-8.911-9.264)']"
  },
  "Y7pqRqXjqeX4.wav": {
    "caption": "A child coughs as a woman speaks in a small room, possibly a laundromat, according to the audio-visual label.",
    "timestamp_events": "['(Female speech, woman speaking-9.246-10.0)', '(Tick-9.118-9.219)', '(Throat clearing-6.373-6.628)', '(Hands-5.842-5.948)', '(Breathing-1.891-2.565)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-1.641-1.832)']"
  },
  "OBPySxWxlcE.wav": {
    "caption": "A soothing melody plays softly as glass shatters abruptly, echoing in a small room with a bird chirping.",
    "timestamp_events": "['(Mechanisms-0.0-3.589)', '(Music-0.0-4.011)', '(Human voice-0.053-1.074)', '(Whistling-0.084-0.284)', '(Bird vocalization, bird call, bird song-0.2-0.389)', '(Animal-0.358-0.716)', '(Whistling-0.874-2.916)', '(Animal-1.105-1.463)', '(Human voice-1.368-2.411)', '(Bird vocalization, bird call, bird song-1.568-1.968)', '(Animal-1.916-2.242)', '(Bird vocalization, bird call, bird song-2.358-2.716)', '(Animal-2.684-3.074)', '(Bird vocalization, bird call, bird song-3.147-3.632)', '(Whistling-3.337-3.611)', '(Animal-3.495-4.0)', '(Generic impact sounds-3.821-4.095)', '(Bird flight, flapping wings-3.895-4.484)', '(Generic impact sounds-4.4-5.611)', '(Tick-5.621-6.316)', '(Music-6.537-10.0)', '(Generic impact sounds-9.6-9.811)']"
  },
  "3UAvkNVtoak.wav": {
    "caption": "A loud explosion reverberates through the air, followed by a man speaking, inside a shattered garage.",
    "timestamp_events": "['(Sound effect-0.0-0.559)', '(Glass shatter-0.567-2.126)', '(Explosion-2.165-3.961)', '(Male speech, man speaking-3.976-6.465)', '(Male speech, man speaking-6.614-7.402)', '(Breathing-7.386-7.693)', '(Male speech, man speaking-7.764-9.055)', '(Male speech, man speaking-9.252-10.0)']"
  },
  "Y9dw2tHprouQ.wav": {
    "caption": "The bass guitar plays alongside music, creating a musical atmosphere with various instruments.",
    "timestamp_events": "['(Music-0.0-10.0)']"
  },
  "Yp6C0ZGTj1Qw.wav": {
    "caption": "The sound of a power tool drilling is followed by footsteps shuffling on a hard surface, indicating someone working with tools in an outdoor, rural or natural environment.",
    "timestamp_events": "['(Chainsaw-0.0-4.084)', '(Wind-0.0-10.0)', '(Chirp, tweet-8.174-8.664)', '(Generic impact sounds-9.341-9.607)']"
  },
  "YADwAeRNCtHY.wav": {
    "caption": "Water splashes as people talk in the background on a boat, creating a lively atmosphere on the water.",
    "timestamp_events": "['(Breathing-0.0-1.145)', '(Waves, surf-0.0-10.0)', '(Wind-0.0-10.0)', '(Wind noise (microphone)-0.0-10.0)', '(Generic impact sounds-0.259-0.315)', '(Breathing-1.352-2.666)', '(Tick-2.147-2.23)', '(Tick-2.348-2.41)', '(Generic impact sounds-2.535-2.666)', '(Breathing-3.012-4.132)', '(Tick-3.123-3.199)', '(Tick-3.434-4.049)', '(Tick-4.153-4.222)', '(Female speech, woman speaking-4.858-6.352)', '(Tick-4.879-4.99)', '(Breathing-6.172-7.894)', '(Generic impact sounds-8.745-8.932)', '(Breathing-9.257-10.0)']"
  },
  "Y8-tsgalx0DI.wav": {
    "caption": "A man speaks followed by music playing on a guitar in a music studio, with the audio-visual label indicating Music; Tap; Speech.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.505)', '(Background noise-0.0-10.0)', '(Breathing-0.478-0.87)', '(Male speech, man speaking-0.87-2.753)', '(Male speech, man speaking-3.076-5.117)', '(Male speech, man speaking-5.516-7.227)', '(Male speech, man speaking-7.591-8.546)', '(Male speech, man speaking-8.815-9.632)', '(Male speech, man speaking-9.763-10.0)']"
  },
  "YleJ6fBbDoEU.wav": {
    "caption": "A choir sings gospel music as a classical music piece plays in the background, accompanied by a music ensemble.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Choir-1.14-10.0)']"
  },
  "ER1chrpTv8M.wav": {
    "caption": "People scream and yell while a cat meows, creating a chaotic atmosphere in a location that may be crowded or lively.",
    "timestamp_events": "['(Wind-0.465-4.624)', '(Male speech, man speaking-0.48-0.99)', '(Shout-0.48-0.99)', '(Wind noise (microphone)-1.009-1.25)', '(Male speech, man speaking-1.246-2.598)', '(Shout-1.272-2.583)', '(Bleat-2.572-3.785)', '(Giggle-3.86-4.624)']"
  },
  "Y5d7CDqONWAA.wav": {
    "caption": "A man speaks in a small room, with a high probability of speech in the audio event.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Male speech, man speaking-0.037-1.775)', '(Male speech, man speaking-1.664-1.709)', '(Male speech, man speaking-2.776-4.08)', '(Male speech, man speaking-4.514-5.626)', '(Male speech, man speaking-6.171-7.231)', '(Male speech, man speaking-8.388-10.0)']"
  },
  "YqKQYKUBC3gM.wav": {
    "caption": "A man delivers a speech in a small room, with the audio event labeled as \"Speech\" in the audio-visual label.",
    "timestamp_events": "['(Background noise-0.008-10.0)', '(Male speech, man speaking-0.015-0.891)', '(Male speech, man speaking-1.134-4.08)', '(Male speech, man speaking-4.588-7.106)', '(Male speech, man speaking-7.261-7.607)', '(Male speech, man speaking-8.093-8.343)', '(Male speech, man speaking-8.513-10.0)']"
  },
  "YfYfduD2yOyE.wav": {
    "caption": "A cat growls as it interacts with other animals in a domestic setting, possibly indicating territorial behavior.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.077-0.205)', '(Breathing-0.371-0.819)', '(Generic impact sounds-1.345-1.498)', '(Surface contact-1.434-1.652)', '(Generic impact sounds-2.023-2.177)', '(Growling-2.151-4.02)', '(Surface contact-4.507-4.853)', '(Growling-4.853-5.775)', '(Generic impact sounds-5.378-5.711)', '(Generic impact sounds-6.172-6.325)', '(Generic impact sounds-6.492-6.671)', '(Generic impact sounds-6.85-6.94)', '(Generic impact sounds-7.529-7.657)', '(Generic impact sounds-8.105-8.284)', '(Generic impact sounds-8.54-8.809)', '(Growling-8.796-10.0)', '(Generic impact sounds-9.539-9.706)', '(Generic impact sounds-9.821-9.949)']"
  },
  "Y8ivMLVc3utk.wav": {
    "caption": "A dog growls and barks in a domestic environment, possibly indicating the presence of other animals or intruders.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Dog-0.008-0.074)', '(Dog-0.251-0.479)', '(Dog-0.648-1.002)', '(Dog-1.208-1.606)', '(Dog-1.819-2.173)', '(Dog-2.246-2.622)', '(Dog-2.725-3.086)', '(Dog-3.196-3.483)', '(Dog-3.631-3.903)', '(Dog-3.991-4.19)', '(Dog-4.315-4.603)', '(Dog-5.472-6.613)', '(Bird-6.598-8.255)', '(Dog-8.167-8.388)', '(Dog-9.043-9.22)', '(Dog-9.441-9.639)', '(Dog-9.706-10.0)']"
  },
  "YViL1SkWhj-s.wav": {
    "caption": "A child repeatedly coughs and clears their throat while speaking in an art school classroom.",
    "timestamp_events": "['(Human voice-0.0-0.256)', '(Background noise-0.0-10.0)', '(Generic impact sounds-0.309-0.61)', '(Cough-0.948-1.407)', '(Cough-1.558-1.926)', '(Breathing-2.039-2.37)', '(Cough-2.551-2.716)', '(Female speech, woman speaking-2.777-3.461)', '(Cough-3.491-3.657)', '(Generic impact sounds-4.065-4.54)', '(Generic impact sounds-5.103-5.536)', '(Cough-5.726-5.974)', '(Breathing-6.148-6.734)', '(Cough-7.028-7.224)', '(Breathing-7.389-7.743)', '(Cough-7.863-8.104)', '(Breathing-8.232-9.338)', '(Tick-9.105-9.18)', '(Cough-9.406-10.0)']"
  },
  "YdqWivv-H95c.wav": {
    "caption": "A group of people passionately chant and sing a battle cry, creating a lively and energetic atmosphere.",
    "timestamp_events": "['(Battle cry-9.087-10.0)', '(Walk, footsteps-8.685-10.0)', '(Hubbub, speech noise, speech babble-0.0-10.0)']"
  },
  "Yhf5bbqXxnTE.wav": {
    "caption": "A banjo plays with a bluegrass music in the background as a man in a red shirt performs on stage.",
    "timestamp_events": "['(Music-0.0-10.0)']"
  },
  "YKXJjTfNxihk.wav": {
    "caption": "A car horn honks multiple times inside a small room, indicating a vehicle horn event.",
    "timestamp_events": "['(Tap-5.775-5.928)', '(Vehicle horn, car horn, honking, toot-2.784-4.195)', '(Mechanisms-0.0-9.648)', '(Generic impact sounds-9.433-9.633)']"
  },
  "YIsiP-gu5dvE.wav": {
    "caption": "Birds chirp and a duck quacks as an owl hoots in an aquarium.",
    "timestamp_events": "['(Hoot-0.0-0.272)', '(Bird vocalization, bird call, bird song-0.0-10.0)', '(Hoot-0.395-0.705)', '(Hoot-1.199-2.361)', '(Hoot-2.54-6.993)', '(Hoot-7.22-7.681)', '(Hoot-9.598-10.0)']"
  },
  "8oN13PMMPbY.wav": {
    "caption": "A person whistles a song in an art studio while music plays in the background.",
    "timestamp_events": "['(Background noise-0.127-9.825)', '(Whistling-0.134-9.818)', '(Music-9.818-10.0)']"
  },
  "Y4yDtaQ6k9eM.wav": {
    "caption": "A person whispers while someone speaks in a small room, possibly in a beauty salon.",
    "timestamp_events": "['(Whispering-5.276-5.819)', '(Tap-8.339-8.48)', '(Giggle-6.803-7.094)', '(Background noise-0.0-10.0)', '(Human sounds-2.858-2.984)']"
  },
  "YNixh6EiMOL4.wav": {
    "caption": "Loud explosions boom while music plays and someone speaks, creating an intense atmosphere in a movie theater.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.444)', '(Music-0.0-10.0)', '(Video game sound-0.0-10.0)', '(Walk, footsteps-0.948-1.121)', '(Generic impact sounds-1.272-2.175)', '(Walk, footsteps-2.37-2.498)', '(Generic impact sounds-2.573-3.251)', '(Walk, footsteps-3.093-3.311)', '(Walk, footsteps-3.401-3.604)', '(Generic impact sounds-3.98-7.878)', '(Walk, footsteps-8.743-8.917)', '(Walk, footsteps-9.744-9.895)']"
  },
  "rCHnMVnhA0w.wav": {
    "caption": "The sound of a computer keyboard typing is accompanied by music in a music studio.",
    "timestamp_events": "['(Beep, bleep-0.0-0.313)', '(Music-0.0-10.0)', '(Computer keyboard-0.235-2.412)', '(Beep, bleep-2.347-2.751)', '(Computer keyboard-3.103-3.429)', '(Computer keyboard-3.611-5.945)', '(Beep, bleep-4.407-4.824)', '(Beep, bleep-5.398-5.893)', '(Computer keyboard-6.31-6.597)', '(Computer keyboard-6.806-7.301)', '(Computer keyboard-7.536-8.644)', '(Beep, bleep-8.449-8.853)']"
  },
  "YmFUoPzYN4d8.wav": {
    "caption": "The sound of music fills the air as a doorbell rings, creating a lively atmosphere in a house.",
    "timestamp_events": "['(Music-0.0-2.947)', '(Male singing-0.0-2.947)', '(Video game sound-0.0-4.196)', '(Mechanisms-2.947-4.193)', '(Doorbell-3.005-4.203)', '(Video game sound-7.55-10.0)', '(Music-7.556-10.0)']"
  },
  "fqUI3EH5SqI.wav": {
    "caption": "A motor vehicle engine is running and vibrating while an adult male speaks in the background in a blender-filled kitchen.",
    "timestamp_events": "['(Blender, food processor-0.0-10.0)', '(Male speech, man speaking-1.323-1.825)', '(Male speech, man speaking-2.333-3.364)']"
  },
  "1hizec7Ei2Y.wav": {
    "caption": "A man speaks followed by a series of gunshots in a rural area, with the sound of a heart murmur in the background.",
    "timestamp_events": "['(Wind-0.0-3.063)', '(Water-0.0-3.079)', '(Male speech, man speaking-0.039-1.402)', '(Wind noise (microphone)-1.331-1.85)', '(Male speech, man speaking-1.567-2.693)', '(Heart sounds, heartbeat-5.11-5.409)', '(Background noise-5.11-9.425)', '(Heart sounds, heartbeat-5.724-5.953)', '(Heart sounds, heartbeat-6.291-6.606)', '(Heart sounds, heartbeat-6.89-7.15)', '(Heart sounds, heartbeat-7.512-7.669)', '(Heart sounds, heartbeat-7.858-8.055)', '(Heart sounds, heartbeat-8.189-8.339)', '(Heart sounds, heartbeat-8.52-8.717)', '(Generic impact sounds-8.898-9.37)']"
  },
  "YRoe6w-1SJz8.wav": {
    "caption": "A man plays an electric guitar accompanied by music in a small room, creating a musical atmosphere.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Electronic tuner-0.0-10.0)']"
  },
  "YLa6VR4iJKcU.wav": {
    "caption": "The sound of a jingle and tinkling can be heard, suggesting a cheerful atmosphere with music playing in the background.",
    "timestamp_events": "['(Music-0.128-10.0)']"
  },
  "YqErxs0eK6E8.wav": {
    "caption": "Birds chirp and tweet as crickets and insects create a symphony of sounds in a natural environment.",
    "timestamp_events": "['(Insect-0.0-1.075)', '(Mechanisms-0.0-10.0)', '(Insect-1.713-2.727)', '(Insect-3.645-3.802)', '(Insect-4.012-4.309)', '(Insect-4.624-4.79)', '(Insect-5.184-5.516)', '(Insect-5.621-6.25)', '(Insect-6.364-6.469)', '(Insect-6.687-8.252)', '(Insect-8.706-8.82)', '(Tick-8.872-8.942)', '(Insect-9.607-9.72)']"
  },
  "Yq10cul64AYo.wav": {
    "caption": "A child speaks followed by a man speaking and a baby crying in a small room.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.346-0.677)', '(Child speech, kid speaking-0.843-1.591)', '(Human voice-1.591-1.787)', '(Surface contact-1.701-2.118)', '(Child speech, kid speaking-1.992-2.496)', '(Generic impact sounds-2.449-3.165)', '(Generic impact sounds-3.732-4.142)', '(Generic impact sounds-4.252-4.307)', '(Surface contact-4.346-4.795)', '(Generic impact sounds-4.85-5.016)', '(Male speech, man speaking-5.024-5.953)', '(Generic impact sounds-5.52-5.732)', '(Breathing-5.858-6.661)', '(Generic impact sounds-6.276-6.488)', '(Surface contact-6.48-6.874)', '(Child speech, kid speaking-6.614-6.921)', '(Generic impact sounds-6.898-7.15)', '(Tick-7.291-7.362)', '(Breathing-7.323-8.024)', '(Generic impact sounds-8.031-8.244)', '(Surface contact-8.346-9.488)', '(Child speech, kid speaking-8.37-9.913)', '(Tick-8.394-8.441)', '(Tick-9.465-9.52)', '(Generic impact sounds-9.52-10.0)']"
  },
  "YRnfU1fEkuRo.wav": {
    "caption": "A man speaks amidst a crowd of people talking in the background, while rain falls on a surface at a conference center.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Conversation-0.529-10.0)', '(Male speech, man speaking-0.612-1.595)', '(Male speech, man speaking-1.925-2.564)', '(Male speech, man speaking-2.88-4.069)', '(Male speech, man speaking-4.468-5.595)', '(Hubbub, speech noise, speech babble-5.615-10.0)', '(Male speech, man speaking-6.529-10.0)']"
  },
  "YK5i6x86jrN4.wav": {
    "caption": "A person is typing on a computer keyboard in a music studio, with a high probability of computer keyboard and typing events.",
    "timestamp_events": "['(Computer keyboard-0.0-4.52)', '(Computer keyboard-4.906-5.976)', '(Computer keyboard-6.236-10.0)']"
  },
  "Y6iGjb4bKsOg.wav": {
    "caption": "A woman sings accompanied by music, creating a harmonious melody in a chemistry lab.",
    "timestamp_events": "['(Female singing-0.0-1.758)', '(Music-0.0-10.0)', '(Female singing-2.446-6.244)', '(Breathing-7.102-7.424)', '(Female singing-7.549-10.0)']"
  },
  "YdvUgkJSZBk8.wav": {
    "caption": "A man speaks followed by a loud burst, then a woman speaks, all happening in a snake-infested environment.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.409)', '(Background noise-0.0-3.447)', '(Female speech, woman speaking-1.548-3.364)', '(Snake-3.493-6.252)', '(Human sounds-5.763-5.972)', '(Background noise-6.251-10.0)', '(Female speech, woman speaking-6.403-8.976)', '(Female speech, woman speaking-9.209-10.0)']"
  },
  "YKByZQ5IIvYo.wav": {
    "caption": "A motorcycle engine revs as a cow moos in the background on a livestock farm.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Moo-0.135-3.247)', '(Male speech, man speaking-0.148-1.771)', '(Generic impact sounds-1.87-2.042)', '(Generic impact sounds-2.497-3.395)', '(Male speech, man speaking-2.509-3.223)', '(Generic impact sounds-3.801-5.806)', '(Moo-3.838-5.006)', '(Male speech, man speaking-6.052-6.544)', '(Generic impact sounds-6.335-7.048)', '(Moo-7.023-10.0)', '(Generic impact sounds-7.245-8.032)', '(Generic impact sounds-8.204-9.213)', '(Generic impact sounds-9.446-9.791)']"
  },
  "Y-uJmhiCHPXU.wav": {
    "caption": "A man gives a speech with occasional gasps as footsteps can be heard in the background at a racecourse.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Breathing-0.362-1.25)', '(Male speech, man speaking-1.415-2.442)', '(Breathing-2.504-3.523)', '(Male speech, man speaking-3.599-4.37)', '(Male speech, man speaking-4.659-6.519)', '(Breathing-6.581-7.201)', '(Male speech, man speaking-7.428-9.239)', '(Male speech, man speaking-9.597-10.0)']"
  },
  "YmKE6pYSCt-w.wav": {
    "caption": "Cutlery and dishes clatter together as pots and pans clang in a bustling kitchen of a bakery/shop.",
    "timestamp_events": "['(Cutlery, silverware-2.197-2.512)', '(Dishes, pots, and pans-0.866-1.291)', '(Chopping (food)-9.819-9.961)', '(Tap-1.685-1.898)', '(Mechanisms-0.0-10.0)', '(Surface contact-5.079-5.496)']"
  },
  "YrYIwPq14ewU.wav": {
    "caption": "A man speaks followed by a baby crying and a woman speaking, as a dog barks in the background outside a house.",
    "timestamp_events": "['(Mechanisms-0.102-10.0)', '(Walk, footsteps-0.299-0.502)', '(Bird vocalization, bird call, bird song-0.312-2.098)', '(Male speech, man speaking-0.346-1.018)', '(Walk, footsteps-0.659-0.862)', '(Walk, footsteps-1.046-1.249)', '(Tick-1.324-1.399)', '(Tick-1.528-1.629)', '(Walk, footsteps-1.636-1.942)', '(Tick-1.982-2.077)', '(Walk, footsteps-2.125-2.512)', '(Dog-2.641-3.089)', '(Walk, footsteps-2.953-3.164)', '(Dog-3.252-4.277)', '(Bird vocalization, bird call, bird song-3.428-3.734)', '(Walk, footsteps-3.523-3.768)', '(Walk, footsteps-4.148-4.257)', '(Female speech, woman speaking-4.175-5.18)', '(Walk, footsteps-4.61-4.759)', '(Male speech, man speaking-5.2-5.906)', '(Child speech, kid speaking-5.2-5.92)', '(Dog-5.798-7.841)', '(Female speech, woman speaking-6.619-7.081)', '(Laughter-7.481-7.95)', '(Tick-7.828-7.909)', '(Tick-8.025-8.147)', '(Dog-8.282-9.158)', '(Dog-9.443-10.0)']"
  },
  "YI3z4A5M-XEQ.wav": {
    "caption": "The sound of metal clanking and a man speaking can be heard as gears and mechanisms are being operated in a workshop.",
    "timestamp_events": "['(Ratchet, pawl-0.406-5.58)', '(Male speech, man speaking-6.775-7.477)', '(Mechanisms-0.0-9.793)']"
  },
  "YRu0GM7Dill4.wav": {
    "caption": "A cow moos amidst the sounds of livestock and farm animals, suggesting it is in a working animal environment.",
    "timestamp_events": "['(Child speech, kid speaking-0.0-0.271)', '(Male speech, man speaking-0.0-0.656)', '(Conversation-0.0-10.0)', '(Wind-0.0-10.0)', '(Cowbell-0.638-1.294)', '(Female speech, woman speaking-0.691-1.399)', '(Child speech, kid speaking-0.795-1.425)', '(Tick-1.32-1.39)', '(Male speech, man speaking-1.39-5.009)', '(Child speech, kid speaking-2.823-4.091)', '(Moo-5.219-6.862)', '(Male speech, man speaking-5.245-5.979)', '(Generic impact sounds-5.315-5.49)', '(Child speech, kid speaking-6.862-7.911)', '(Male speech, man speaking-7.858-8.876)', '(Male speech, man speaking-9.1-10.0)', '(Moo-9.292-10.0)']"
  },
  "YYoGfsvQOEWc.wav": {
    "caption": "An emergency vehicle siren blares as a vehicle swiftly passes by on the road, indicating a possible police car chase.",
    "timestamp_events": "['(Police car (siren)-0.02-3.105)', '(Traffic noise, roadway noise-0.02-8.247)', '(Car passing by-0.931-4.576)', '(Tick-1.829-1.888)', '(Tick-2.903-2.975)']"
  },
  "G8i2JKIaEMk.wav": {
    "caption": "A man speaks while crinkling plastic inside a small room, creating a crackling sound.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.496)', '(Mechanisms-0.0-10.0)', '(Surface contact-0.331-0.504)', '(Generic impact sounds-1.457-1.543)', '(Thump, thud-1.984-2.181)', '(Tap-2.236-2.48)', '(Generic impact sounds-2.559-2.693)', '(Tap-2.811-2.945)', '(Crumpling, crinkling-3.024-3.591)', '(Male speech, man speaking-3.441-4.827)', '(Crumpling, crinkling-4.118-8.488)', '(Breathing-4.504-5.819)', '(Generic impact sounds-4.984-5.157)', '(Wind noise (microphone)-5.0-5.37)', '(Wind noise (microphone)-7.882-8.268)', '(Wind noise (microphone)-8.583-10.0)', '(Crumpling, crinkling-8.709-10.0)']"
  },
  "YqlmqzWaV9Co.wav": {
    "caption": "A man speaks while tapping objects, with the sound of a door closing and a sliding door opening in a workshop.",
    "timestamp_events": "['(Tools-0.0-2.455)', '(Background noise-0.0-8.268)', '(Male speech, man speaking-0.505-2.729)', '(Tools-2.759-3.715)', '(Tools-4.019-4.707)', '(Tools-5.199-5.351)', '(Tools-5.628-5.985)', '(Tools-6.119-6.316)', '(Male speech, man speaking-6.479-8.257)', '(Male speech, man speaking-9.702-10.0)']"
  },
  "YGkgw3EkMsHI.wav": {
    "caption": "A woman's voice is interrupted by a pop sound, followed by another woman speaking. The audio event is a cap gun.",
    "timestamp_events": "['(Child speech, kid speaking-0.0-0.936)', '(Surface contact-0.674-1.015)', '(Child speech, kid speaking-1.117-2.737)', '(Generic impact sounds-2.738-3.339)', '(Child speech, kid speaking-3.24-5.0)', '(Generic impact sounds-4.151-4.687)', '(Generic impact sounds-4.86-5.112)', '(Generic impact sounds-5.628-6.355)', '(Generic impact sounds-6.578-6.885)', '(Child speech, kid speaking-6.606-8.966)', '(Generic impact sounds-7.626-7.751)', '(Generic impact sounds-7.877-8.031)', '(Generic impact sounds-9.008-9.162)', '(Generic impact sounds-9.344-9.511)', '(Child speech, kid speaking-9.385-10.0)']"
  },
  "YIJf8N4RnbuI.wav": {
    "caption": "A man passionately delivers a speech while a crowd cheers and music plays in the background at a concert.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.395)', '(Crowd-0.0-10.0)', '(Male speech, man speaking-0.655-5.074)', '(Shout-2.077-3.377)', '(Human voice-2.215-2.719)', '(Human voice-4.124-4.782)', '(Male speech, man speaking-5.294-7.203)', '(Shout-5.294-8.608)', '(Whistling-5.367-5.789)', '(Music-7.105-10.0)', '(Clapping-7.495-9.705)', '(Whistling-8.056-9.916)', '(Male singing-9.64-10.0)']"
  },
  "Y4wXy58UF4Io.wav": {
    "caption": "A child sings with a probability of 0.80, accompanied by singing (0.34) and female singing (0.21), in an unknown environment.",
    "timestamp_events": "['(Clicking-7.11-7.189)', '(Breathing-7.37-7.819)', '(Child singing-7.772-10.0)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-8.906-9.315)']"
  },
  "YoDZKHTLvckA.wav": {
    "caption": "The sound of water running and a small animal scurrying can be heard inside a small room, possibly a bathroom.",
    "timestamp_events": "['(Generic impact sounds-0.0-2.084)', '(Mechanisms-0.0-10.0)', '(Water-0.419-0.757)', '(Water-1.537-1.898)', '(Generic impact sounds-3.108-3.562)', '(Tick-7.753-7.846)', '(Generic impact sounds-9.115-9.325)', '(Water-9.558-10.0)']"
  },
  "YtPEkFCdAhkE.wav": {
    "caption": "A man speaks while a rooster crows on a livestock farm, surrounded by cattle and other working animals.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Male speech, man speaking-0.107-0.787)', '(Female speech, woman speaking-0.464-1.096)', '(Generic impact sounds-0.478-0.622)', '(Cattle, bovinae-1.227-1.619)', '(Moo-1.591-3.701)', '(Surface contact-2.711-2.856)', '(Generic impact sounds-3.447-4.581)', '(Generic impact sounds-4.732-5.076)', '(Walk, footsteps-4.897-5.014)', '(Surface contact-5.289-5.797)', '(Walk, footsteps-6.168-6.272)', '(Walk, footsteps-6.705-7.103)', '(Generic impact sounds-7.268-7.777)', '(Surface contact-7.859-8.546)', '(Generic impact sounds-8.794-9.412)', '(Generic impact sounds-9.557-9.701)', '(Liquid-9.681-10.0)']"
  },
  "YLMbAilXy1Fc.wav": {
    "caption": "The sound of crashing waves and strong wind accompanies a musical performance in a lively discotheque. [Audio-Visual Label: Music; Flap]",
    "timestamp_events": "['(Wind noise (microphone)-0.0-0.338)', '(Crowd-0.0-9.557)', '(Music-0.0-9.557)', '(Wind noise (microphone)-0.503-0.733)', '(Wind noise (microphone)-0.936-1.403)', '(Wind noise (microphone)-1.685-3.991)', '(Wind noise (microphone)-4.299-8.109)', '(Wind noise (microphone)-8.26-9.557)']"
  },
  "Y6bKNHxKJm1o.wav": {
    "caption": "A dog whimpers and whimpers as soft animal sounds fill the air in a domestic environment.",
    "timestamp_events": "['(Thump, thud-0.0-0.551)', '(Female speech, woman speaking-0.0-1.212)', '(Television-0.0-10.0)', '(Background noise-0.0-10.0)', '(Bark-0.636-0.793)', '(Thump, thud-0.704-1.152)', '(Dog-0.868-1.279)', '(Thump, thud-1.268-2.023)', '(Bark-1.496-1.735)', '(Dog-1.69-1.982)', '(Female speech, woman speaking-1.855-3.044)', '(Thump, thud-2.215-2.343)', '(Bark-2.289-3.239)', '(Thump, thud-2.51-2.65)', '(Thump, thud-2.83-2.971)', '(Dog-3.089-3.298)', '(Thump, thud-3.099-3.252)', '(Thump, thud-3.419-3.534)', '(Music-3.483-10.0)', '(Bark-3.515-3.71)', '(Tap-3.713-3.854)', '(Bark-3.889-4.069)', '(Tap-4.008-4.136)', '(Tap-4.302-4.417)', '(Dog-4.39-4.525)', '(Tap-4.584-4.75)', '(Tap-4.942-5.07)', '(Bark-4.996-5.221)', '(Dog-5.213-5.46)', '(Tap-5.365-5.506)', '(Bark-5.497-5.692)', '(Female speech, woman speaking-5.647-10.0)', '(Dog-5.669-5.789)', '(Bark-5.969-6.193)', '(Dog-6.208-6.44)', '(Bark-6.545-6.769)', '(Tap-6.671-6.863)', '(Dog-6.739-7.038)', '(Generic impact sounds-7.029-7.183)', '(Bark-7.21-7.435)', '(Tap-7.439-7.567)', '(Dog-7.472-7.651)', '(Generic impact sounds-7.554-7.798)', '(Bark-7.838-8.033)', '(Dog-8.033-8.175)', '(Tap-8.054-8.182)', '(Bark-8.399-8.609)', '(Tap-8.553-8.656)', '(Tap-8.899-9.052)', '(Tap-9.232-9.424)', '(Tap-9.68-9.846)']"
  },
  "zvGy89JnfXI.wav": {
    "caption": "A gentle melody of music plays with the sound of a doorbell ringing in a cozy indoor setting.",
    "timestamp_events": "['(Music-4.583-10.0)', '(Gears-2.553-3.266)', '(Mechanisms-4.589-10.0)']"
  },
  "nPwJjECLmEA.wav": {
    "caption": "Synthetic singing harmonizes with jingle music playing in the background, creating a festive atmosphere in a playroom.",
    "timestamp_events": "['(Tap-0.0-0.516)', '(Synthetic singing-0.0-5.886)', '(Music-0.0-10.0)', '(Tap-0.788-4.209)', '(Tap-4.359-4.698)', '(Tap-4.827-5.601)', '(Tap-5.737-8.235)', '(Synthetic singing-6.117-8.187)', '(Tap-8.384-10.0)', '(Synthetic singing-8.432-10.0)']"
  },
  "Y52sTvbwi7Mg.wav": {
    "caption": "A power tool drills while music plays in the background, likely in a dental clinic.",
    "timestamp_events": "['(Drill-1.575-4.323)', '(Music-0.0-0.898)', '(Cricket-9.693-9.906)']"
  },
  "YUChcduGcOSc.wav": {
    "caption": "A man speaks followed by the sound of a person snoring, indicating a conversation interrupted by someone falling asleep.",
    "timestamp_events": "['(Mechanisms-0.012-4.853)', '(Generic impact sounds-0.13-0.379)', '(Generic impact sounds-0.435-0.92)', '(Tap-1.007-1.181)', '(Generic impact sounds-1.187-1.454)', '(Male speech, man speaking-1.616-2.318)', '(Generic impact sounds-2.61-2.728)', '(Grunt-3.032-4.723)', '(Generic impact sounds-4.716-4.853)']"
  },
  "SiVfjH0rseg.wav": {
    "caption": "The wind howls as water splashes and gurgles, while an adult male speaks on a boat in the urban outdoors.",
    "timestamp_events": "['(Creak-0.0-0.362)', '(Wind-0.0-10.0)', '(Creak-1.346-1.969)', '(Bird vocalization, bird call, bird song-6.417-6.74)', '(Bird vocalization, bird call, bird song-7.528-7.74)', '(Bird vocalization, bird call, bird song-7.969-8.205)', '(Bird vocalization, bird call, bird song-8.543-8.803)', '(Flap-8.984-9.803)']"
  },
  "YB2fgdFtLHw0.wav": {
    "caption": "A person whispers softly as they chew something, creating a quiet and intimate atmosphere in a room.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Breathing-0.594-1.257)', '(Tick-1.618-1.686)', '(Whispering-1.798-2.303)', '(Tick-1.821-1.881)', '(Tick-3.062-3.138)', '(Breathing-3.198-3.83)', '(Whispering-4.251-4.635)', '(Tick-4.695-4.74)', '(Tick-5.583-5.651)', '(Whispering-5.606-6.509)', '(Tick-6.215-6.29)', '(Tick-6.697-6.787)', '(Whispering-6.749-7.833)', '(Tick-6.9-6.938)', '(Tick-7.178-7.231)', '(Tick-7.54-7.607)', '(Tick-8.014-8.096)', '(Tick-8.284-8.33)', '(Tick-8.668-8.728)', '(Whispering-8.721-9.21)', '(Tick-9.737-9.827)']"
  },
  "suHiaiRqPtY.wav": {
    "caption": "A person snores loudly while occasionally snorting and breathing heavily, creating a peaceful yet noisy ambiance in a bedroom.",
    "timestamp_events": "['(Hiss-0.0-2.709)', '(Background noise-0.0-10.0)', '(Tick-3.062-3.13)', '(Tick-3.281-3.341)', '(Tick-3.552-3.619)', '(Hiss-3.642-6.561)']"
  },
  "YBOkGgGgtuo0.wav": {
    "caption": "A helicopter hums in the distance while wind rustles into the microphone, capturing the audio inside a small room.",
    "timestamp_events": "['(Fire-0.0-10.0)', '(Background noise-0.0-10.0)', '(Generic impact sounds-1.795-1.912)', '(Generic impact sounds-3.116-3.206)', '(Generic impact sounds-4.111-4.215)', '(Generic impact sounds-4.513-4.609)', '(Generic impact sounds-9.762-9.838)']"
  },
  "YQi2sXHT3Cxg.wav": {
    "caption": "Hip hop music plays at a probability of 0.85 as a ping sound is heard in a chemistry lab.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Male singing-5.619-10.0)']"
  },
  "Yq4R18YN6Jzk.wav": {
    "caption": "An emergency siren blares as a woman speaks, indicating the presence of an emergency vehicle; possibly in a city.",
    "timestamp_events": "['(Siren-0.0-3.796)', '(Mechanisms-3.335-9.876)', '(Female speech, woman speaking-3.605-9.867)', '(Tick-4.004-4.091)', '(Tick-4.543-4.63)', '(Bark-4.734-5.707)', '(Generic impact sounds-4.899-5.081)', '(Bark-5.811-6.089)', '(Bark-6.358-6.706)', '(Bark-7.131-9.242)', '(Tick-7.583-7.67)', '(Tick-8.026-8.104)', '(Tick-9.103-9.198)']"
  },
  "YgDcJszpO1qE.wav": {
    "caption": "The sound of a turkey gobbling can be heard amidst the background music, suggesting the audio takes place in a turkey farm.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Male speech, man speaking-0.361-1.094)', '(Male speech, man speaking-1.642-5.402)', '(Crumpling, crinkling-2.165-2.387)', '(Female speech, woman speaking-6.075-7.773)', '(Female speech, woman speaking-8.041-10.0)']"
  },
  "YXufU6CSSYvw.wav": {
    "caption": "The sound of a train passing by on railroad tracks, with train wheels squealing, in a rail transport environment.",
    "timestamp_events": "['(Clickety-clack-0.0-1.144)', '(Train-0.0-10.0)', '(Clickety-clack-2.039-2.498)', '(Clickety-clack-3.062-3.424)', '(Clickety-clack-4.733-7.193)', '(Clickety-clack-8.021-8.307)', '(Clickety-clack-8.804-9.496)']"
  },
  "YnsfVHkH7nuc.wav": {
    "caption": "Someone taps on a hard surface while music plays softly in the background, creating a clapping sound.",
    "timestamp_events": "['(Clapping-0.0-0.719)', '(Background noise-0.0-10.0)', '(Tap-0.87-1.44)', '(Clapping-1.311-1.676)', '(Tap-1.741-2.891)', '(Clapping-2.848-3.719)', '(Tap-3.257-3.536)', '(Tap-3.762-4.3)', '(Clapping-4.214-4.515)', '(Tap-4.687-5.665)', '(Clapping-5.687-6.472)', '(Tap-6.042-6.407)', '(Tap-6.526-7.16)', '(Clapping-7.053-7.461)', '(Tap-7.257-8.622)', '(Clapping-8.45-9.3)', '(Tap-8.956-9.192)', '(Tap-9.397-10.0)']"
  },
  "Y2NvsJSwiV5M.wav": {
    "caption": "A high pitched beep is followed by sonar sounds and faint music, indicating the presence of a submarine in the water.",
    "timestamp_events": "['(Sonar-0.0-1.798)', '(Noise-0.0-10.0)', '(Sonar-2.713-5.92)', '(Sonar-6.719-9.642)']"
  },
  "YlRiiHpas23U.wav": {
    "caption": "Several ducks quack loudly while a fowl honks and a goose makes occasional sounds in a peaceful pond.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Ducks, geese, waterfowl-0.0-10.0)', '(Tick-0.865-0.91)', '(Tick-0.978-1.053)', '(Male speech, man speaking-1.61-2.611)', '(Tick-3.476-3.567)', '(Tick-3.777-3.838)', '(Tick-3.943-4.026)', '(Wind noise (microphone)-4.342-10.0)', '(Male speech, man speaking-4.868-5.305)']"
  },
  "YodMuGQyhwJY.wav": {
    "caption": "A man speaks amidst the sound of music, followed by a siren, indicating an emergency vehicle, in an army base.",
    "timestamp_events": "['(Sound effect-0.0-0.396)', '(Background noise-0.827-1.618)', '(Sound effect-1.281-2.852)', '(Groan-1.56-2.398)', '(Siren-2.34-6.799)', '(Groan-2.561-2.91)', '(Male speech, man speaking-3.364-3.865)', '(Conversation-3.364-10.0)', '(Male speech, man speaking-4.156-6.17)', '(Male speech, man speaking-6.554-7.369)', '(Crowd-7.09-8.405)', '(Male speech, man speaking-7.718-10.0)', '(Explosion-8.056-9.663)', '(Machine gun-9.476-10.0)']"
  },
  "Y74p96VbDZe8.wav": {
    "caption": "Water rushes and gurgles as an adult male speaks in the background, creating the ambiance of a serene waterfall.",
    "timestamp_events": "['(Waterfall-0.207-9.269)', '(Human sounds-6.862-7.708)', '(Clapping-7.633-9.25)']"
  },
  "YOik1vL10TgQ.wav": {
    "caption": "The music intensifies as a woman's voice speaks, followed by a sudden explosion. The audio event suggests a music studio environment.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Rapping-0.022-0.192)', '(Rapping-0.428-1.646)', '(Rapping-1.817-3.247)', '(Sound effect-3.581-4.734)', '(Sound effect-5.333-6.888)', '(Sound effect-8.684-9.22)', '(Rapping-9.039-10.0)']"
  },
  "YDku0OUWU6Mw.wav": {
    "caption": "Keys jangle as a man speaks, possibly inside a vehicle.",
    "timestamp_events": "['(Brief tone-0.0-0.741)', '(Car-0.0-3.26)', '(Background noise-0.0-9.02)', '(Generic impact sounds-0.079-0.285)', '(Brief tone-0.845-2.089)', '(Tick-1.566-1.669)', '(Generic impact sounds-1.846-1.993)', '(Generic impact sounds-2.45-2.737)', '(Generic impact sounds-3.01-3.216)', '(Male speech, man speaking-3.268-3.68)', '(Generic impact sounds-3.628-3.805)', '(Surface contact-3.908-4.468)', '(Generic impact sounds-4.475-4.748)', '(Keys jangling-4.799-5.013)', '(Surface contact-5.124-5.44)', '(Male speech, man speaking-5.565-6.059)', '(Generic impact sounds-5.941-6.103)', '(Keys jangling-6.736-6.928)', '(Breathing-6.854-7.333)', '(Keys jangling-7.075-7.281)', '(Male speech, man speaking-7.34-7.782)', '(Keys jangling-7.569-8.357)', '(Breathing-7.856-8.357)']"
  },
  "YfvMI4eT3PYU.wav": {
    "caption": "A man burps loudly multiple times while speaking in a kitchen, with a faint light shining on him.",
    "timestamp_events": "['(Laughter-0.529-3.896)', '(Female speech, woman speaking-7.89-8.784)', '(Burping, eructation-8.86-10.0)', '(Male speech, man speaking-6.488-7.562)', '(Background noise-0.0-10.0)']"
  },
  "Y5QnkRhiSzPg.wav": {
    "caption": "A child sings while music plays and a piano softly accompanies in a church.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Child singing-4.031-6.276)', '(Child singing-6.598-9.26)']"
  },
  "ZMFF8qfgwW0.wav": {
    "caption": "A man speaks followed by a loud bang in a small room, where something is breaking and shattering.",
    "timestamp_events": "['(Surface contact-0.0-0.225)', '(Mechanisms-0.0-10.0)', '(Conversation-0.607-9.819)', '(Male speech, man speaking-0.615-1.386)', '(Female speech, woman speaking-2.54-4.311)', '(Generic impact sounds-4.384-6.277)', '(Squeak-6.439-7.016)', '(Generic impact sounds-6.594-6.732)', '(Generic impact sounds-7.008-7.3)', '(Male speech, man speaking-7.463-7.999)', '(Generic impact sounds-7.755-8.194)', '(Generic impact sounds-8.446-8.803)', '(Male speech, man speaking-9.063-9.835)', '(Generic impact sounds-9.689-10.0)']"
  },
  "YiYA3E1zztyY.wav": {
    "caption": "A woman whispers and speaks in a small room, creating a mix of soft and audible sounds.",
    "timestamp_events": "['(Whispering-0.0-3.288)', '(Mechanisms-0.0-10.0)', '(Whispering-4.742-5.326)', '(Whispering-6.36-7.85)', '(Breathing-8.457-8.831)', '(Whispering-9.071-9.715)']"
  },
  "YWlsdGtkWca8.wav": {
    "caption": "Ducks quack loudly while a honking sound of geese can be heard, suggesting a lively scene near a water body.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Honk-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Walk, footsteps-0.276-0.425)', '(Walk, footsteps-0.89-1.386)', '(Walk, footsteps-1.969-2.528)', '(Breathing-2.496-2.969)', '(Walk, footsteps-3.291-3.441)', '(Breathing-3.535-4.614)', '(Walk, footsteps-3.787-3.945)', '(Walk, footsteps-4.197-4.622)', '(Walk, footsteps-4.85-4.969)', '(Walk, footsteps-5.394-5.654)', '(Walk, footsteps-5.969-6.291)', '(Walk, footsteps-6.827-7.008)', '(Walk, footsteps-7.362-7.551)', '(Generic impact sounds-7.669-7.976)', '(Walk, footsteps-8.087-8.37)', '(Female speech, woman speaking-8.787-9.953)']"
  },
  "YIWArki3J1aQ.wav": {
    "caption": "A small engine of a lawn mower is running, while a vehicle passes by in the background.",
    "timestamp_events": "['(Lawn mower-0.0-10.0)', '(Medium engine (mid frequency)-0.0-10.0)']"
  },
  "s1eMgmzCMDM.wav": {
    "caption": "Rock music blares as an explosion rocks the stage, accompanied by a pulsating beat, creating a punk rock atmosphere.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Distortion-0.0-10.0)']"
  },
  "YbrFfXSyCtmU.wav": {
    "caption": "The sound of chewing and mastication can be heard in a small room, possibly from an animal.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Chewing, mastication-0.567-1.024)', '(Chewing, mastication-1.402-1.622)', '(Generic impact sounds-1.858-2.094)', '(Chewing, mastication-2.197-2.677)', '(Surface contact-2.638-4.142)', '(Generic impact sounds-3.646-3.764)', '(Chewing, mastication-4.165-4.409)', '(Surface contact-4.504-4.921)', '(Chewing, mastication-5.299-5.701)', '(Chewing, mastication-5.85-6.047)', '(Chewing, mastication-6.173-6.465)', '(Chewing, mastication-7.417-7.906)', '(Chewing, mastication-8.094-8.583)', '(Surface contact-9.244-9.866)']"
  },
  "YEpIiqRWXj1I.wav": {
    "caption": "A man delivers a speech in a large hall, while in the background, scissors can be heard cutting hair.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.186)', '(Mechanisms-0.0-10.0)', '(Female speech, woman speaking-0.752-1.365)', '(Male speech, man speaking-1.394-2.036)', '(Female speech, woman speaking-2.267-2.689)', '(Male speech, man speaking-2.788-4.309)', '(Male speech, man speaking-4.465-5.547)', '(Generic impact sounds-5.72-5.992)', '(Male speech, man speaking-6.056-6.865)', '(Male speech, man speaking-7.068-8.132)', '(Male speech, man speaking-8.276-9.017)', '(Male speech, man speaking-9.468-10.0)']"
  },
  "YKogHZtTSoKM.wav": {
    "caption": "A loud clang echoes through the server room as a man yells and a cat meows in the background.",
    "timestamp_events": "['(Video game sound-0.0-10.0)', '(Breaking-0.047-0.717)', '(Human voice-0.126-0.48)', '(Run-0.402-3.063)', '(Whack, thwack-0.961-1.433)', '(Sound effect-2.22-2.89)', '(Human voice-2.22-2.937)', '(Male speech, man speaking-3.039-3.543)', '(Music-3.551-8.598)', '(Sound effect-3.567-3.929)', '(Shout-6.323-7.276)', '(Human voice-7.063-8.976)', '(Ding-9.031-10.0)']"
  },
  "YBCdFli3EP1A.wav": {
    "caption": "The sound of a guitar being played accompanies a musical tune in a room with an electronic tuner.",
    "timestamp_events": "['(Music-0.0-10.0)']"
  },
  "Yh3fJME32tgc.wav": {
    "caption": "An electric shaver buzzes as music plays in the background inside a car interior.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Mechanisms-0.0-10.0)']"
  },
  "YRMfA-0f-aDk.wav": {
    "caption": "An alarm clock beeps twice, followed by a radio playing softly in the background in a bedroom.",
    "timestamp_events": "['(Sound effect-0.0-5.76)', '(Background noise-0.0-6.993)', '(Beep, bleep-2.287-2.438)', '(Beep, bleep-2.608-2.916)', '(Beep, bleep-3.124-3.426)', '(Beep, bleep-3.646-3.967)', '(Beep, bleep-4.143-4.457)', '(Beep, bleep-4.652-4.992)', '(Beep, bleep-5.181-5.514)', '(Beep, bleep-5.684-5.728)', '(Human sounds-6.194-7.024)']"
  },
  "Y1aJK75652Ns.wav": {
    "caption": "Sheep bleat and a man laughs amidst the sound of rustling and crunching, creating a lively atmosphere in a countryside with goats, music, and nature.",
    "timestamp_events": "['(Goat-0.23-0.845)', '(Goat-0.948-1.319)', '(Goat-1.652-2.01)', '(Background noise-2.151-5.378)', '(Bleat-2.177-2.663)', '(Bleat-2.907-3.406)', '(Chirp, tweet-3.444-3.752)', '(Bleat-3.675-4.558)', '(Sound effect-4.648-4.942)', '(Generic impact sounds-4.955-5.16)', '(Generic impact sounds-5.519-5.839)', '(Goat-5.915-6.095)', '(Music-6.172-10.0)', '(Generic impact sounds-7.324-9.501)', '(Sound effect-9.744-10.0)']"
  },
  "Y257RdPg5dXE.wav": {
    "caption": "A speech synthesizer utters words while a man speaks, creating an audio event labeled \"Speech; Speech synthesizer\" in a home theater environment.",
    "timestamp_events": "['(Male speech, man speaking-0.093-3.06)', '(Male speech, man speaking-3.6-6.248)', '(Male speech, man speaking-6.477-7.562)', '(Male speech, man speaking-7.763-8.537)', '(Male speech, man speaking-8.724-9.948)']"
  },
  "YxJxDpMtIWu8.wav": {
    "caption": "An electronic alarm beeps followed by a woman speaking in a small room, possibly an office or home.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.877-1.129)', '(Generic impact sounds-1.3-1.495)', '(Beep, bleep-1.657-2.104)', '(Beep, bleep-2.299-2.697)', '(Female speech, woman speaking-2.64-3.696)', '(Generic impact sounds-3.859-4.062)', '(Generic impact sounds-4.322-4.574)', '(Beep, bleep-5.102-5.524)', '(Beep, bleep-5.727-6.166)', '(Female speech, woman speaking-6.076-7.141)', '(Generic impact sounds-7.864-8.115)']"
  },
  "Y80nPyF9Fmq8.wav": {
    "caption": "A woman's voice can be heard speaking and laughing in a small room, with a probability of 0.88.",
    "timestamp_events": "['(Chuckle, chortle-0.0-0.355)', '(Mechanisms-0.0-10.0)', '(Breathing-0.387-0.777)', '(Female speech, woman speaking-0.907-1.484)', '(Conversation-0.907-9.802)', '(Female speech, woman speaking-1.646-1.939)', '(Generic impact sounds-1.988-2.142)', '(Generic impact sounds-2.28-2.605)', '(Tick-2.767-2.857)', '(Generic impact sounds-3.011-3.182)', '(Slam-3.214-3.409)', '(Female speech, woman speaking-3.255-3.767)', '(Generic impact sounds-3.32-3.45)', '(Tick-3.507-3.612)', '(Surface contact-3.628-3.994)', '(Female speech, woman speaking-3.929-4.611)', '(Surface contact-4.148-4.376)', '(Generic impact sounds-4.425-4.587)', '(Generic impact sounds-4.733-5.123)', '(Female speech, woman speaking-5.001-5.391)', '(Generic impact sounds-5.326-5.489)', '(Female speech, woman speaking-5.659-5.846)', '(Generic impact sounds-5.781-5.944)', '(Chuckle, chortle-6.293-7.048)', '(Generic impact sounds-6.886-7.3)', '(Microwave oven-7.252-10.0)', '(Generic impact sounds-7.479-7.641)', '(Tick-7.853-7.95)', '(Generic impact sounds-7.991-8.186)', '(Female speech, woman speaking-8.056-9.786)', '(Surface contact-8.608-9.136)', '(Generic impact sounds-9.161-9.38)', '(Generic impact sounds-9.583-9.721)']"
  },
  "Ys0ibfQ2p-kg.wav": {
    "caption": "People talking and laughing, followed by a popping sound, as fireworks explode in an urban environment.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Generic impact sounds-0.093-0.239)', '(Male speech, man speaking-0.107-0.508)', '(Conversation-0.114-9.492)', '(Generic impact sounds-0.501-0.626)', '(Male speech, man speaking-0.709-1.601)', '(Generic impact sounds-0.84-1.069)', '(Generic impact sounds-1.214-1.359)', '(Generic impact sounds-1.484-1.712)', '(Giggle-1.871-2.369)', '(Generic impact sounds-2.203-2.41)', '(Crackle-2.763-7.376)', '(Male speech, man speaking-4.139-4.402)', '(Female speech, woman speaking-4.9-5.259)', '(Female speech, woman speaking-5.591-6.338)', '(Male speech, man speaking-6.601-8.012)', '(Firecracker-7.369-9.132)', '(Female speech, woman speaking-8.828-9.471)', '(Generic impact sounds-9.388-9.526)', '(Human voice-9.547-10.0)']"
  },
  "XmBiDpC7uXE.wav": {
    "caption": "A man speaks followed by a door opening, revealing the audio event of Speech and Door.",
    "timestamp_events": "['(Male speech, man speaking-0.192-1.784)', '(Male speech, man speaking-1.923-3.271)', '(Printer-3.531-7.999)', '(Printer-8.405-9.453)']"
  },
  "YagvN8wDqelE.wav": {
    "caption": "The engine of a truck roars loudly as it accelerates on a raceway, creating a powerful and energetic sound.",
    "timestamp_events": "['(Truck-0.0-10.0)', '(Accelerating, revving, vroom-0.095-0.42)', '(Accelerating, revving, vroom-0.875-1.362)', '(Accelerating, revving, vroom-3.888-4.449)', '(Accelerating, revving, vroom-4.944-5.156)', '(Accelerating, revving, vroom-5.448-6.147)', '(Accelerating, revving, vroom-6.813-9.542)']"
  },
  "YHecoi0BUr-M.wav": {
    "caption": "A man speaks while a baby cries in the background, creating a noisy environment in a home setting.",
    "timestamp_events": "['(Background noise-0.0-9.351)', '(Male speech, man speaking-0.0-1.31)', '(Conversation-0.0-9.222)', '(Brief tone-0.504-0.75)', '(Brief tone-0.952-1.456)', '(Female speech, woman speaking-1.377-1.904)', '(Brief tone-1.887-3.858)', '(Shout-2.105-3.074)', '(Shout-3.595-4.295)', '(Brief tone-4.071-4.502)', '(Brief tone-4.603-4.771)', '(Male speech, man speaking-6.019-6.781)', '(Male speech, man speaking-7.346-8.371)', '(Male speech, man speaking-8.645-9.189)']"
  },
  "YvnnzihrCIB8.wav": {
    "caption": "The sound of a chainsaw fills the air as an engine roars nearby, indicating a sawing event in a wooded area.",
    "timestamp_events": "['(Chainsaw-0.063-10.0)', '(Tick-1.913-2.016)']"
  },
  "Y45cIGexaE3Q.wav": {
    "caption": "A man speaks as water splashes in the background on a sailboat, sailing on the open ocean.",
    "timestamp_events": "['(Male speech, man speaking-0.0-2.597)', '(Wind-0.0-10.0)', '(Water-0.0-10.0)', '(Sailboat, sailing ship-0.0-10.0)', '(Generic impact sounds-1.273-2.109)', '(Male speech, man speaking-3.767-6.52)', '(Wind noise (microphone)-7.666-7.934)', '(Male speech, man speaking-8.031-8.698)', '(Tick-8.113-8.251)', '(Wind noise (microphone)-8.161-9.169)', '(Male speech, man speaking-8.868-9.258)']"
  },
  "YQbr3kXycaw4.wav": {
    "caption": "A man screams followed by a person sneezing, with the sound of scraping in the background on a stage.",
    "timestamp_events": "['(Human sounds-0.0-6.634)', '(Grunt-6.667-7.479)', '(Human sounds-7.503-10.0)', '(Breathing-8.243-8.641)']"
  },
  "Ywkllgj06rcs.wav": {
    "caption": "A bird chirps in the distance followed by a bird chirping, indicating the presence of an owl in a natural environment.",
    "timestamp_events": "['(Owl-0.0-0.655)', '(Mechanisms-0.0-10.0)', '(Surface contact-0.818-1.289)', '(Generic impact sounds-1.598-2.532)', '(Surface contact-1.695-2.67)', '(Owl-2.784-3.84)', '(Generic impact sounds-3.182-3.304)', '(Generic impact sounds-3.962-4.831)', '(Surface contact-4.327-4.636)', '(Generic impact sounds-4.993-5.123)', '(Surface contact-5.172-5.481)', '(Generic impact sounds-5.448-5.562)', '(Surface contact-5.659-6.147)', '(Generic impact sounds-5.846-6.033)', '(Generic impact sounds-6.301-6.537)', '(Generic impact sounds-6.813-7.081)', '(Generic impact sounds-7.885-8.226)', '(Generic impact sounds-8.413-8.551)', '(Owl-8.446-8.957)', '(Generic impact sounds-9.031-9.51)', '(Surface contact-9.559-9.973)']"
  },
  "Y6aoZHNKEx-g.wav": {
    "caption": "A power tool motor is running and vibrating, with whirring sounds, while an adult male speaks in the background in a workshop.",
    "timestamp_events": "['(Motorcycle-0.007-9.48)']"
  },
  "YB4mZgEcE5SY.wav": {
    "caption": "A dog whimpers while a squeaky toy is being played with in a pet store.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Growling-0.433-0.921)', '(Generic impact sounds-0.961-1.016)', '(Generic impact sounds-1.142-1.213)', '(Squeak-1.417-2.756)', '(Growling-2.386-2.811)', '(Squeak-3.016-3.291)', '(Squeak-3.646-3.819)', '(Growling-3.835-4.315)', '(Squeak-4.654-4.913)', '(Cough-5.126-5.622)', '(Squeak-5.449-5.709)', '(Generic impact sounds-6.307-6.402)', '(Squeak-6.567-6.795)', '(Squeak-7.732-7.921)', '(Dog-8.016-8.732)', '(Generic impact sounds-9.205-9.315)', '(Growling-9.409-9.937)']"
  },
  "YEpySn-CXUxI.wav": {
    "caption": "The sound of rustling leaves and light rustling suggests that someone is inside a small room, possibly a study or library.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Scrape-1.134-1.688)', '(Tick-2.4-2.462)', '(Tick-3.002-3.085)', '(Generic impact sounds-3.769-3.866)', '(Tick-4.219-4.322)', '(Generic impact sounds-5.491-5.595)', '(Scrape-5.678-5.858)', '(Tap-5.844-6.01)', '(Scrape-6.127-6.812)', '(Tick-6.895-7.006)', '(Tick-7.538-7.621)', '(Generic impact sounds-9.737-9.841)']"
  },
  "YMy-px7AwGVQ.wav": {
    "caption": "A bell rings while people speak in the background, creating a lively atmosphere in a bustling city square.",
    "timestamp_events": "['(Human voice-0.0-0.181)', '(Hubbub, speech noise, speech babble-0.0-10.0)', '(Bell-0.78-3.47)', '(Tick-1.88-1.949)', '(Male speech, man speaking-1.937-2.252)', '(Male speech, man speaking-4.008-4.339)', '(Bell-4.054-7.402)', '(Generic impact sounds-5.913-5.969)', '(Tick-7.01-7.062)', '(Human sounds-8.142-8.315)', '(Bell-8.282-9.352)', '(Laughter-8.945-9.606)', '(Generic impact sounds-9.039-9.11)', '(Generic impact sounds-9.283-9.362)', '(Generic impact sounds-9.661-9.732)', '(Generic impact sounds-9.898-9.976)']"
  },
  "YD6I3-i7qMJs.wav": {
    "caption": "Wood being moved around as a sewing machine hums intermittently and a printer occasionally prints in a workshop.",
    "timestamp_events": "['(Generic impact sounds-0.0-1.622)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-1.874-2.377)', '(Generic impact sounds-2.491-3.628)', '(Generic impact sounds-3.832-5.521)', '(Surface contact-5.058-5.326)', '(Generic impact sounds-5.724-7.658)', '(Surface contact-7.138-7.536)', '(Generic impact sounds-7.869-8.551)', '(Generic impact sounds-8.698-9.282)', '(Generic impact sounds-9.396-9.542)']"
  },
  "YXub2jjq-eRI.wav": {
    "caption": "A DJ scratches a record with intense music playing, creating a lively atmosphere at an indoor stage.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Hubbub, speech noise, speech babble-0.0-10.0)', '(Shout-7.146-9.737)']"
  },
  "YxAZQSkkualE.wav": {
    "caption": "The wind blows as a man speaks while a bicycle and a vehicle pass by in the audio.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Whispering-0.128-0.768)', '(Male speech, man speaking-1.036-1.269)', '(Generic impact sounds-1.385-1.921)', '(Bicycle, tricycle-3.481-4.342)', '(Wind noise (microphone)-4.035-4.165)', '(Male speech, man speaking-4.785-4.971)', '(Generic impact sounds-4.878-4.994)', '(Wind noise (microphone)-4.936-6.797)', '(Bicycle, tricycle-5.891-6.997)', '(Wind noise (microphone)-7.243-8.933)', '(Bicycle, tricycle-7.674-9.624)', '(Generic impact sounds-7.812-8.836)', '(Tick-9.185-9.302)', '(Male speech, man speaking-9.767-10.0)']"
  },
  "Y68Uacs6JPCk.wav": {
    "caption": "The sound of an idling engine can be heard, suggesting that the audio occurs in a vehicle.",
    "timestamp_events": "['(Engine knocking-0.0-10.0)', '(Medium engine (mid frequency)-0.0-10.0)']"
  },
  "KhuI97I3F0I.wav": {
    "caption": "A person plays a distorted electric guitar with a chorus effect, accompanied by music, in a coffee shop.",
    "timestamp_events": "['(Music-0.0-10.0)']"
  },
  "Y4333Ev3O07c.wav": {
    "caption": "A train horn blares as a train approaches, indicating the presence of a train on a railroad track.",
    "timestamp_events": "['(Train-0.0-10.0)', '(Train horn-0.307-2.157)', '(Train horn-2.748-5.11)', '(Train horn-5.677-6.496)', '(Train horn-6.701-10.0)']"
  },
  "Y3RtoY0e91l0.wav": {
    "caption": "A large motor vehicle engine is running in the background as an adult male speaks, indicating a bus or vehicle event.",
    "timestamp_events": "['(Heavy engine (low frequency)-0.0-9.2)']"
  },
  "YPwioLuN-KIo.wav": {
    "caption": "The sound of sizzling and stirring can be heard as food is being fried in a restaurant kitchen.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.008)', '(Mechanisms-0.0-10.0)', '(Sizzle-1.433-10.0)', '(Generic impact sounds-2.299-2.866)', '(Music-2.315-10.0)', '(Male speech, man speaking-3.181-4.638)', '(Tap-3.425-3.661)', '(Cutlery, silverware-4.15-4.654)', '(Cutlery, silverware-4.835-5.323)', '(Male speech, man speaking-5.189-6.567)', '(Cutlery, silverware-5.543-5.843)', '(Cutlery, silverware-6.709-6.898)', '(Male speech, man speaking-7.386-7.976)', '(Male speech, man speaking-8.268-10.0)']"
  },
  "YYgSs2cZQznI.wav": {
    "caption": "A man speaks in a small room followed by a pig oinking, suggesting a conversation or interaction in an indoor setting.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.995)', '(Male speech, man speaking-2.156-3.142)', '(Human voice-3.211-3.555)', '(Human voice-3.635-7.317)', '(Generic impact sounds-3.922-4.117)', '(Generic impact sounds-4.679-4.828)', '(Generic impact sounds-4.977-5.149)', '(Generic impact sounds-5.333-5.528)', '(Generic impact sounds-6.388-6.571)', '(Human voice-7.511-8.05)', '(Male speech, man speaking-8.44-9.667)', '(Human voice-9.656-10.0)']"
  },
  "YA5eIOPX4Dno.wav": {
    "caption": "A power tool drills while wind blows and a high pitched hissing sound fills the air, resembling a jet engine.",
    "timestamp_events": "['(Wind noise (microphone)-0.0-0.835)', '(Wind-0.0-10.0)', '(Tick-0.23-0.354)', '(Tick-0.505-0.588)', '(Tick-0.787-0.876)', '(Wind noise (microphone)-0.973-1.962)', '(Spray-1.014-2.251)', '(Wind noise (microphone)-2.175-4.938)', '(Tick-2.423-2.546)', '(Tick-2.746-2.835)', '(Tick-3.034-3.138)', '(Tick-3.268-3.412)', '(Spray-3.474-4.32)', '(Tick-4.416-4.478)', '(Spray-4.588-10.0)']"
  },
  "YiOAClY1MUpU.wav": {
    "caption": "A speaker addresses the crowd while music plays faintly in the background, creating an energetic atmosphere in the stadium. (Speech: 0.70, Crowd: 0.26, Music: 0.23, Audio-Visual Label: Bellow; Speech)",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Whistling-3.661-4.384)', '(Shout-4.514-5.188)', '(Shout-6.602-8.698)']"
  },
  "YAGCsK1lTkfM.wav": {
    "caption": "A cat meows while a dog howls, and a man laughs in the background, creating a lively atmosphere in a domestic setting.",
    "timestamp_events": "['(Caterwaul-0.0-3.872)', '(Wind-0.0-10.0)', '(Generic impact sounds-0.168-0.282)', '(Bird vocalization, bird call, bird song-0.282-0.558)', '(Generic impact sounds-1.029-1.167)', '(Bird vocalization, bird call, bird song-1.191-1.46)', '(Generic impact sounds-1.719-2.207)', '(Laughter-2.312-3.385)', '(Bird vocalization, bird call, bird song-3.336-3.596)', '(Laughter-3.905-5.399)', '(Bird vocalization, bird call, bird song-3.994-4.278)', '(Generic impact sounds-4.441-4.676)', '(Bird vocalization, bird call, bird song-5.383-5.716)', '(Caterwaul-5.464-10.0)', '(Tick-6.147-6.293)', '(Laughter-6.301-7.073)', '(Breathing-7.008-7.373)', '(Cough-7.252-7.918)', '(Breathing-7.991-8.405)', '(Bird vocalization, bird call, bird song-8.503-8.738)', '(Cough-9.096-9.575)', '(Generic impact sounds-9.542-9.705)']"
  },
  "yM7JF2Y0Az0.wav": {
    "caption": "A drum machine plays a rhythmic beat accompanied by music in a music studio.",
    "timestamp_events": "['(Music-0.0-10.0)']"
  },
  "Yhr-tBZ9v1bg.wav": {
    "caption": "Emergency vehicle sirens blare as a fire engine and ambulance rush through the bustling city streets.",
    "timestamp_events": "['(Fire engine, fire truck (siren)-0.0-10.0)', '(Wind-0.0-10.0)']"
  },
  "YYNLXnExjv7w.wav": {
    "caption": "Birds chirp and a frog croaks as a crow caws in the background, creating a lively atmosphere in a natural environment.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Mechanisms-0.148-10.0)', '(Animal-0.29-1.186)', '(Bird vocalization, bird call, bird song-0.705-1.433)', '(Animal-1.536-2.519)', '(Bird vocalization, bird call, bird song-1.784-2.052)', '(Animal-2.65-7.179)', '(Bird vocalization, bird call, bird song-3.323-4.21)', '(Bird vocalization, bird call, bird song-4.384-4.538)', '(Bird vocalization, bird call, bird song-4.746-4.979)', '(Bird vocalization, bird call, bird song-5.651-5.911)', '(Bird vocalization, bird call, bird song-6.148-6.361)', '(Bird vocalization, bird call, bird song-6.828-7.66)', '(Animal-7.512-8.088)', '(Human voice-7.901-8.576)', '(Bird vocalization, bird call, bird song-8.581-10.0)', '(Animal-8.87-10.0)']"
  },
  "YKYNILGRNiYY.wav": {
    "caption": "A sizzling sound is heard while food is being fried, accompanied by a man speaking in the background.",
    "timestamp_events": "['(Noise-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Male speech, man speaking-0.551-0.87)', '(Conversation-0.57-9.681)', '(Male speech, man speaking-1.073-2.937)', '(Generic impact sounds-1.952-2.126)', '(Generic impact sounds-3.015-3.246)', '(Tick-3.285-3.401)', '(Male speech, man speaking-4.454-5.266)', '(Laughter-5.517-6.184)', '(Male speech, man speaking-6.396-7.527)', '(Tick-7.546-7.672)', '(Tick-8.174-8.3)', '(Male speech, man speaking-8.551-9.701)']"
  },
  "YdxAXqgRVvKY.wav": {
    "caption": "A man speaks while a hair dryer runs in a veterinarian's office, creating a constant humming sound.",
    "timestamp_events": "['(Laughter-0.0-0.879)', '(Hair dryer-0.0-9.966)', '(Chuckle, chortle-8.781-9.966)']"
  },
  "YWThlVvZxVyU.wav": {
    "caption": "A phone rings while a woman speaks in a server room, accompanied by background music and occasional speech.",
    "timestamp_events": "['(Radio-0.0-1.159)', '(Mechanisms-0.0-10.0)', '(Brief tone-1.045-1.557)', '(Radio-2.637-6.187)', '(Male speech, man speaking-2.637-3.645)', '(Male speech, man speaking-3.767-7.625)', '(Surface contact-7.057-7.268)', '(Radio-7.276-8.876)', '(Male speech, man speaking-7.983-10.0)', '(Radio-9.347-10.0)']"
  },
  "pLqvYlIX9MU.wav": {
    "caption": "A man speaks followed by a loud explosion, suggesting that the audio takes place in an environment where speech and explosive events occur.",
    "timestamp_events": "['(Explosion-8.008-9.583)', '(Male speech, man speaking-4.189-4.898)', '(Tick-3.756-3.829)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-9.425-9.937)']"
  },
  "YA-uLcvvBcso.wav": {
    "caption": "Food sizzles and is stirred as an adult male speaks in a quiet environment, accompanied by faint vehicle and water sounds.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Generic impact sounds-0.428-0.574)', '(Generic impact sounds-1.516-1.654)', '(Ratchet, pawl-2.312-10.0)', '(Generic impact sounds-4.018-4.132)']"
  },
  "YdnDILSTKH5s.wav": {
    "caption": "A man speaks while a pig oinks in the background, creating a rural atmosphere.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.695)', '(Conversation-0.0-10.0)', '(Waves, surf-0.0-10.0)', '(Wind noise (microphone)-0.0-10.0)', '(Male speech, man speaking-0.979-5.01)', '(Male speech, man speaking-5.467-6.29)', '(Human voice-6.732-7.244)', '(Grunt-7.293-8.779)', '(Breathing-8.862-9.305)', '(Male speech, man speaking-9.298-10.0)']"
  },
  "YYSlKMpCnRDA.wav": {
    "caption": "The clock ticks steadily, creating a rhythmic tick-tock sound effect in a quiet room.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Tick-0.052-0.155)', '(Tick-0.278-0.354)', '(Tick-0.485-0.581)', '(Tick-0.684-0.787)', '(Tick-0.911-0.979)', '(Tick-1.096-1.186)', '(Tick-1.282-1.371)', '(Tick-1.495-1.591)', '(Tick-1.701-1.784)', '(Tick-1.907-1.983)', '(Tick-2.107-2.196)', '(Tick-2.313-2.382)', '(Tick-2.505-2.581)', '(Tick-2.691-2.794)', '(Tick-2.918-2.993)', '(Tick-3.124-3.206)', '(Tick-3.33-3.406)', '(Tick-3.509-3.598)', '(Tick-3.736-3.804)', '(Tick-3.928-4.01)', '(Ding-4.116-4.88)', '(Tick-4.134-4.21)', '(Tick-4.361-4.437)', '(Tick-4.567-4.65)', '(Tick-4.773-4.849)', '(Tick-4.979-5.062)', '(Tick-5.199-5.268)', '(Tick-5.392-5.474)', '(Tick-5.612-5.715)', '(Tick-5.839-5.9)', '(Tick-6.01-6.107)', '(Tick-6.21-6.313)', '(Tick-6.416-6.505)', '(Tick-6.622-6.691)', '(Tick-6.828-6.897)', '(Tick-7.034-7.117)', '(Tick-7.241-7.309)', '(Tick-7.426-7.509)', '(Tick-7.632-7.722)', '(Tick-7.825-7.921)', '(Tick-8.065-8.148)', '(Tick-8.272-8.361)', '(Tick-8.485-8.567)', '(Tick-8.711-8.794)', '(Tick-8.918-8.993)', '(Tick-9.096-9.179)', '(Tick-9.303-9.385)', '(Tick-9.529-9.591)', '(Tick-9.701-9.777)', '(Tick-9.9-10.0)']"
  },
  "YiwAoPcpRL5U.wav": {
    "caption": "A sine wave plays with a faint background music and the occasional sound of a passing vehicle.",
    "timestamp_events": "['(Sine wave-0.0-9.068)']"
  },
  "YrKBrhg-3HQs.wav": {
    "caption": "Soft music plays as a heart murmur is heard, followed by a sudden loud bang in a hospital room.",
    "timestamp_events": "['(Music-0.0-4.643)', '(Heart sounds, heartbeat-4.725-5.323)', '(Heart sounds, heartbeat-6.67-7.124)', '(Heart sounds, heartbeat-8.519-8.952)', '(Splash, splatter-8.794-10.0)']"
  },
  "mcn2m3hClP0.wav": {
    "caption": "A man gives a speech with a speech synthesizer in the background, indicating a speech event in an indoor environment.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.391)', '(Male speech, man speaking-1.874-8.213)']"
  },
  "Y4kQGVksBzfw.wav": {
    "caption": "A man clears his throat followed by soothing music playing in a movie theater.",
    "timestamp_events": "['(Cough-4.061-4.616)', '(Music-5.034-7.831)', '(Tick-0.691-0.78)', '(Background noise-5.025-7.826)', '(Male singing-2.571-3.403)']"
  },
  "Y01WPztJHYe8.wav": {
    "caption": "A man confidently delivers a speech at a podium, his voice resonating in an indoor setting. (Audio-visual label: Narration, monologue; Male speech, man speaking; Speech)",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Reverberation-0.008-0.291)', '(Breathing-0.268-0.908)', '(Male speech, man speaking-1.047-2.898)', '(Breathing-3.164-3.91)', '(Male speech, man speaking-4.089-4.929)', '(Reverberation-4.819-5.433)', '(Male speech, man speaking-5.61-6.703)', '(Breathing-6.761-7.403)', '(Male speech, man speaking-7.467-9.456)', '(Breathing-9.653-10.0)']"
  },
  "YsThLSiwayWc.wav": {
    "caption": "Water pours out of a faucet, creating a steady stream, while occasional drips can be heard in the background.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.23-1.168)', '(Pump (liquid)-1.124-2.679)', '(Generic impact sounds-2.643-3.054)', '(Generic impact sounds-3.626-4.689)', '(Pump (liquid)-4.77-6.307)', '(Generic impact sounds-6.307-7.076)', '(Generic impact sounds-7.469-8.487)', '(Pump (liquid)-8.398-10.0)', '(Generic impact sounds-9.917-10.0)']"
  },
  "YOErpZ6GWees.wav": {
    "caption": "Church bells ring as people talk in the distance, creating a serene atmosphere in a peaceful village.",
    "timestamp_events": "['(Change ringing (campanology)-0.0-10.0)']"
  },
  "Y5BmS4XqiuZY.wav": {
    "caption": "Water runs continuously from a faucet as it fills a bathtub, creating a soothing and tranquil ambiance in a bathroom.",
    "timestamp_events": "['(Pump (liquid)-0.0-10.0)']"
  },
  "Yah7iBQ7FeO0.wav": {
    "caption": "A man speaks while music plays and a car horn honks in the background on a subway train.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.167)', '(Subway, metro, underground-0.0-10.0)', '(Music-0.0-10.0)', '(Male speech, man speaking-1.728-2.816)', '(Male speech, man speaking-2.979-4.49)', '(Male speech, man speaking-4.806-5.773)', '(Male speech, man speaking-6.009-7.447)', '(Male speech, man speaking-7.723-9.022)', '(Male speech, man speaking-9.364-10.0)']"
  },
  "Yd1LTpzb6FPE.wav": {
    "caption": "A dog whimpers while music plays in the background, resembling the sound of a basketball bouncing in a bookstore.",
    "timestamp_events": "['(Music-0.087-10.0)', '(Squeal-2.629-3.157)', '(Basketball bounce-3.377-3.669)', '(Squeal-3.97-5.131)', '(Basketball bounce-4.839-5.066)', '(Squeal-5.286-5.684)', '(Basketball bounce-5.359-5.627)', '(Squeal-5.887-6.537)', '(Generic impact sounds-7.82-8.064)', '(Squeal-8.259-9.055)', '(Sound effect-9.25-10.0)']"
  },
  "YhFgWZmFG9c0.wav": {
    "caption": "Rain falls onto a hard surface as wood creaks, indicating a rainfall on a patio in a yard.",
    "timestamp_events": "['(Rain on surface-0.0-0.257)', '(Wind-0.0-10.0)', '(Thump, thud-0.387-0.704)', '(Rain on surface-0.509-2.727)', '(Thump, thud-2.784-3.157)', '(Rain on surface-2.987-4.018)', '(Rain on surface-4.181-5.164)', '(Rain on surface-5.286-7.479)', '(Rain on surface-7.633-10.0)']"
  },
  "Y1NkDKBAtfcY.wav": {
    "caption": "Soft music plays with a gentle ding-dong sound as marimba and xylophone create a soothing ambiance in an art gallery.",
    "timestamp_events": "['(Music-0.542-10.0)', '(Tick-9.51-9.648)', '(Breathing-9.607-10.0)']"
  },
  "KJF1deXG8mc.wav": {
    "caption": "A woman speaks followed by three consecutive clanks of glassware in a restaurant kitchen.",
    "timestamp_events": "['(Female speech, woman speaking-8.242-10.0)', '(Dishes, pots, and pans-3.712-4.126)', '(Glass chink, clink-4.243-4.546)', '(Human sounds-0.568-0.802)', '(Breathing-7.993-8.2)', '(Mechanisms-0.0-10.0)']"
  },
  "Y6Qx-Ps4Qroo.wav": {
    "caption": "The sound of a ticking clock fills the air as it rocks back and forth in a coffee shop.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Tick-0.062-0.184)', '(Tick-0.33-0.477)', '(Generic impact sounds-0.574-0.883)', '(Tick-0.899-1.029)', '(Generic impact sounds-1.037-1.663)', '(Tick-1.167-1.256)', '(Tick-1.533-1.622)', '(Tick-2.109-2.247)', '(Tick-2.402-2.499)', '(Tick-2.662-2.8)', '(Tick-3.027-3.149)', '(Tick-3.32-3.417)', '(Tick-3.596-3.702)', '(Generic impact sounds-3.677-3.775)', '(Tick-3.937-4.083)', '(Generic impact sounds-4.092-4.189)', '(Tick-4.23-4.36)', '(Tick-4.506-4.652)', '(Tick-4.815-4.936)', '(Tick-5.131-5.237)', '(Tick-5.424-5.554)', '(Tick-5.708-5.822)', '(Tick-5.944-6.098)', '(Generic impact sounds-5.976-6.301)', '(Tick-6.293-6.431)', '(Tick-6.618-6.78)', '(Tick-6.918-7.073)', '(Generic impact sounds-7.024-7.243)', '(Human voice-7.089-8.389)', '(Tick-7.235-7.365)', '(Tick-7.528-7.641)', '(Tick-7.82-7.966)', '(Generic impact sounds-8.121-8.243)', '(Tick-8.129-8.275)', '(Generic impact sounds-8.478-9.754)', '(Tick-8.763-8.868)']"
  },
  "Y9FryzfUVnno.wav": {
    "caption": "A woman speaks while a dog barks in the background, creating a lively atmosphere in the park.",
    "timestamp_events": "['(Bark-9.575-10.0)', '(Tap-9.134-9.346)', '(Tick-8.819-8.969)', '(Background noise-0.0-10.0)', '(Child speech, kid speaking-9.504-10.0)']"
  },
  "Y-NN1-W7XzEE.wav": {
    "caption": "A man passionately delivers a speech, his voice resonating with conviction, in an art gallery filled with captivating black and white photographs.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.323)', '(Background noise-0.0-10.0)', '(Breathing-1.303-1.536)', '(Male speech, man speaking-1.557-3.0)', '(Breathing-3.021-3.248)', '(Male speech, man speaking-3.248-4.856)', '(Breathing-4.87-5.096)', '(Male speech, man speaking-5.117-7.096)', '(Breathing-7.124-7.344)', '(Male speech, man speaking-7.344-9.447)', '(Breathing-9.426-9.694)', '(Male speech, man speaking-9.701-10.0)']"
  },
  "YWZ-ZjJzchEY.wav": {
    "caption": "Goats bleat as farm animals and livestock make noise in the background on a sunny day at a farm.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Generic impact sounds-0.01-0.072)', '(Bleat-0.045-1.701)', '(Generic impact sounds-0.375-0.485)', '(Generic impact sounds-0.918-1.014)', '(Bleat-1.818-2.952)', '(Goat-2.278-3.351)', '(Human voice-2.292-2.918)', '(Generic impact sounds-2.952-3.289)', '(Bleat-3.268-4.168)', '(Generic impact sounds-4.278-4.375)', '(Bleat-4.292-4.732)', '(Generic impact sounds-4.725-5.041)', '(Bleat-4.938-5.701)', '(Generic impact sounds-6.155-6.258)', '(Bleat-6.485-8.052)', '(Generic impact sounds-6.663-6.787)', '(Bleat-8.505-8.911)', '(Generic impact sounds-8.753-8.856)', '(Generic impact sounds-9.076-9.179)', '(Bleat-9.467-9.983)', '(Generic impact sounds-9.619-9.694)']"
  },
  "YVzGOjcOj9fo.wav": {
    "caption": "Gunshots ring out as a man delivers a speech, creating a chaotic and intense atmosphere.",
    "timestamp_events": "['(Male speech, man speaking-0.0-2.109)', '(Conversation-0.0-4.511)', '(Background noise-0.0-10.0)', '(Gunshot, gunfire-2.109-3.282)', '(Male speech, man speaking-3.31-4.525)', '(Gunshot, gunfire-4.595-6.187)', '(Shout-5.0-5.489)', '(Shout-5.866-6.187)', '(Sound effect-6.257-8.617)', '(Sound effect-8.925-9.33)', '(Gunshot, gunfire-9.33-10.0)']"
  },
  "YK4-xBCHkoew.wav": {
    "caption": "A high pitched beep is followed by a person whistling in an environment with domestic animals or pets.",
    "timestamp_events": "['(Hiccup-9.449-9.677)', '(Background noise-0.0-10.0)']"
  },
  "YO9AdMudcL2c.wav": {
    "caption": "A woman's voice speaks over music while a dog growls in the background, suggesting a lively atmosphere in a playroom.",
    "timestamp_events": "['(Speech synthesizer-0.0-1.344)', '(Music-0.0-4.278)', '(Crunch-1.344-1.639)', '(Speech synthesizer-1.825-2.725)', '(Speech synthesizer-3.557-3.866)', '(Shout-3.557-3.928)', '(Shout-4.196-4.773)', '(Breathing-4.979-5.199)', '(Breathing-5.371-5.619)', '(Thump, thud-5.701-5.99)', '(Shout-6.052-7.096)', '(Sound effect-7.199-9.186)', '(Glass chink, clink-9.103-9.591)', '(Glass chink, clink-9.701-10.0)']"
  },
  "YKeI2qQdOjuA.wav": {
    "caption": "A man speaks while rubbing something, creating a scratching sound, in a shoe shop with faint background music.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Surface contact-0.179-0.37)', '(Surface contact-0.729-0.787)', '(Tick-0.873-0.925)', '(Tick-1.07-1.139)', '(Tick-1.301-1.371)', '(Male speech, man speaking-1.44-1.764)', '(Tick-1.475-1.533)', '(Scratch-1.631-3.436)', '(Male speech, man speaking-1.862-2.279)', '(Tick-3.939-4.02)', '(Surface contact-4.361-4.864)', '(Tick-5.067-5.124)', '(Male speech, man speaking-5.159-5.437)', '(Tick-5.385-5.448)', '(Male speech, man speaking-5.518-6.102)', '(Scratch-6.038-7.779)', '(Human sounds-8.248-8.352)', '(Tick-9.774-9.832)']"
  },
  "vUgvSKhhfbY.wav": {
    "caption": "A man speaks while a dog whimpers in the background, creating a Bow-wow; Speech audio-visual label.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.411)', '(Male speech, man speaking-0.603-6.591)', '(Human sounds-6.609-8.539)']"
  },
  "YlDapDelZLvA.wav": {
    "caption": "The sound of music fills the air as a bell rings, accompanied by the rhythmic beats of drums in a music studio.",
    "timestamp_events": "['(Music-0.0-10.0)']"
  },
  "Nxtqm2s8sLU.wav": {
    "caption": "A synthetic singing voice harmonizes with a melodic piano tune in a recreation room.",
    "timestamp_events": "['(Music-0.0-9.044)', '(Synthetic singing-0.242-2.077)', '(Synthetic singing-3.42-4.754)', '(Synthetic singing-6.531-7.556)', '(Synthetic singing-7.701-8.686)', '(Clapping-9.073-10.0)']"
  },
  "Y-JVgOQIAFaI.wav": {
    "caption": "The guitar strums along with the music, creating a harmonious melody in a musical performance.",
    "timestamp_events": "['(Music-0.008-10.0)']"
  },
  "YFN1rC23Rrlg.wav": {
    "caption": "An emergency vehicle siren blares loudly as traffic noise fills the street, indicating the presence of an ambulance or fire truck.",
    "timestamp_events": "['(Ambulance (siren)-0.0-2.165)', '(Traffic noise, roadway noise-0.0-10.0)', '(Air horn, truck horn-2.468-4.273)', '(Fire engine, fire truck (siren)-7.113-10.0)']"
  },
  "Y4lMdau8KRyM.wav": {
    "caption": "A man speaks while music plays in the background, creating a lively atmosphere in a hardware store.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Beep, bleep-0.135-0.493)', '(Beep, bleep-0.647-0.966)', '(Male speech, man speaking-1.614-4.966)', '(Male speech, man speaking-5.217-10.0)']"
  },
  "EZQnTHLRMZ4.wav": {
    "caption": "Latin American music plays as a man sings on stage with a band, captivating the crowd in an indoor setting.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Male singing-2.995-6.585)', '(Male singing-6.894-8.373)']"
  },
  "YOqRDImr1wj4.wav": {
    "caption": "A man speaks amidst music playing in the background, while artillery fire can be heard, suggesting a theater performance.",
    "timestamp_events": "['(Male speech, man speaking-0.0-2.15)', '(Music-0.0-10.0)', '(Machine gun-1.175-2.792)', '(Male speech, man speaking-2.345-3.547)', '(Tick-4.685-4.806)', '(Male speech, man speaking-4.831-5.789)', '(Male speech, man speaking-6.537-8.056)', '(Male speech, man speaking-8.535-9.786)']"
  },
  "Ycf8kZWXN9C0.wav": {
    "caption": "The telephone rings, followed by a man speaking in a small room, creating a dial tone effect.",
    "timestamp_events": "['(Telephone dialing, DTMF-0.0-1.227)', '(Mechanisms-0.0-10.0)', '(Busy signal-1.653-2.237)', '(Busy signal-2.684-3.227)', '(Busy signal-3.681-4.217)', '(Busy signal-4.684-5.268)', '(Busy signal-5.715-6.272)', '(Busy signal-6.746-7.344)', '(Generic impact sounds-7.591-7.983)', '(Breathing-8.175-8.663)', '(Male speech, man speaking-8.684-10.0)']"
  },
  "YMTnrE2a-wUg.wav": {
    "caption": "A man speaks while a baby cries, creating a babbling audio event in a small room.",
    "timestamp_events": "['(Male speech, man speaking-0.053-0.941)', '(Background noise-0.053-10.0)', '(Tick-0.895-0.978)', '(Tick-1.099-1.257)', '(Male speech, man speaking-1.437-5.041)', '(Breathing-4.169-4.485)', '(Babbling-4.281-6.185)', '(Breathing-6.057-6.26)', '(Human voice-6.328-6.539)', '(Laughter-6.396-7.479)', '(Breathing-6.486-6.802)', '(Male speech, man speaking-7.464-8.917)', '(Tick-9.27-9.323)', '(Breathing-9.443-9.752)', '(Tick-9.601-9.661)', '(Tick-9.797-9.887)']"
  },
  "Y7F4Hh3JiCVs.wav": {
    "caption": "The sound of flowing water and gurgling can be heard as an adult male speaks in the background in a rural, natural environment.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Waterfall-0.0-10.0)']"
  },
  "Y4GorkPZ6sOc.wav": {
    "caption": "Hip hop music plays softly as a man speaks in the background, creating a lively atmosphere in an indoor stage.",
    "timestamp_events": "['(Synthetic singing-0.0-0.272)', '(Music-0.0-10.0)', '(Synthetic singing-0.464-2.766)', '(Synthetic singing-2.897-4.725)', '(Synthetic singing-4.938-6.711)', '(Synthetic singing-6.835-7.619)', '(Synthetic singing-7.866-10.0)']"
  },
  "YhUZkoRD0zFY.wav": {
    "caption": "A baby cries while a woman speaks in a small room.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Child speech, kid speaking-0.32-1.371)', '(Female speech, woman speaking-0.849-3.433)', '(Generic impact sounds-3.227-3.825)', '(Female speech, woman speaking-3.619-4.567)', '(Generic impact sounds-4.526-4.835)', '(Generic impact sounds-5.138-5.536)', '(Child speech, kid speaking-5.344-6.815)', '(Female speech, woman speaking-5.969-6.897)', '(Generic impact sounds-6.876-7.467)', '(Female speech, woman speaking-7.303-8.299)', '(Generic impact sounds-8.004-8.32)', '(Generic impact sounds-8.849-9.179)', '(Generic impact sounds-9.385-9.763)']"
  },
  "YeH-tgCJKgls.wav": {
    "caption": "A crowd of people cheers and applauds as runners sprint in a race on an athletic field. (Speech: 0.73, Run: 0.54)",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Run-0.0-10.0)', '(Shout-0.0-10.0)', '(Male speech, man speaking-2.641-4.823)', '(Male speech, man speaking-5.576-10.0)']"
  },
  "YehV5s9vGUVU.wav": {
    "caption": "Footsteps crunch on leaves then transition to shuffling on gravel, suggesting someone is walking in a rural area, possibly encountering a snake.",
    "timestamp_events": "['(Background noise-0.014-9.103)', '(Walk, footsteps-1.4-5.455)', '(Bird-2.086-3.091)', '(Generic impact sounds-5.57-7.955)', '(Bird-7.982-9.103)']"
  },
  "YFNgKvPexLyk.wav": {
    "caption": "A man speaks while a baby cries in a small room, creating a somber atmosphere.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.956)', '(Conversation-0.0-10.0)', '(Background noise-0.0-10.0)', '(Female speech, woman speaking-0.489-0.956)', '(Throat clearing-1.219-1.61)', '(Male speech, man speaking-1.317-2.912)', '(Baby cry, infant cry-2.265-3.16)', '(Male speech, man speaking-3.19-4.853)', '(Baby cry, infant cry-3.491-4.251)', '(Female speech, woman speaking-4.628-5.643)', '(Male speech, man speaking-5.124-5.448)', '(Baby cry, infant cry-5.372-5.877)', '(Male speech, man speaking-5.809-6.464)', '(Laughter-6.26-7.216)', '(Male speech, man speaking-7.291-8.721)', '(Female speech, woman speaking-7.464-8.292)', '(Male speech, man speaking-8.871-10.0)', '(Female speech, woman speaking-9.263-10.0)']"
  },
  "YGy8AsjakgCc.wav": {
    "caption": "A man speaks while crumpling material in a small room, accompanied by the sound of jangling keys.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.933)', '(Mechanisms-0.0-10.0)', '(Breathing-0.835-1.242)', '(Crumpling, crinkling-1.505-2.588)', '(Male speech, man speaking-2.114-2.777)', '(Breathing-2.837-3.288)', '(Crumpling, crinkling-3.078-4.116)', '(Breathing-3.77-4.432)', '(Crumpling, crinkling-4.582-4.853)', '(Male speech, man speaking-4.74-7.351)', '(Crumpling, crinkling-5.899-7.457)', '(Crumpling, crinkling-7.743-8.021)', '(Breathing-8.269-8.804)', '(Crumpling, crinkling-8.352-8.743)']"
  },
  "Yd1gE89KLxcs.wav": {
    "caption": "Music plays in the background as a crowd applauds and cheers, creating a lively atmosphere in a crowded venue.",
    "timestamp_events": "['(Speech-0.0-2.514)', '(Mechanisms-0.0-10.0)', '(Tick-0.377-0.433)', '(Tick-0.601-0.698)', '(Clapping-2.779-3.128)', '(Cheering-2.779-8.128)', '(Clapping-3.436-10.0)', '(Cheering-9.497-10.0)']"
  },
  "Ygdr7bd8olO8.wav": {
    "caption": "A dog growls persistently while a cat purrs softly, creating a harmonious symphony of domestic animal sounds in a cozy home.",
    "timestamp_events": "['(Purr-0.0-4.955)', '(Mechanisms-0.0-9.434)', '(Generic impact sounds-0.499-0.678)', '(Generic impact sounds-0.849-1.208)', '(Surface contact-0.997-1.8)', '(Generic impact sounds-1.831-2.244)', '(Surface contact-2.306-2.555)', '(Generic impact sounds-3.42-3.545)', '(Generic impact sounds-3.747-4.059)', '(Generic impact sounds-4.402-4.854)', '(Generic impact sounds-5.056-5.196)', '(Surface contact-5.103-5.485)', '(Generic impact sounds-5.461-5.664)', '(Surface contact-5.757-6.256)', '(Generic impact sounds-5.866-6.1)', '(Purr-6.116-6.357)', '(Generic impact sounds-6.552-6.856)', '(Purr-7.043-7.386)', '(Generic impact sounds-7.767-7.985)', '(Purr-8.071-8.39)', '(Generic impact sounds-8.78-8.912)']"
  },
  "YJu6fWv9FkzA.wav": {
    "caption": "A glass clinks as a bell rings, creating a melodic sound in a room with background music playing.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Music-0.582-2.361)', '(Glass-2.272-10.0)', '(Music-3.239-4.059)']"
  },
  "YDgzwB7oyzyw.wav": {
    "caption": "Loud pops and crackles echo through the street as a crowd cheers and someone gives a speech, accompanied by fireworks.",
    "timestamp_events": "['(Crowd-0.0-5.859)', '(Background noise-0.0-10.0)', '(Firecracker-0.34-1.165)', '(Firecracker-1.516-1.777)', '(Firecracker-2.093-2.299)', '(Firecracker-2.526-3.227)', '(Firecracker-3.591-3.825)', '(Firecracker-4.175-4.437)', '(Firecracker-4.711-5.138)', '(Firecracker-5.9-6.691)', '(Crowd-6.546-7.88)', '(Firecracker-7.818-9.083)', '(Crowd-8.973-10.0)']"
  },
  "YIAXpbQcov3o.wav": {
    "caption": "Two women laugh and chuckle in a dorm room, creating a lively and joyful atmosphere.",
    "timestamp_events": "['(Laughter-0.0-0.681)', '(Female speech, woman speaking-0.0-2.644)', '(Conversation-0.0-10.0)', '(Breathing-0.453-0.681)', '(Laughter-0.803-1.308)', '(Breathing-1.333-1.569)', '(Laughter-1.65-2.66)', '(Breathing-2.693-3.442)', '(Female speech, woman speaking-3.018-6.276)', '(Breathing-4.321-4.777)', '(Laughter-4.623-6.227)', '(Breathing-6.154-6.992)', '(Female speech, woman speaking-6.732-9.476)', '(Laughter-8.597-9.142)', '(Female speech, woman speaking-9.672-10.0)']"
  },
  "YM0uRNuZdjcY.wav": {
    "caption": "A man whispers and then speaks, followed by breathing, in a quiet environment with occasional writing sounds.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Male speech, man speaking-0.256-2.087)', '(Breathing-2.356-4.161)', '(Male speech, man speaking-4.302-4.955)', '(Breathing-4.763-5.698)', '(Whispering-5.826-6.953)', '(Breathing-6.748-7.388)', '(Whispering-7.439-7.964)', '(Whispering-9.232-10.0)']"
  },
  "YmFOLnQmlMXw.wav": {
    "caption": "A person whispers and breathes heavily while chewing and speaking in a serene environment near a creek.",
    "timestamp_events": "['(Stream, river-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Female speech, woman speaking-1.722-2.354)', '(Female speech, woman speaking-2.794-4.402)', '(Female speech, woman speaking-5.797-6.237)', '(Female speech, woman speaking-7.639-8.272)', '(Female speech, woman speaking-8.608-10.0)']"
  },
  "YM0vwoUeXfLU.wav": {
    "caption": "A person snores loudly while people talk in the distance, creating a peaceful ambiance in a bedroom.",
    "timestamp_events": "['(Snoring-0.0-0.412)', '(Background noise-0.0-10.0)', '(Breathing-0.444-0.745)', '(Snoring-0.737-1.719)', '(Snoring-1.825-3.864)', '(Human sounds-3.401-3.872)', '(Breathing-3.921-4.1)', '(Snoring-4.092-5.172)', '(Breathing-5.156-5.334)', '(Snoring-5.399-5.651)', '(Breathing-5.651-6.829)', '(Male speech, man speaking-6.626-7.82)', '(Snoring-7.365-8.478)', '(Male speech, man speaking-8.316-9.291)', '(Breathing-8.706-10.0)', '(Female speech, woman speaking-9.494-10.0)']"
  },
  "YfI-oB9YuHa0.wav": {
    "caption": "A man speaks while a horse trots and people sing in the background in a ballroom.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.843)', '(Music-0.993-10.0)', '(Male singing-1.084-6.403)', '(Tap dance-1.52-10.0)', '(Male speech, man speaking-1.681-1.983)', '(Male speech, man speaking-2.423-2.725)', '(Male speech, man speaking-3.467-3.9)', '(Male speech, man speaking-4.299-4.629)', '(Male speech, man speaking-5.385-6.237)', '(Male singing-8.202-10.0)']"
  },
  "YzzlYZX0r4iM.wav": {
    "caption": "A dog barks while people speak, creating a lively atmosphere in a domestic setting with pets and speech.",
    "timestamp_events": "['(Background noise-0.073-10.0)', '(Bark-0.093-0.356)', '(Bark-0.488-0.737)', '(Bark-0.84-1.048)', '(Human voice-1.248-2.369)', '(Bark-1.767-1.919)', '(Human voice-2.597-3.759)', '(Bark-2.604-2.894)', '(Bark-3.365-3.593)', '(Male speech, man speaking-3.413-5.508)', '(Human voice-3.904-6.152)', '(Male speech, man speaking-5.709-6.297)', '(Bark-5.778-6.062)', '(Bark-6.484-6.684)', '(Human voice-6.484-7.21)', '(Bark-7.078-7.355)', '(Male speech, man speaking-7.493-7.728)', '(Bark-7.887-8.51)', '(Male speech, man speaking-8.351-8.703)', '(Bark-9.174-9.423)', '(Human voice-9.554-10.0)', '(Bark-9.796-10.0)']"
  },
  "YKQnpCGAM7eo.wav": {
    "caption": "Electronic music plays as a drum kit creates rhythmic beats, accompanied by occasional typewriter sounds, in a music studio.",
    "timestamp_events": "['(Sound effect-0.053-3.205)', '(Beep, bleep-1.046-1.159)', '(Beep, bleep-2.032-2.175)', '(Beep, bleep-3.047-3.16)', '(Music-3.175-10.0)', '(Typewriter-6.14-7.449)', '(Typewriter-7.818-8.427)', '(Typewriter-8.653-9.383)', '(Typewriter-9.631-10.0)']"
  },
  "YEDsIqibDOvU.wav": {
    "caption": "A person taps their fingers on a table while music plays in the background at an entertainment center.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Noise-0.0-10.0)', '(Tap dance-0.0-10.0)']"
  },
  "YFKl6JRM7D44.wav": {
    "caption": "People are speaking while music plays and bells ring in a chemistry lab, creating a lively atmosphere.",
    "timestamp_events": "['(Glass-0.0-10.0)', '(Music-0.0-10.0)', '(Hubbub, speech noise, speech babble-0.0-10.0)']"
  },
  "YlWLgxGBv-K4.wav": {
    "caption": "The drums beat loudly as the crowd cheers and applauds, creating a rock music atmosphere in a conference center.",
    "timestamp_events": "['(Music-0.0-4.176)', '(Applause-3.243-10.0)', '(Crowd-3.251-10.0)', '(Whistling-5.094-6.238)', '(Shout-5.5-6.358)', '(Whistling-8.269-8.668)', '(Shout-8.548-9.564)']"
  },
  "YE3UUOFwRHXg.wav": {
    "caption": "A man speaks with a speech synthesizer as music plays in the background, creating an electronic atmosphere.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.606)', '(Music-0.0-10.0)', '(Breathing-1.648-1.858)', '(Male speech, man speaking-1.858-3.003)', '(Breathing-3.045-3.338)', '(Male speech, man speaking-3.352-5.237)', '(Breathing-5.293-5.587)', '(Male speech, man speaking-5.587-6.816)', '(Male speech, man speaking-7.277-8.282)', '(Human sounds-8.799-10.0)', '(Breathing-8.994-9.19)', '(Male speech, man speaking-9.204-10.0)']"
  },
  "YI0GjYjd0oY0.wav": {
    "caption": "The sound of glass shattering is accompanied by a bell ringing repeatedly, creating a chaotic atmosphere in an office.",
    "timestamp_events": "['(Music-0.0-6.652)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.166-1.249)', '(Generic impact sounds-2.415-3.537)', '(Generic impact sounds-4.567-6.546)', '(Generic impact sounds-6.975-8.48)', '(Music-8.458-10.0)', '(Generic impact sounds-9.075-9.225)', '(Generic impact sounds-9.383-9.85)']"
  },
  "YN7dvsk67MNI.wav": {
    "caption": "The sound of sizzling food fills the air as music plays and a woman speaks in a kitchen.",
    "timestamp_events": "['(Child speech, kid speaking-0.0-0.684)', '(Water tap, faucet-0.0-10.0)', '(Music-0.0-10.0)', '(Child speech, kid speaking-2.263-3.869)', '(Child speech, kid speaking-4.777-5.587)', '(Child speech, kid speaking-6.089-7.053)', '(Tick-6.885-7.039)', '(Tick-8.059-8.226)', '(Child speech, kid speaking-9.162-9.818)']"
  },
  "YG6NTjpU-uvI.wav": {
    "caption": "The sound of cutlery and dishes being tapped can be heard while a man speaks in a restaurant kitchen.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.097)', '(Background noise-0.0-10.0)', '(Boiling-0.0-10.0)', '(Cutlery, silverware-0.18-0.374)', '(Cutlery, silverware-0.435-0.636)', '(Male speech, man speaking-0.576-1.391)', '(Male speech, man speaking-2.057-3.111)', '(Male speech, man speaking-5.116-6.604)', '(Male speech, man speaking-6.702-8.19)', '(Male speech, man speaking-8.571-9.394)']"
  },
  "YCyMoIbd3owY.wav": {
    "caption": "A man speaks on stage as a crowd cheers and children shout in an orchestra pit.",
    "timestamp_events": "['(Applause-7.252-10.0)', '(Crowd-6.252-10.0)', '(Male speech, man speaking-3.543-6.252)', '(Shout-6.351-8.297)', '(Background noise-0.0-10.0)', '(Breathing-3.276-3.543)', '(Children shouting-8.323-10.0)']"
  },
  "Yl2CRfIkwYB4.wav": {
    "caption": "The sound of music is accompanied by the distinctive noise of a helicopter flying by in a rural outdoor setting.",
    "timestamp_events": "['(Aircraft engine-0.0-10.0)', '(Wind-0.0-10.0)', '(Music-0.0-10.0)']"
  },
  "YgVfrWLTumiI.wav": {
    "caption": "Synthetic singing accompanies a Christian music tune, creating a cozy atmosphere inside a small room.",
    "timestamp_events": "['(Synthetic singing-0.0-0.622)', '(Music-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Synthetic singing-2.268-4.803)', '(Synthetic singing-4.984-7.394)', '(Synthetic singing-7.543-10.0)']"
  },
  "YIj1umQzgOoY.wav": {
    "caption": "A person whistles while music plays softly in the background in a movie theater.",
    "timestamp_events": "['(Whistling-0.0-0.134)', '(Music-0.0-10.0)', '(Background noise-0.0-10.0)', '(Whistling-0.236-0.354)', '(Whistling-0.465-0.882)', '(Whistling-1.646-1.787)', '(Whistling-1.984-2.079)', '(Whistling-2.173-2.283)', '(Whistling-2.457-3.969)', '(Whistling-4.291-4.874)', '(Breathing-4.591-4.866)', '(Whistling-5.606-5.992)', '(Whistling-6.197-6.543)', '(Whistling-6.866-7.551)', '(Breathing-7.102-7.354)', '(Whistling-7.795-8.063)', '(Whistling-8.307-8.953)', '(Human voice-9.299-10.0)', '(Whistling-9.551-9.756)']"
  },
  "YLwNFrxoGLko.wav": {
    "caption": "The sound of a train horn echoes as railroad crossing bells ring, indicating the presence of a train passing by.",
    "timestamp_events": "['(Wind-0.0-10.0)', '(Train-0.0-10.0)', '(Bell-0.444-6.072)', '(Train horn-6.411-9.248)', '(Bell-8.984-10.0)']"
  },
  "YLiwPIqTpmKc.wav": {
    "caption": "A guitar strums while someone sings and a band plays music in a music studio.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Noise-0.0-10.0)', '(Female singing-0.0-10.0)']"
  },
  "YM6rXbTuTx3s.wav": {
    "caption": "A passionate speech is delivered as the crowd erupts into battle cries, filling the barbershop with energy.",
    "timestamp_events": "['(Battle cry-0.0-1.963)', '(Male speech, man speaking-1.974-4.263)', '(Battle cry-4.35-7.148)', '(Clapping-6.725-9.458)', '(Male speech, man speaking-7.712-8.428)', '(Male speech, man speaking-9.09-9.458)']"
  },
  "Yn8KnzhAwcTA.wav": {
    "caption": "Children are singing and playing music while a crowd cheers and children shout in a school graduation ceremony.",
    "timestamp_events": "['(Child singing-0.0-1.492)', '(Wind-0.0-10.0)', '(Music-0.0-10.0)', '(Child singing-1.752-4.018)', '(Child singing-4.481-5.269)', '(Child singing-5.489-6.407)', '(Male singing-5.521-6.228)']"
  },
  "YH6C8wQ0X20s.wav": {
    "caption": "A man speaks inside a small room while keys jangle, suggesting he is in a mechanical fan-filled environment.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.88)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.936-4.008)', '(Male speech, man speaking-1.55-2.737)', '(Breathing-2.765-3.547)', '(Male speech, man speaking-4.246-5.531)', '(Breathing-5.279-6.173)', '(Generic impact sounds-6.117-6.592)', '(Breathing-6.578-7.5)', '(Generic impact sounds-6.83-7.193)', '(Male speech, man speaking-8.142-9.651)']"
  },
  "YFwTFMLjvsww.wav": {
    "caption": "The guitar strums along with background music as a crowd cheers and enjoys the concert on stage.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Clapping-0.2-0.542)', '(Clapping-0.688-1.159)', '(Clapping-1.33-1.719)', '(Clapping-1.882-2.272)', '(Clapping-2.467-2.865)', '(Clapping-3.044-3.466)', '(Clapping-3.612-3.994)', '(Clapping-4.165-4.603)', '(Clapping-4.782-5.172)', '(Clapping-5.334-5.716)', '(Clapping-5.846-6.309)', '(Clapping-6.464-7.382)', '(Clapping-7.56-8.519)', '(Clapping-8.681-9.356)']"
  },
  "YmhwuZTe5jIo.wav": {
    "caption": "A siren blares as a dog howls, suggesting an alarm or emergency situation, possibly in a residential area.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Fire alarm-0.03-1.753)', '(Dog-0.656-1.09)', '(Howl-1.776-2.727)', '(Fire alarm-2.526-3.454)', '(Fire alarm-3.881-5.177)', '(Howl-3.97-4.928)', '(Bark-5.091-5.261)', '(Fire alarm-5.56-6.701)', '(Fire alarm-6.886-8.432)', '(Fire alarm-8.633-9.81)']"
  },
  "YGCjHPB88Jg4.wav": {
    "caption": "A man sings while strumming a guitar in a dressing room, creating a melodic musical atmosphere.",
    "timestamp_events": "['(Male singing-0.0-0.564)', '(Music-0.0-4.018)', '(Background noise-0.0-10.0)', '(Male singing-1.347-3.996)', '(Male singing-4.221-5.41)', '(Music-4.597-10.0)', '(Male singing-7.178-10.0)']"
  },
  "YF3wwKUEwpy0.wav": {
    "caption": "A man speaks while biting and chewing something, accompanied by the sound of crumpling material in a dressing room.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.745)', '(Mechanisms-0.0-10.0)', '(Biting-0.745-1.037)', '(Chewing, mastication-1.078-3.149)', '(Chewing, mastication-3.32-3.442)', '(Male speech, man speaking-3.499-4.449)', '(Chewing, mastication-3.905-4.051)', '(Surface contact-4.62-5.099)', '(Chewing, mastication-4.717-4.88)', '(Male speech, man speaking-5.131-7.463)', '(Surface contact-5.944-6.813)', '(Surface contact-7.17-7.706)', '(Chewing, mastication-7.544-8.096)', '(Surface contact-8.291-9.039)', '(Chewing, mastication-8.308-8.446)', '(Chewing, mastication-9.356-9.981)', '(Brief tone-9.713-9.965)', '(Male speech, man speaking-9.721-9.973)']"
  },
  "YjZX5twZFMzE.wav": {
    "caption": "A motorcycle engine revs up multiple times, creating a roaring sound in an urban environment.",
    "timestamp_events": "['(Accelerating, revving, vroom-0.0-2.175)', '(Motorcycle-0.0-10.0)', '(Engine knocking-1.588-4.846)', '(Accelerating, revving, vroom-4.184-10.0)', '(Engine knocking-5.546-7.201)']"
  },
  "Yl8PYK5Sc0w0.wav": {
    "caption": "A man speaks amidst the pleasant sound of birds chirping in an outdoor setting, possibly in a park or garden.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-0.819)', '(Chirp, tweet-0.0-0.845)', '(Conversation-0.0-10.0)', '(Male speech, man speaking-0.102-0.615)', '(Male speech, man speaking-0.832-1.344)', '(Chirp, tweet-0.96-3.303)', '(Female speech, woman speaking-1.485-3.214)', '(Male speech, man speaking-2.433-7.35)', '(Female speech, woman speaking-3.496-4.942)', '(Chirp, tweet-3.521-3.995)', '(Chirp, tweet-4.174-4.392)', '(Chirp, tweet-4.52-4.814)', '(Chirp, tweet-5.045-5.429)', '(Female speech, woman speaking-5.198-7.682)', '(Chirp, tweet-5.787-6.287)', '(Chirp, tweet-6.581-6.799)', '(Chirp, tweet-6.94-8.041)', '(Male speech, man speaking-7.746-8.617)', '(Chirp, tweet-8.399-10.0)', '(Male speech, man speaking-8.784-10.0)']"
  },
  "YKZip3k3Ij0M.wav": {
    "caption": "A rooster crows twice while chickens and fowls make noise in the background on a farm.",
    "timestamp_events": "['(Bird-0.0-0.255)', '(Fowl-1.356-3.587)', '(Hubbub, speech noise, speech babble-2.836-6.189)', '(Bird-6.12-9.348)']"
  },
  "YfAa-cpEpK1Y.wav": {
    "caption": "Pigeons coo and flap their wings as they gather on a tiled patio, creating a peaceful ambiance.",
    "timestamp_events": "['(Mechanisms-0.0-9.444)', '(Wind-0.0-9.46)', '(Generic impact sounds-0.021-0.146)', '(Coo-0.123-0.695)', '(Generic impact sounds-0.476-1.314)', '(Coo-0.899-1.181)', '(Surface contact-1.189-1.542)', '(Coo-1.44-2.028)', '(Generic impact sounds-1.604-1.714)', '(Generic impact sounds-2.043-2.153)', '(Coo-2.13-2.843)', '(Generic impact sounds-2.326-2.435)', '(Generic impact sounds-2.624-2.733)', '(Coo-3.094-3.643)', '(Generic impact sounds-3.98-4.254)', '(Surface contact-4.254-4.387)', '(Coo-4.364-4.513)', '(Generic impact sounds-4.607-4.975)', '(Coo-4.756-5.085)', '(Generic impact sounds-5.195-5.32)', '(Generic impact sounds-5.571-5.963)', '(Surface contact-6.143-6.81)', '(Coo-6.183-6.873)', '(Generic impact sounds-7.625-7.813)', '(Generic impact sounds-8.37-8.519)', '(Bird flight, flapping wings-8.487-9.444)']"
  },
  "YDe-hL7mmyPM.wav": {
    "caption": "A train horn blares loudly as it passes through a rail transport area, indicating the presence of a train.",
    "timestamp_events": "['(Train horn-0.0-4.459)', '(Wind-0.0-10.0)', '(Train-0.0-10.0)', '(Chirp, tweet-0.035-0.428)', '(Chirp, tweet-1.053-1.816)', '(Chirp, tweet-2.932-5.269)', '(Train horn-5.205-5.865)', '(Chirp, tweet-5.72-8.415)', '(Train horn-6.75-10.0)', '(Chirp, tweet-9.277-9.63)']"
  },
  "Yj03cah7gGFU.wav": {
    "caption": "A woman laughs and coughs followed by a woman speaking, creating a lively atmosphere in a room.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Cough-0.632-1.374)', '(Breathing-1.356-1.928)', '(Conversation-1.803-10.0)', '(Male speech, man speaking-1.83-2.268)', '(Cough-2.25-2.688)', '(Female speech, woman speaking-2.92-4.824)', '(Hubbub, speech noise, speech babble-2.956-10.0)', '(Female speech, woman speaking-5.011-6.629)', '(Male speech, man speaking-7.46-8.487)', '(Female speech, woman speaking-8.657-10.0)']"
  },
  "YdcgqwhnmyBw.wav": {
    "caption": "A crowd erupts in cheers and applause as music plays, singers sing, and someone shouts in a large, indoor room.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Choir-0.0-10.0)', '(Shout-0.375-3.598)', '(Shout-3.907-4.931)', '(Shout-5.392-6.272)', '(Shout-6.835-8.004)', '(Shout-8.333-10.0)']"
  },
  "Ye9rFLFyOTJQ.wav": {
    "caption": "A motor vehicle engine runs while people talk in the background, creating a bustling atmosphere in an outdoor stage.",
    "timestamp_events": "['(Male speech, man speaking-0.0-4.823)', '(Liquid-0.0-10.0)', '(Noise-0.0-10.0)', '(Male speech, man speaking-6.208-7.6)', '(Male speech, man speaking-7.908-9.534)']"
  },
  "YISxOV4i0CTI.wav": {
    "caption": "A man speaks while objects are tapped, indicating the audio event of a sliding door in an unknown environment.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Drawer open or close-0.081-1.333)', '(Male speech, man speaking-1.871-2.813)', '(Drawer open or close-2.821-5.648)', '(Male speech, man speaking-3.859-5.442)', '(Male speech, man speaking-7.217-8.299)']"
  },
  "YEfy4k1bjoSY.wav": {
    "caption": "A group of people clapping and singing while a beatboxing sound accompanies them in a crowded venue.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Female singing-6.228-10.0)']"
  },
  "YGYex47j3ykw.wav": {
    "caption": "A guitar is being played on stage while music is being played, creating a lively atmosphere.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Male singing-0.0-10.0)', '(Female singing-0.0-10.0)']"
  },
  "YGw5ShKNyx0w.wav": {
    "caption": "A hair dryer hums softly while a woman speaks in the background at a beauty salon.",
    "timestamp_events": "['(Hair dryer-0.0-10.0)', '(Female speech, woman speaking-1.797-2.705)', '(Hubbub, speech noise, speech babble-1.797-7.186)', '(Conversation-1.804-6.217)', '(Female speech, woman speaking-3.034-3.742)', '(Male speech, man speaking-4.168-6.333)']"
  },
  "Yk68xWjEnJkc.wav": {
    "caption": "Birds chirp in the background followed by an insect buzzing, creating a lively atmosphere on the farm.",
    "timestamp_events": "['(Generic impact sounds-0.0-0.541)', '(Chicken, rooster-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.986-1.643)', '(Generic impact sounds-2.097-2.551)', '(Generic impact sounds-3.034-3.585)', '(Generic impact sounds-4.019-5.507)', '(Generic impact sounds-6.377-7.073)', '(Generic impact sounds-7.99-8.126)']"
  },
  "Ylg-K5wOQs0U.wav": {
    "caption": "Music plays softly as a crowd sings along with a choir, creating a harmonious atmosphere in the room.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Choir-0.0-10.0)', '(Male speech, man speaking-0.46-1.549)', '(Male speech, man speaking-1.719-2.524)', '(Male speech, man speaking-3.499-4.806)', '(Male speech, man speaking-9.347-10.0)']"
  },
  "YkWQTexbT40U.wav": {
    "caption": "A sewing machine hums as a woman speaks and music plays in the background in a bustling workshop.",
    "timestamp_events": "['(Mechanisms-0.07-3.283)', '(Hubbub, speech noise, speech babble-3.295-8.161)', '(Child speech, kid speaking-3.306-7.183)', '(Human sounds-7.264-7.858)', '(Laughter-7.392-8.172)', '(Music-7.73-10.0)']"
  },
  "YhmYXluiYfqQ.wav": {
    "caption": "A race car accelerates and skids while music plays in the background at an auto racing event.",
    "timestamp_events": "['(Accelerating, revving, vroom-0.0-3.239)', '(Race car, auto racing-0.0-3.307)', '(Music-0.015-10.0)', '(Accelerating, revving, vroom-6.789-7.365)', '(Race car, auto racing-6.829-10.0)', '(Accelerating, revving, vroom-7.788-10.0)']"
  },
  "YKjISzQTTIq4.wav": {
    "caption": "An adult male speaks followed by a thump, while humming can be heard in the background; possibly in a music studio.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Breathing-0.315-0.803)', '(Male singing-0.811-1.85)', '(Breathing-1.984-2.748)', '(Male singing-2.835-3.654)', '(Male singing-3.787-4.622)', '(Human sounds-4.244-4.339)', '(Breathing-4.63-4.906)', '(Human sounds-4.945-5.087)', '(Breathing-5.197-5.488)', '(Human sounds-5.606-5.787)', '(Breathing-5.772-6.26)', '(Human sounds-6.299-6.409)', '(Male singing-6.331-7.362)', '(Human sounds-6.969-7.071)', '(Human sounds-7.638-7.819)', '(Breathing-7.961-8.299)', '(Human sounds-8.394-8.504)', '(Breathing-8.551-8.953)', '(Human sounds-8.984-9.11)', '(Male singing-9.031-10.0)', '(Human sounds-9.362-9.465)', '(Human sounds-9.717-9.787)']"
  },
  "YHZbQ3lTObas.wav": {
    "caption": "A man sings while rock and roll music plays in a physics laboratory.",
    "timestamp_events": "['(Male singing-0.0-2.101)', '(Music-0.0-10.0)', '(Choir-2.166-3.507)', '(Male singing-3.466-5.684)', '(Choir-5.659-10.0)', '(Male singing-7.43-9.843)']"
  },
  "YIkr9QTWUhlg.wav": {
    "caption": "The crowd erupts in applause as a guitar strums and music fills the air in a lively concert.",
    "timestamp_events": "['(Music-0.0-6.035)', '(Background noise-0.0-10.0)', '(Applause-5.884-10.0)', '(Shout-5.884-10.0)', '(Crowd-5.884-10.0)']"
  },
  "YF9u0yepVtGQ.wav": {
    "caption": "A man sings while music plays and the crowd cheers in an outdoor stage performance.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Male singing-0.531-2.067)', '(Male singing-2.458-3.785)', '(Male singing-4.385-9.791)', '(Cheering-7.975-10.0)']"
  },
  "Ygp7x498MNv0.wav": {
    "caption": "A woman passionately delivers a speech, her voice clear and confident, in a setting that seems to be a boxing ring.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-0.94)', '(Conversation-0.0-8.635)', '(Mechanisms-0.0-8.67)', '(Male speech, man speaking-0.975-1.376)', '(Male speech, man speaking-1.812-3.119)', '(Female speech, woman speaking-3.452-3.933)', '(Male speech, man speaking-3.452-3.991)', '(Female speech, woman speaking-4.128-4.427)', '(Male speech, man speaking-4.45-4.759)', '(Male speech, man speaking-4.874-5.677)', '(Female speech, woman speaking-6.044-8.67)', '(Male speech, man speaking-6.433-7.305)', '(Female speech, woman speaking-8.75-10.0)']"
  },
  "Ye4Xna4X2aQQ.wav": {
    "caption": "A choir sings harmoniously with male and female voices, creating a captivating performance in a subway station.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Choir-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Clapping-0.346-0.441)', '(Clapping-1.165-1.26)', '(Clapping-1.378-1.521)', '(Clapping-1.961-2.063)', '(Clapping-2.797-2.967)', '(Clapping-3.659-3.836)', '(Clapping-4.406-4.562)', '(Clapping-4.65-4.861)', '(Clapping-5.173-5.465)', '(Clapping-6.069-6.239)', '(Clapping-6.87-7.054)', '(Clapping-7.746-7.916)', '(Clapping-8.561-8.826)', '(Clapping-9.369-9.525)', '(Clapping-9.769-10.0)']"
  },
  "Yjf09nabzA44.wav": {
    "caption": "Rain falls hard as a man speaks, with a probability of 0.61 for speech and 0.25 for a vehicle.",
    "timestamp_events": "['(Windscreen wiper, windshield wiper-0.0-10.0)', '(Car-0.0-10.0)', '(Rain on surface-0.0-10.0)', '(Male speech, man speaking-2.395-2.56)', '(Male speech, man speaking-2.766-4.107)', '(Male speech, man speaking-4.684-6.375)', '(Male speech, man speaking-7.323-8.918)', '(Male speech, man speaking-9.88-10.0)']"
  },
  "YF-okl2dAEFg.wav": {
    "caption": "A crowd erupts in applause and cheers as a rooster crows, creating an energetic atmosphere in an outdoor setting.",
    "timestamp_events": "['(Whoop-0.0-0.23)', '(Background noise-0.0-10.0)', '(Human sounds-0.237-3.722)', '(Cheering-1.557-10.0)', '(Applause-1.841-10.0)', '(Whoop-3.385-6.333)', '(Human voice-4.127-4.993)', '(Whoop-7.289-8.753)', '(Whoop-9.577-9.962)']"
  },
  "YITLVr0NJwE0.wav": {
    "caption": "A motor vehicle engine runs while people talk in the background at a stadium/football game. (Audio-Visual Label: Vehicle; Hubbub, speech noise, speech babble)",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.355)', '(Hubbub, speech noise, speech babble-0.0-7.219)', '(Male speech, man speaking-0.558-2.824)', '(Male speech, man speaking-2.946-3.279)', '(Male speech, man speaking-3.417-4.002)', '(Male speech, man speaking-4.148-4.668)', '(Male speech, man speaking-4.806-5.424)', '(Vehicle-4.961-7.219)', '(Male speech, man speaking-5.749-6.845)', '(Wind-7.211-10.0)', '(Breathing-7.373-7.641)', '(Male speech, man speaking-7.706-8.543)', '(Breathing-8.584-8.746)', '(Male speech, man speaking-8.795-10.0)']"
  },
  "YFVFChFbbq7c.wav": {
    "caption": "A group of people singing can be heard in the background as music plays in a large indoor public space.",
    "timestamp_events": "['(Male singing-0.0-7.673)', '(Music-0.015-7.681)', '(Clapping-0.052-0.206)', '(Clapping-0.457-0.759)', '(Clapping-0.891-1.23)', '(Clapping-1.429-1.907)', '(Clapping-1.974-2.732)', '(Clapping-2.909-3.167)', '(Clapping-3.307-3.697)', '(Clapping-3.829-4.234)', '(Clapping-4.36-4.61)', '(Clapping-4.801-5.074)', '(Clapping-5.295-5.575)', '(Clapping-5.751-6.09)', '(Clapping-6.201-6.576)', '(Clapping-6.731-7.084)', '(Clapping-7.261-7.74)', '(Music-7.819-10.0)', '(Male singing-7.85-10.0)', '(Clapping-8.226-8.535)', '(Clapping-8.719-9.05)', '(Clapping-9.227-9.58)', '(Clapping-9.757-10.0)', '(Music-9.898-9.906)']"
  },
  "YHsjupPU6aYo.wav": {
    "caption": "A dog whimpers while people talk in the background at a pet shop, with a mouse and speech being the dominant audio events.",
    "timestamp_events": "['(Squeal-0.0-0.753)', '(Television-0.0-9.575)', '(Mechanisms-0.0-9.575)', '(Generic impact sounds-0.062-0.355)', '(Male speech, man speaking-0.062-4.425)', '(Generic impact sounds-0.639-1.468)', '(Squeal-0.883-3.304)', '(Generic impact sounds-2.077-2.662)', '(Squeal-3.799-5.676)', '(Male speech, man speaking-4.587-5.391)', '(Male speech, man speaking-5.643-7.008)', '(Squeal-6.78-7.706)', '(Male speech, man speaking-7.3-8.178)', '(Generic impact sounds-7.861-8.048)', '(Squeal-7.983-8.803)', '(Generic impact sounds-8.243-8.714)', '(Squeal-8.974-9.575)', '(Generic impact sounds-9.039-9.169)', '(Generic impact sounds-9.315-9.51)']"
  },
  "YEf5oIwsVXls.wav": {
    "caption": "A baby cries while music plays in the background, suggesting a domestic environment with a pet cat nearby.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Television-0.0-10.0)']"
  },
  "YFFUKr4IiRR0.wav": {
    "caption": "The sound of a typewriter fills the music studio as someone types on the keyboard intermittently.",
    "timestamp_events": "['(Typewriter-0.0-1.864)', '(Mechanisms-0.0-9.945)', '(Ding-1.384-3.81)', '(Typewriter-2.264-4.815)', '(Typewriter-4.992-5.561)', '(Typewriter-5.721-5.881)', '(Typewriter-5.997-6.654)', '(Typewriter-7.195-7.431)', '(Tick-9.542-9.639)', '(Tick-9.833-9.945)']"
  },
  "Ye8dhd515Tm0.wav": {
    "caption": "A man sings into a microphone as music plays, and the audience cheers in an outdoor stage setting.",
    "timestamp_events": "['(Music-0.0-6.094)', '(Cheering-6.197-10.0)', '(Shout-7.236-10.0)', '(Whoop-9.244-10.0)', '(Male singing-0.0-5.85)']"
  },
  "YkVGND3NGxH4.wav": {
    "caption": "A crowd erupts in cheers as a chant echoes through a stadium during a soccer game.",
    "timestamp_events": "['(Crowd-0.062-10.0)', '(Choir-0.07-10.0)', '(Whistling-0.412-2.832)', '(Whistling-3.141-4.546)', '(Whistling-5.651-6.309)', '(Music-6.366-10.0)']"
  },
  "YGpOdBPRWW4U.wav": {
    "caption": "The sound of water gushing can be heard as a man speaks in the background, implying a busy environment.",
    "timestamp_events": "['(Pour-0.0-10.0)', '(Male speech, man speaking-0.344-1.124)', '(Generic impact sounds-0.849-1.089)', '(Clang-1.8-2.626)', '(Generic impact sounds-2.236-2.534)', '(Generic impact sounds-3.291-3.555)', '(Male speech, man speaking-3.888-4.117)', '(Generic impact sounds-4.954-5.206)', '(Generic impact sounds-7.041-7.225)', '(Generic impact sounds-7.546-7.718)', '(Male speech, man speaking-8.956-10.0)', '(Generic impact sounds-9.186-9.369)']"
  },
  "YdIvjYbPRyJU.wav": {
    "caption": "A crow caws loudly as the sound of a bird flapping its wings can be heard in the distance.",
    "timestamp_events": "['(Bird-0.0-0.376)', '(Background noise-0.0-10.0)', '(Generic impact sounds-0.993-3.98)', '(Bird-4.372-4.485)', '(Bird-4.695-5.004)', '(Generic impact sounds-5.297-5.831)', '(Bird-5.974-7.306)', '(Generic impact sounds-7.269-8.427)', '(Bird-7.517-8.39)', '(Bird-8.623-9.044)', '(Generic impact sounds-9.059-9.263)', '(Bird-9.308-10.0)']"
  },
  "YKUy3kDYj590.wav": {
    "caption": "A woman speaks while a duck quacks, accompanied by music and a giggle, creating a lively atmosphere.",
    "timestamp_events": "['(Female singing-0.0-10.0)', '(Laughter-0.008-1.606)', '(Music-0.008-10.0)', '(Laughter-1.907-4.522)', '(Female speech, woman speaking-2.879-3.851)', '(Female speech, woman speaking-4.404-7.924)', '(Female speech, woman speaking-8.255-9.337)']"
  },
  "YMyngcM5D5E4.wav": {
    "caption": "A man speaks as water flows, creating a soothing ambiance of speech and gentle water sounds in a bathroom.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.595)', '(Wind-0.0-10.0)', '(Liquid-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Male speech, man speaking-2.927-7.043)', '(Male speech, man speaking-8.164-8.721)', '(Male speech, man speaking-9.443-10.0)']"
  },
  "YLN0wlCy--hc.wav": {
    "caption": "The techno music blares as the crowd erupts in cheers and applause at the outdoor stage.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Shout-0.395-4.806)']"
  },
  "Yk66bTjbqu0Q.wav": {
    "caption": "A man speaks as a crowd cheers and music plays in the background inside a public space.",
    "timestamp_events": "['(Whoop-0.0-0.449)', '(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Female speech, woman speaking-0.362-0.811)', '(Male speech, man speaking-0.394-1.44)', '(Female speech, woman speaking-1.142-1.921)', '(Male speech, man speaking-1.937-5.394)', '(Shout-4.63-10.0)', '(Male speech, man speaking-6.055-7.457)', '(Male speech, man speaking-8.307-10.0)']"
  },
  "YjT5NNJf9ipQ.wav": {
    "caption": "A woman stirs and fries food in a restaurant kitchen, creating a sizzling sound.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-1.191)', '(Music-0.0-10.0)', '(Sizzle-0.0-10.0)', '(Female speech, woman speaking-1.557-2.475)', '(Dishes, pots, and pans-1.679-1.874)', '(Dishes, pots, and pans-2.085-2.377)', '(Female speech, woman speaking-2.686-3.271)', '(Dishes, pots, and pans-3.06-3.239)', '(Dishes, pots, and pans-3.807-3.994)', '(Female speech, woman speaking-4.148-5.887)', '(Dishes, pots, and pans-4.157-4.473)', '(Dishes, pots, and pans-4.863-5.261)', '(Dishes, pots, and pans-6.699-7.17)', '(Dishes, pots, and pans-7.731-7.958)', '(Dishes, pots, and pans-8.08-8.259)', '(Dishes, pots, and pans-8.421-8.665)']"
  },
  "YggEIJvo6wPg.wav": {
    "caption": "A race car revs its engine and screeches its tires on the race track, creating an exhilarating sound of auto racing.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Car-0.0-10.0)', '(Male singing-0.766-2.457)', '(Accelerating, revving, vroom-2.457-7.144)', '(Male singing-3.021-8.979)', '(Accelerating, revving, vroom-8.196-10.0)']"
  },
  "YMU5X9QoaJrk.wav": {
    "caption": "A horse trots while people talk in an urban environment, creating a lively atmosphere.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Run-5.405-9.578)', '(Hubbub, speech noise, speech babble-0.0-10.0)']"
  },
  "YmSRrB-GAUo8.wav": {
    "caption": "A lively crowd erupts into applause and cheering as music plays in the indoor stage environment.",
    "timestamp_events": "['(Applause-0.266-6.79)', '(Music-0.266-10.0)', '(Hubbub, speech noise, speech babble-4.26-10.0)']"
  },
  "YEFb2dVVbBKw.wav": {
    "caption": "A man walks while talking, his footsteps are audible, and he speaks outside in a rural environment.",
    "timestamp_events": "['(Wind-0.439-10.0)', '(Cricket-0.439-10.0)', '(Door-0.907-1.321)', '(Door-1.849-2.077)', '(Male speech, man speaking-2.14-2.431)', '(Male speech, man speaking-2.659-2.957)', '(Walk, footsteps-3.141-3.287)', '(Male speech, man speaking-3.365-3.697)', '(Walk, footsteps-3.726-3.888)', '(Walk, footsteps-4.408-4.506)', '(Male speech, man speaking-4.775-5.107)', '(Walk, footsteps-5.172-5.237)', '(Male speech, man speaking-5.688-6.961)', '(Walk, footsteps-5.716-5.814)', '(Walk, footsteps-6.228-6.334)', '(Walk, footsteps-6.683-6.797)', '(Walk, footsteps-7.122-7.341)', '(Bark-7.471-7.991)', '(Male speech, man speaking-7.493-9.298)', '(Bark-8.153-8.6)', '(Walk, footsteps-8.763-8.868)', '(Walk, footsteps-9.193-9.445)', '(Walk, footsteps-9.77-9.973)']"
  },
  "Yl5YZ2nsDPTU.wav": {
    "caption": "A woman's speech is accompanied by the continuous sound of a sewing machine running in a small room.",
    "timestamp_events": "['(Female speech, woman speaking-0.0-0.67)', '(Sewing machine-0.0-7.57)', '(Conversation-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Female speech, woman speaking-1.543-1.783)', '(Female speech, woman speaking-2.107-4.673)', '(Female speech, woman speaking-5.425-6.095)', '(Female speech, woman speaking-6.298-6.742)', '(Female speech, woman speaking-7.615-10.0)']"
  },
  "YlOJUo9qV12k.wav": {
    "caption": "A baby cries while a man speaks in an airplane cabin, creating a sobbing and speech audio event.",
    "timestamp_events": "['(Female speech, woman speaking-5.78-6.748)', '(Male speech, man speaking-7.724-10.0)', '(Baby cry, infant cry-4.409-7.402)', '(Mechanisms-0.0-10.0)']"
  },
  "YlOwCeLdSn74.wav": {
    "caption": "A boat motor roars while water splashes and gurgles, as an adult male speaks in the background on a speedboat.",
    "timestamp_events": "['(Background noise-0.0-3.034)', '(Water-0.0-3.053)', '(Male speech, man speaking-0.164-3.063)', '(Motorboat, speedboat-3.063-10.0)']"
  },
  "YF77-qB48bNc.wav": {
    "caption": "A man speaks while music plays and something shatters, creating a lively atmosphere in an aquarium.",
    "timestamp_events": "['(Music-0.0-6.983)', '(Sound effect-2.085-3.377)', '(Sound effect-3.702-4.027)', '(Sound effect-4.157-4.717)', '(Sound effect-4.863-6.131)', '(Sound effect-6.325-6.829)', '(Mechanisms-6.959-10.0)', '(Male speech, man speaking-7.016-8.324)', '(Male speech, man speaking-9.006-10.0)', '(Child speech, kid speaking-9.152-9.835)']"
  },
  "Yi0lJhaj34LQ.wav": {
    "caption": "The food sizzles as a woman speaks in the kitchen while stirring and frying the ingredients.",
    "timestamp_events": "['(Sizzle-0.0-10.0)', '(Stir-0.505-0.808)', '(Stir-1.062-3.282)', '(Female speech, woman speaking-2.282-2.833)', '(Stir-4.691-6.423)', '(Female speech, woman speaking-5.653-6.468)', '(Stir-6.629-7.928)', '(Female speech, woman speaking-7.695-8.968)', '(Stir-8.127-8.485)', '(Stir-8.959-9.447)', '(Female speech, woman speaking-9.14-9.885)']"
  },
  "YIt7mU9zMI4w.wav": {
    "caption": "The sizzling sound of food being stirred in a pan can be heard, while a man speaks in the background.",
    "timestamp_events": "['(Cutlery, silverware-0.0-0.233)', '(Stir-0.0-4.351)', '(Mechanisms-0.0-10.0)', '(Cutlery, silverware-0.379-0.68)', '(Cutlery, silverware-1.289-1.565)', '(Cutlery, silverware-2.312-2.8)', '(Male speech, man speaking-2.816-4.116)', '(Cutlery, silverware-3.011-3.214)', '(Cutlery, silverware-4.278-4.701)', '(Male speech, man speaking-4.676-5.001)', '(Cutlery, silverware-5.172-5.391)', '(Male speech, man speaking-5.229-5.814)', '(Surface contact-5.822-6.171)', '(Cutlery, silverware-5.944-6.179)', '(Liquid-6.309-7.341)', '(Tick-7.463-7.576)', '(Male speech, man speaking-7.853-9.721)', '(Pour-8.023-10.0)']"
  },
  "YHoJt1z0NAlg.wav": {
    "caption": "A motorcycle engine idles and then revs up, creating the sound of a vehicle in motion.",
    "timestamp_events": "['(Engine knocking-0.0-10.0)', '(Motorcycle-0.0-10.0)', '(Accelerating, revving, vroom-3.326-6.448)', '(Accelerating, revving, vroom-8.774-10.0)']"
  },
  "YdsuMoRXcbfo.wav": {
    "caption": "Rain falls as birds chirp and an ice cream truck plays music in the background, creating a peaceful atmosphere.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Surface contact-0.087-0.485)', '(Generic impact sounds-0.672-1.143)', '(Generic impact sounds-2.02-2.564)', '(Generic impact sounds-3.084-3.312)', '(Generic impact sounds-3.466-3.97)', '(Crumpling, crinkling-4.067-4.912)', '(Crumpling, crinkling-5.074-5.968)', '(Surface contact-6.106-6.634)', '(Generic impact sounds-6.78-7.089)', '(Crumpling, crinkling-7.406-9.087)', '(Crumpling, crinkling-9.25-9.819)']"
  },
  "YDpsuqeLyntU.wav": {
    "caption": "The sound of a hammer hitting wood echoes in an elevator shaft, accompanied by faint speech and the distant noise of a vehicle.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Male speech, man speaking-0.768-1.048)', '(Generic impact sounds-1.7-3.749)', '(Generic impact sounds-4.47-4.68)', '(Male speech, man speaking-5.911-8.34)', '(Generic impact sounds-6.717-7.614)', '(Generic impact sounds-7.812-8.021)', '(Clang-7.835-8.51)', '(Male speech, man speaking-9.161-9.81)', '(Clang-9.511-10.0)']"
  },
  "YiCG6dm9HkAE.wav": {
    "caption": "People singing and playing music with a rattling instrument in the background at a lively gathering.",
    "timestamp_events": "['(Choir-0.0-2.199)', '(Music-0.0-10.0)', '(Hubbub, speech noise, speech babble-0.022-3.832)', '(Choir-3.109-7.934)', '(Human voice-6.699-7.057)', '(Clapping-7.723-7.836)', '(Laughter-8.129-8.933)', '(Clapping-8.413-8.543)', '(Clapping-9.096-9.461)', '(Choir-9.12-10.0)']"
  },
  "YgxUc60nE46A.wav": {
    "caption": "A whip cracks loudly while music plays softly in the background, as something is being sprayed in an indoor booth.",
    "timestamp_events": "['(Singing-0.0-10.0)', '(Music-0.0-10.0)', '(Whip-2.361-2.67)', '(Whip-3.261-3.612)', '(Whip-3.983-4.251)', '(Whip-4.918-5.206)', '(Whip-7.364-7.694)', '(Whip-8.107-8.333)', '(Whip-8.952-9.199)', '(Whip-9.736-10.0)']"
  },
  "YH5tKoTp-RHs.wav": {
    "caption": "A man passionately delivers a speech, eliciting cheers from a lively crowd in a discotheque.",
    "timestamp_events": "['(Crowd-0.0-10.0)', '(Background noise-0.0-10.0)', '(Shout-0.73-3.025)', '(Conversation-0.843-8.947)', '(Male speech, man speaking-0.858-2.972)', '(Female speech, woman speaking-3.303-4.981)', '(Shout-3.762-4.733)', '(Male speech, man speaking-5.109-8.999)', '(Shout-8.33-10.0)', '(Laughter-9.075-10.0)']"
  },
  "YmJE5GEh7UM8.wav": {
    "caption": "A heavy metal song plays with a pulsating beat as rock music fills the air in a crowded concert hall.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Shout-4.583-6.628)', '(Mechanisms-0.0-10.0)']"
  },
  "YJs25I4Tsifc.wav": {
    "caption": "Water gurgles and trickles, creating a soothing sound as it flows in an underwater coral reef in the ocean.",
    "timestamp_events": "['(Trickle, dribble-6.945-10.0)', '(Water-1.094-10.0)', '(Sound effect-4.708-7.467)', '(Mechanisms-0.0-10.0)']"
  },
  "Ydrv7QxlQQE0.wav": {
    "caption": "A man speaks amidst the chatter of a crowd in an urban setting, suggesting an outdoor gathering or event.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.048)', '(Conversation-0.0-10.0)', '(Background noise-0.0-10.0)', '(Human voice-1.062-2.832)', '(Male speech, man speaking-1.961-2.625)', '(Male speech, man speaking-3.282-3.911)', '(Child speech, kid speaking-3.883-4.609)', '(Child speech, kid speaking-4.803-5.522)', '(Child speech, kid speaking-5.612-6.394)', '(Child speech, kid speaking-6.622-8.309)', '(Male speech, man speaking-7.161-8.385)', '(Child speech, kid speaking-8.406-8.842)', '(Giggle-8.869-9.264)', '(Male speech, man speaking-9.174-10.0)', '(Human voice-9.409-10.0)']"
  },
  "YDL6-uzNe3Ng.wav": {
    "caption": "A woman laughs and talks while burping in a kitchen, creating a lively and casual atmosphere.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Laughter-0.134-2.705)', '(Female speech, woman speaking-1.199-2.423)', '(Conversation-1.22-9.083)', '(Laughter-2.849-3.103)', '(Laughter-3.323-3.856)', '(Laughter-4.01-8.251)', '(Female speech, woman speaking-4.601-8.175)', '(Female speech, woman speaking-8.361-9.138)', '(Breathing-8.373-8.616)', '(Burping, eructation-8.581-9.509)', '(Breathing-9.55-10.0)', '(Laughter-9.653-10.0)']"
  },
  "YhBsNc8TxxkA.wav": {
    "caption": "Children laugh and scream with joy as they play, creating a lively and energetic atmosphere in a playground.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Laughter-0.117-1.676)', '(Breathing-1.688-2.096)', '(Laughter-2.049-7.066)', '(Conversation-3.341-8.894)', '(Child speech, kid speaking-3.364-4.307)', '(Child speech, kid speaking-4.68-5.192)', '(Child speech, kid speaking-5.425-6.019)', '(Child speech, kid speaking-6.182-7.02)', '(Shout-7.171-7.94)', '(Child speech, kid speaking-7.963-8.883)', '(Shout-8.906-10.0)']"
  },
  "YHvOnZiA425I.wav": {
    "caption": "A sewing machine hums inside a small room, indicating the audio event of a sewing machine.",
    "timestamp_events": "['(Mechanisms-0.0-10.0)', '(Surface contact-0.232-1.246)', '(Generic impact sounds-1.314-2.56)', '(Generic impact sounds-2.725-3.333)', '(Sewing machine-3.478-7.217)', '(Generic impact sounds-8.213-8.889)', '(Generic impact sounds-9.614-9.913)']"
  },
  "YhW0YsknCvaI.wav": {
    "caption": "The sound of a vehicle engine running is accompanied by a man speaking, suggesting a conversation inside a car.",
    "timestamp_events": "['(Accelerating, revving, vroom-0.0-10.0)', '(Vehicle-0.0-10.0)', '(Male speech, man speaking-0.0-0.557)', '(Male speech, man speaking-0.828-1.46)', '(Male speech, man speaking-1.847-5.094)', '(Male speech, man speaking-5.394-7.197)', '(Male speech, man speaking-7.48-8.008)', '(Male speech, man speaking-8.496-9.772)']"
  },
  "YJkC2LfKpT1k.wav": {
    "caption": "A race car revs its engine and tires squeal as it speeds around the track during an auto racing event.",
    "timestamp_events": "['(Accelerating, revving, vroom-0.0-1.445)', '(Tire squeal, skidding-0.0-3.567)', '(Race car, auto racing-0.0-10.0)', '(Accelerating, revving, vroom-3.529-6.712)', '(Accelerating, revving, vroom-7.299-8.683)', '(Tire squeal, skidding-7.329-10.0)']"
  },
  "YFKWArdlknOk.wav": {
    "caption": "Cutlery and dishes clink as pots and pans are stirred, suggesting a bustling kitchen environment.",
    "timestamp_events": "['(Stir-0.0-0.787)', '(Music-0.0-3.144)', '(Mechanisms-0.0-10.0)', '(Stir-0.897-3.199)', '(Female speech, woman speaking-1.777-3.055)', '(Stir-3.536-7.653)', '(Female speech, woman speaking-3.784-4.423)', '(Stir-7.845-8.54)', '(Female speech, woman speaking-9.055-10.0)']"
  },
  "Yi-BqkD7y49k.wav": {
    "caption": "A man speaks while a cap gun is fired, creating a speech and cap gun audio event in an unknown environment.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.027)', '(Conversation-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Child speech, kid speaking-0.398-1.269)', '(Generic impact sounds-0.564-0.778)', '(Generic impact sounds-1.276-1.463)', '(Generic impact sounds-1.732-1.912)', '(Generic impact sounds-2.106-2.306)', '(Scrape-2.376-2.887)', '(Generic impact sounds-2.521-2.68)', '(Generic impact sounds-2.846-3.06)', '(Generic impact sounds-3.302-3.434)', '(Generic impact sounds-3.579-3.745)', '(Generic impact sounds-4.015-4.222)', '(Male speech, man speaking-4.443-5.087)', '(Generic impact sounds-4.471-4.637)', '(Generic impact sounds-5.107-5.356)', '(Male speech, man speaking-5.315-5.965)', '(Generic impact sounds-6.58-6.836)', '(Male speech, man speaking-6.898-7.811)', '(Generic impact sounds-7.037-7.223)', '(Generic impact sounds-7.417-7.659)', '(Generic impact sounds-7.97-8.157)', '(Generic impact sounds-8.697-8.925)', '(Child speech, kid speaking-8.786-9.111)', '(Generic impact sounds-9.07-9.236)', '(Male speech, man speaking-9.215-10.0)']"
  },
  "YjUNxXsdXAJ4.wav": {
    "caption": "A church bell rings while a speech is being delivered in a large room, with people talking in the background.",
    "timestamp_events": "['(Church bell-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Male speech, man speaking-0.534-1.144)', '(Male speech, man speaking-2.084-2.671)', '(Male speech, man speaking-5.072-5.959)']"
  },
  "YDp3XonyhanI.wav": {
    "caption": "The food sizzles in the pan as a woman stirs and fries it, creating a delightful aroma in the kitchen.",
    "timestamp_events": "['(Sizzle-0.0-3.575)', '(Female speech, woman speaking-0.395-0.978)', '(Conversation-0.433-10.0)', '(Mechanisms-3.603-10.0)', '(Female speech, woman speaking-3.827-7.137)', '(Female speech, woman speaking-7.444-9.176)', '(Human sounds-8.994-9.288)', '(Breathing-9.274-9.804)', '(Female speech, woman speaking-9.902-10.0)']"
  },
  "YhuK4Xf5xrYA.wav": {
    "caption": "The audience erupts in applause and clapping as a man delivers a speech, creating an energetic atmosphere.",
    "timestamp_events": "['(Whip-0.0-0.615)', '(Applause-0.16-8.681)', '(Whip-0.769-3.336)', '(Human voice-1.955-2.897)', '(Whoosh, swoosh, swish-4.416-4.668)', '(Laughter-4.741-6.033)']"
  },
  "YFTGNPbfxcuE.wav": {
    "caption": "A person breathes heavily before starting to speak, with audio events indicating tearing. The audio occurs in a small room.",
    "timestamp_events": "['(Sound effect-0.075-0.444)', '(Sound effect-0.632-1.392)', '(Sound effect-1.512-3.439)', '(Background noise-3.619-10.0)', '(Cat-4.146-6.664)', '(Cat-7.148-7.555)', '(Cat-8.081-8.473)']"
  },
  "YGZS0AFTpVv4.wav": {
    "caption": "The sound of a power tool drilling can be heard as wood is being rubbed, indicating a woodworking activity in progress.",
    "timestamp_events": "['(Generic impact sounds-0.03-1.642)', '(Generic impact sounds-1.893-3.542)', '(Mechanisms-4.036-7.342)', '(Background noise-7.71-10.0)']"
  },
  "Ycwzz1fNEUqg.wav": {
    "caption": "A woman speaks while a baby cries in a small room, creating a mix of speech and babbling sounds.",
    "timestamp_events": "['(Generic impact sounds-0.0-0.688)', '(Female speech, woman speaking-0.0-0.745)', '(Mechanisms-0.0-10.0)', '(Generic impact sounds-0.948-3.905)', '(Baby cry, infant cry-1.005-2.231)', '(Female speech, woman speaking-1.622-3.515)', '(Baby cry, infant cry-2.597-3.434)', '(Generic impact sounds-4.416-4.831)', '(Female speech, woman speaking-5.066-6.399)', '(Generic impact sounds-6.114-6.358)', '(Generic impact sounds-6.91-7.252)', '(Generic impact sounds-8.763-8.998)', '(Baby cry, infant cry-9.607-10.0)']"
  },
  "Ygefic-LXX7w.wav": {
    "caption": "A woman sings while a baby laughs, accompanied by background music, creating a joyful atmosphere in a veterinarians_office.",
    "timestamp_events": "['(Female singing-0.0-1.258)', '(Mechanisms-0.0-10.0)', '(Burping, eructation-1.191-1.423)', '(Female singing-1.461-1.775)', '(Baby laughter-1.775-2.846)', '(Female singing-2.659-2.944)', '(Female singing-3.034-4.487)', '(Burping, eructation-4.464-4.734)', '(Baby laughter-4.884-5.416)', '(Baby laughter-5.978-6.255)', '(Breathing-6.839-7.139)', '(Breathing-7.768-8.322)', '(Female singing-8.584-10.0)', '(Burping, eructation-9.356-9.603)', '(Baby laughter-9.94-10.0)']"
  },
  "Ykk9DM5ZbcAA.wav": {
    "caption": "An adult male speaks and a crowd laughs in a field at a tree farm, creating a chuckle and chortle audio event.",
    "timestamp_events": "['(Male speech, man speaking-0.0-0.899)', '(Conversation-0.0-10.0)', '(Laughter-1.013-1.776)', '(Male speech, man speaking-1.37-1.76)', '(Male speech, man speaking-1.849-2.813)', '(Laughter-2.767-3.71)', '(Male speech, man speaking-2.956-4.386)', '(Laughter-4.408-5.334)', '(Sound effect-5.269-8.421)', '(Laughter-6.829-7.609)', '(Male speech, man speaking-8.405-10.0)']"
  },
  "Yet4naViJESE.wav": {
    "caption": "A man sings with music playing in the background as a crowd cheers in an indoor stage.",
    "timestamp_events": "['(Female singing-0.0-3.385)', '(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Female singing-3.71-10.0)']"
  },
  "YK-quxM8X0xc.wav": {
    "caption": "A rhythmic music plays while a tap sound occasionally interrupts in a television studio.",
    "timestamp_events": "['(Music-0.0-10.0)', '(Hubbub, speech noise, speech babble-0.0-10.0)', '(Tap dance-0.115-0.298)', '(Tap dance-0.447-0.562)', '(Tap dance-0.791-1.032)', '(Tap dance-1.227-1.456)', '(Tap dance-1.583-1.869)', '(Tap dance-2.351-2.523)', '(Tap dance-3.206-3.371)', '(Tap dance-3.544-3.727)', '(Tap dance-3.945-4.151)', '(Tap dance-4.369-4.518)', '(Tap dance-4.702-4.897)', '(Tap dance-5.011-5.218)', '(Tap dance-5.459-5.642)', '(Tap dance-5.929-6.112)', '(Tap dance-6.594-6.808)', '(Tap dance-6.979-8.395)', '(Tap dance-8.581-8.732)', '(Tap dance-9.002-9.163)', '(Tap dance-9.335-9.564)', '(Tap dance-9.713-10.0)']"
  },
  "YIK-SmFvA4jY.wav": {
    "caption": "Keys jangle as someone sprays a hard surface, creating a rhythmic sound, possibly in a gymnasium or indoor space.",
    "timestamp_events": "['(Generic impact sounds-0.0-0.416)', '(Mechanisms-0.0-10.0)', '(Breathing-0.519-1.199)', '(Generic impact sounds-1.165-2.478)', '(Generic impact sounds-2.711-2.876)', '(Generic impact sounds-3.096-4.588)', '(Breathing-4.258-4.828)', '(Generic impact sounds-5.385-5.66)', '(Breathing-5.412-6.107)', '(Generic impact sounds-6.065-6.437)', '(Generic impact sounds-6.753-7.845)', '(Breathing-8.072-8.711)', '(Generic impact sounds-8.127-9.412)', '(Breathing-8.979-9.715)']"
  },
  "Yecdp6PSmOQQ.wav": {
    "caption": "A child screams repeatedly while a dog whimpers in a veterinarian's office, surrounded by other domestic animals.",
    "timestamp_events": "['(Human sounds-0.0-0.336)', '(Background noise-0.0-10.0)', '(Dog-0.102-0.924)', '(Human sounds-1.395-2.395)', '(Dog-2.227-3.714)', '(Human sounds-4.16-5.051)', '(Dog-4.958-6.328)', '(Human sounds-7.093-7.933)', '(Dog-8.335-10.0)']"
  },
  "YKCvlD4EJ360.wav": {
    "caption": "The sound of rock and roll music fills the air as a crowd cheers and claps in a subway station.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.882)', '(Crowd-0.0-10.0)', '(Music-0.0-10.0)', '(Speech-2.532-3.897)', '(Male speech, man speaking-5.026-5.586)', '(Male speech, man speaking-6.854-9.071)']"
  },
  "YJ1c7oJXJkY0.wav": {
    "caption": "A man speaks amidst the croaking of frogs in an environment that seems to be an aquarium.",
    "timestamp_events": "['(Male speech, man speaking-0.0-1.588)', '(Frog-0.0-10.0)', '(Mechanisms-0.0-10.0)', '(Male speech, man speaking-2.603-3.243)', '(Male speech, man speaking-4.605-6.087)', '(Male speech, man speaking-8.781-10.0)']"
  },
  "YI1NFIjTEHUc.wav": {
    "caption": "People are talking while water splashes in an urban area, accompanied by music playing in the background.",
    "timestamp_events": "['(Stream, river-0.0-7.536)', '(Mechanisms-0.0-7.536)', '(Crowd-0.519-6.808)']"
  },
  "YcrvhdOAAJWI.wav": {
    "caption": "A large crowd cheers and cheers as children shout, creating a lively atmosphere in an indoor setting.",
    "timestamp_events": "['(Shout-0.155-1.208)', '(Male speech, man speaking-0.164-0.628)', '(Laughter-0.841-1.884)', '(Cheering-1.546-10.0)', '(Female speech, woman speaking-4.986-5.787)', '(Female speech, woman speaking-6.29-6.802)', '(Laughter-6.705-10.0)', '(Male speech, man speaking-7.681-8.754)']"
  },
  "YmL1qRKPy9os.wav": {
    "caption": "A man speaks with some clicking sounds as scissors are being used in a small room.",
    "timestamp_events": "['(Background noise-0.0-10.0)', '(Male speech, man speaking-0.546-2.196)', '(Male speech, man speaking-2.443-3.653)', '(Male speech, man speaking-4.127-4.629)', '(Male speech, man speaking-4.835-6.505)', '(Scissors-5.742-6.093)', '(Crumpling, crinkling-6.278-7.364)', '(Scissors-7.364-7.763)', '(Crumpling, crinkling-8.065-8.897)', '(Male speech, man speaking-8.423-10.0)']"
  },
  "YeWIESbG9Mcg.wav": {
    "caption": "A man passionately delivers a speech in a small room, creating an intense atmosphere.",
    "timestamp_events": "['(Surface contact-0.0-0.322)', '(Mechanisms-0.0-10.0)', '(Breathing-0.882-2.293)', '(Male speech, man speaking-1.082-1.809)', '(Male speech, man speaking-2.313-5.377)', '(Surface contact-2.334-2.846)', '(Surface contact-4.035-4.367)', '(Male speech, man speaking-6.912-7.244)', '(Male speech, man speaking-7.576-8.323)', '(Breathing-8.302-9.658)', '(Male speech, man speaking-9.16-10.0)', '(Surface contact-9.72-10.0)']"
  }
}