{"4963357278": {"audio_captions": ["The baby is shouting while people are talking in the foreground.", "The children are talking loudly, and some people are talking in the background.", "A child and an adult were talking."], "visual_captions": ["A snake is moving around the plant.", "A snake is eating a rat.", "The owner fed a snake."], "audio_visual_captions": ["The snake is attempting to eat the entire rat.", "The snake is eating the rat.", "Snake is catching the rat.", "The snake is eating some pieces of meat.", "The snake is at home, the baby is also at home."], "GPT_AV_captions": ["A snake is eating a rat while people are talking in the background.", "The snake is at home eating a rat, and a baby is shouting.", "A snake is moving around a plant and eating a rat while children and adults talk."]}, "4964516093": {"audio_captions": ["The girl and the children are speaking and laughing.", "The children had a funny conversation with their parents, and they were making fun of the children.", "The child is talking to the mother, and the mother replied to the child's question while also laughing at the child's reply."], "visual_captions": ["Two children are dancing.", "The two girls are dancing.", "Baby girls are playing in the house.", "Two children are playing and they fall down."], "audio_visual_captions": ["The children expressed their love.", "Two children are playing while wearing costumes of a husband and wife.", "Two children are dancing.", "Two children are dancing with hugs and having fun."], "GPT_AV_captions": ["Two children are dancing and laughing together.", "The children are playing and having a funny conversation with their parents.", "Two children are dancing, expressing their love and having fun."]}, "4967363921": {"audio_captions": ["A man and a woman are having a conversation.", "Someone is interviewing a woman about something.", "The man and the woman are talking about the picnic."], "visual_captions": ["The lady was talking to a cameraman on one side, while another woman was eating on the other side. The lady was smiling while talking to the cameraman.", "Two women are sitting on a chair at an open restaurant. One girl is eating cake while the other girl is talking with someone.", "The girls are having a fun time eating together."], "audio_visual_captions": ["Someone is interviewing a lady and the lady is answering his questions.", "Two women are eating at a restaurant while someone takes a picture of them. The women are beautiful.", "The women are talking and eating with smiles on their faces.", "One woman is eating food and another woman is talking."], "GPT_AV_captions": ["A man is interviewing a woman while another woman is eating at an open restaurant.", "Two women are at a restaurant; one is eating while the other is talking and smiling.", "The women are having a conversation and enjoying their time at the restaurant."]}, "4969723020": {"audio_captions": ["Two people are talking loudly while they are driving.", "There is  loud sound of the wind in the background and some people are talking.", "The boys are playing in the water and talking."], "visual_captions": ["Three men are in a grass field, and one of them swings a baseball bat in an attempt to hit a can of beverage that is thrown at him. Eventually, he succeeds and causes the can to explode.", "The person is playing the basketball game and is thoroughly enjoying it.", "A man is playing baseball with his friends.", "Three men are playing a baseball game."], "audio_visual_captions": ["They are playing baseball in the park.", "Three people are playing on the grassy field.", "Three men are playing a baseball game."], "GPT_AV_captions": ["Three men are playing baseball in a grassy field.", "Three men are playing a baseball game in the park.", "Three men are playing baseball and talking loudly."]}, "4972231631": {"audio_captions": ["The people are talking and working.", "People are talking while they work.", "Some people doing some activity and talking about something."], "visual_captions": ["A man consumes a large amount of delicious food with his extended family.", "A family is seen eating together and they appear to be joyful and happy in their family.", "At a food table, a family is enjoying a variety of foods. A lady opens a box and finds a lot of food inside.", "The food is on the table, and people are happily eating it in the home."], "audio_visual_captions": ["Some people are eating food while others are serving the food.", "The family members are eating at the dining table.", "The entire family is eating delicious food at the dining table and talking to each other.", "The family is eating a variety of foods at the dining table."], "GPT_AV_captions": ["A family is eating a variety of delicious foods at the dining table and talking to each other.", "People are happily eating and talking while some are serving food at the dining table.", "The family members are joyfully eating together and conversing at the dining table."]}, "4981531978": {"audio_captions": ["The old person is speaking and the dog is barking.", "One child and his mother are playing with a dog.", "The boy is talking and laughing."], "visual_captions": ["Two donkeys were following a lady, who was running to the other side.", "A woman is running with a ball in her hand, and two donkeys are running behind her. She runs faster, causing the donkeys to stop and watch her.", "A woman is running and an animal is following her.", "A woman is being followed by two donkeys, and after that, only one donkey runs."], "audio_visual_captions": ["Donkeys are running towards a woman.", "A girl is running around the garden, and two donkeys are following her.", "The donkeys are chasing the woman, and she is happier.", "The Donkeys are chasing a girl and she is running with fear."], "GPT_AV_captions": ["A woman is running with two donkeys following her, and she appears happy.", "A woman is being chased by two donkeys, and she is running with a ball in her hand.", "A woman is running around the garden with two donkeys following her."]}, "4983163710": {"audio_captions": ["The two or more people are talking loudly and laughing.", "Two women are making too much noise. They are talking and laughing with each other, and there are also some disturbing sounds coming from the surroundings.", "The two girls were laughing and speaking loudly."], "visual_captions": ["The women are having a party.", "People are drinking and eating at the table. All the people are enjoying themselves.", "The friends are enjoying a dinner party.", "Girls with drinks in their hands."], "audio_visual_captions": ["There are some women drinking vodka at the dining table and laughing with each other.", "A group of members are eating fruits, drinking, and talking.", "The girls are consuming alcohol and having a good time.", "The women are drinking drinks and then tasting the lemon."], "GPT_AV_captions": ["A group of women are drinking and laughing at a dinner party.", "The women are enjoying themselves, eating, drinking, and talking loudly.", "Friends are having a good time, consuming alcohol and tasting lemon."]}, "4983786005": {"audio_captions": ["The lady is speaking loudly and is being very serious.", "She was speaking to the baby.", "Conversation between the mom and son.", "The woman was speaking seriously."], "visual_captions": ["The boy is cycling and playing in the park.", "A kid was riding a bicycle and fell down. However, he got back on the bicycle.", "A very young child, wearing a helmet, pedals a bicycle down a sidewalk. They make a turn and fall off, but quickly get back on and continue pedaling down the sidewalk.", "A small boy is playing on a bicycle by the roadside.", "The baby boy slipped from the cycle while cycling."], "audio_visual_captions": ["A woman is following a little boy who is learning to ride a bicycle.", "A boy is riding a bicycle.", "A small boy is riding a bicycle and falls down on the grass.", "The child is cycling on the road. The child prioritizes safety by wearing helmet."], "GPT_AV_captions": ["A woman is speaking seriously to a small boy who is learning to ride a bicycle and falls down but gets back up.", "A young child, wearing a helmet, is cycling on the sidewalk and falls off, but quickly gets back on while a woman follows.", "A boy is riding a bicycle, falls down, and gets back up while a woman speaks to him seriously."]}, "4987887725": {"audio_captions": ["A woman is singing a song.", "The music is being played and the woman is singing a song in the background.", "A woman is singing and there is a noisy background sound."], "visual_captions": ["An old woman is playing music.", "A woman is placing a keyboard on the street, and people are giving her money.", "A woman is singing a song on the road, and people are paying her to sing.", "An old woman is playing a musical instrument on the roadside."], "audio_visual_captions": ["A woman is sitting and singing the song.", "A lady beggar sings a song and plays an instrument, then two people give her some money.", "The lady plays a musical instrument."], "GPT_AV_captions": ["A woman is singing a song while playing a musical instrument on the street, and people are giving her money.", "An old woman is playing music and singing on the roadside, and passersby are paying her.", "A woman is performing a song with a musical instrument on the street, and people are donating money to her."]}, "4992338194": {"audio_captions": ["There is background party music and people are enjoying themselves. The party is enjoyable, with everyone, including children, having a good time.", "The friends are enjoying the party and playing games.", "A woman is shouting and people are enjoying in the background.", "Some people are enjoying the party music."], "visual_captions": ["The robot is demonstrating its work in front of people.", "The robot has a very impressive way of moving and observing people.", "The researchers are presenting the final output of the robot.", "More people are watching the robot."], "audio_visual_captions": ["This robot is an experiment conducted by those people. The experiment with the robot is going well, so all the people are smiling.", "A group of people is standing there, watching the robot as it performs a task. They are all cheering and encouraging the robot.", "Introduction and live demonstration of robots."], "GPT_AV_captions": ["People are enjoying a party with background music while a robot is being demonstrated to the crowd.", "The robot is performing tasks impressively, and the crowd, including children, is cheering and smiling.", "Researchers are presenting the robot's final output, and everyone is having a good time at the party."]}, "4999127441": {"audio_captions": ["A group of people is singing a happy birthday song. The celebrant blows out a candle right after, and they all cheer together with applause.", "The birthday celebration is being held.", "A person is celebrating a birthday party."], "visual_captions": ["The father surprised his son with a birthday cake.", "The boy is blowing out the candles on the cake.", "The son spent his birthday with his family.", "A small boy is celebrating his birthday with a cake.", "The birthday boy is experiencing a very happy moment."], "audio_visual_captions": ["A child is celebrating his birthday with his parents.", "The little boy blew out the candle on a birthday cake.", "They are celebrating a boy's birthday.", "The boy blew out the candles on his birthday cake at the party."], "GPT_AV_captions": ["A child is celebrating his birthday with his family, blowing out the candles on his cake as everyone sings and cheers.", "The boy is having a joyful birthday party, surrounded by his parents and receiving applause after blowing out the candles.", "A small boy celebrates his birthday with a cake, his family singing happy birthday and cheering as he blows out the candles."]}, "4999665957": {"audio_captions": ["There are people speaking and shouting in the background.", "The sound of the beep is very audible.", "The people are celebrating a birthday party and everyone is enjoying themselves."], "visual_captions": ["A group of people is celebrating the birthdays of an elderly woman and a man.", "A family is celebrating their parents' anniversary.", "They are celebrating their birthday with cake.", "The entire family is celebrating the birthday party.", "A family is celebrating their grandparents' special day."], "audio_visual_captions": ["The family was celebrating the grandma's birthday.", "They are celebrating a birthday party.", "Celebrating a birthday party with two cakes."], "GPT_AV_captions": ["A family is celebrating a birthday party with two cakes, and everyone is enjoying themselves.", "The family is celebrating the birthdays of an elderly woman and a man, with people speaking and shouting in the background.", "A group of people is celebrating a birthday party, and the sound of a beep is very audible."]}, "5008618500": {"audio_captions": ["A mother and her child were talking about something.", "Both ladies are talking together and expressing their opinions.", "The child is talking with his mom."], "visual_captions": ["A woman is caressing two children.", "A mother is holding a newborn baby and showing it to her older sister.", "A mother is showing her newborn baby to her daughter, and the child is very happy to see the little one."], "audio_visual_captions": ["The mother is caring for her newborn baby, and one child is observing the baby.", "The mother is speaking to the child.", "A mother is explaining her newborn baby to her older child."], "GPT_AV_captions": ["A mother is talking to her child while holding a newborn baby.", "A mother is showing her newborn baby to her older child, who is happy to see the baby.", "The mother is caring for her newborn baby and speaking to her older child."]}, "5013421988": {"audio_captions": ["A child is crying, and then the mother speaks to the child.", "The baby is shouting and the women are talking to this baby.", "A girl is speaking with a lot of smiles."], "visual_captions": ["The child is sitting on a stool chair.", "There is a cute little baby sitting on a small baby chair. The baby is biting everything, such as their finger and the chair. Additionally, there is a white furry dog lying on the floor beside them.", "The baby was playing in the chair and looking at another side. The baby's hand was inside the mouth and looking at other places.", "The baby was sitting and playing."], "audio_visual_captions": ["The child was playing and sitting in a place.", "A baby is sitting in the baby chair and trying to reach for the book nearby.", "The baby is sitting in a small chair and playing in an adorable manner."], "GPT_AV_captions": ["A baby is sitting on a small chair, playing and occasionally biting their finger.", "The baby is sitting in a baby chair, with a white furry dog lying on the floor beside them, while the mother speaks to the child.", "The child is sitting on a stool chair, playing and looking around, with the mother talking to the baby."]}, "5015000984": {"audio_captions": ["A man was walking in the water.", "There is a lake or a river with water.", "This person is very happy and enjoying themselves fully while swimming in the water."], "visual_captions": ["The dog is very happy swimming in the swimming pool.", "A German Shepherd dog is happily swimming in a pool. Two other dogs and a man can be seen in the video.", "A dog is swimming in the swimming pool.", "There is a dog swimming in the pool. Another dog is on the other side of the pool. There is also a man lying on a chair and watching the dog.", "The German Shepherd dog is swimming in the pool."], "audio_visual_captions": ["A dog is splashing in a pool, swimming, and then it swims to the side to exit the pool and shakes.", "The dog is playing in the swimming pool.", "A dog is currently swimming in the water.", "The dog is playing in the swimming pool."], "GPT_AV_captions": ["A German Shepherd dog is happily swimming and splashing in a pool, with two other dogs and a man nearby.", "The dog is enjoying itself while swimming in the pool, with another dog on the other side and a man watching from a chair.", "A dog is swimming in the pool, then swims to the side to exit and shakes off the water."]}, "5017166671": {"audio_captions": ["There is a music party happening.", "A boisterous crowd is cheering while a performer sings, and the sound of instruments accompanies in the background.", "Many musicians are playing their instruments and a singer is singing a song on the stage.", "There is good music playing and some enjoyable activities happening."], "visual_captions": ["Many musicians are sitting on the stage and playing their instruments.", "The musical band is playing good and lively songs.", "A group of people are singing a song and playing musical instruments to enjoy the function. The people are encouraged to do so.", "The six people plays the piano, guitar, and violin to create beautiful music."], "audio_visual_captions": ["There are four members playing music.", "The orchestra is playing an instrument while the man is singing on the stage.", "The group of musicians is playing the music.", "The music is very pleasant."], "GPT_AV_captions": ["A group of musicians is playing various instruments on stage while a man sings, creating a lively and enjoyable atmosphere.", "Many musicians are performing on stage, playing instruments like the piano, guitar, and violin, with a boisterous crowd cheering them on.", "The musical band is delivering a pleasant performance with a mix of singing and instrumental music, engaging the audience in the celebration."]}, "5029903979": {"audio_captions": ["The baby is shouting while people are talking in the background.", "The music is heard very well.", "The baby is shouting, the TV is playing music, and the father is talking with their baby."], "visual_captions": ["A man took a small toy from a baby's hand while the baby was trying to put it in its mouth.", "A baby is playing with a toy and laughing.", "A baby boy is playing with his dad.", "The baby boy is playing with his father."], "audio_visual_captions": ["The baby was having fun with his father.", "It is a baby playing with a toy.", "The baby is smiling and talking with their dad, and the baby is also playing with a toy.", "The child is playing with his father.", "A baby boy is holding the toy, and his grandfather takes the toy to the baby for him to play with. The baby is trying to grab the toy with his lips."], "GPT_AV_captions": ["A baby boy is playing with his father, laughing and shouting while the TV plays music in the background.", "The baby is smiling and talking with his dad, trying to grab a toy with his lips as his father takes it from him.", "The baby boy is having fun with his father, playing with a toy and making noise while people talk in the background."]}, "5033359225": {"audio_captions": ["Two people were talking, but it was very noisy.", "One person is shouting while others are laughing.", "Driving the car or bike."], "visual_captions": ["A lifeboat is pulling another boat with guests in a lake.", "Six people are enjoying their water ride.", "There is a ship heading out to sea with a group of six people on board. The ship has a very impressive appearance.", "The jet ski was connected to a regular boat for a ride along the entire river."], "audio_visual_captions": ["Six humans are riding in a boat.", "People are playing in the river and riding the boat.", "Many people are boating in the water.", "Two boats are riding in the river. One boat is following the other boat."], "GPT_AV_captions": ["Six people are enjoying a boat ride in the river, with one boat pulling another.", "People are riding boats in the river, having fun and laughing despite the noise.", "Two boats are moving along the river, with one boat towing the other."]}, "5041383030": {"audio_captions": ["A man is speaking while some people are laughing in the background.", "A man tells a joke to make the lady smile.", "Conversation between them is good and healthy."], "visual_captions": ["A group of family members is having a discussion about an important matter. In the video, there are three women and two men present. It appears that one of the men is taking the lead and doing most of the talking.", "The father was talking with the family and explaining something.", "A man is talking about his thoughts.", "Two people are talking in the room.", "The man is telling a story to others."], "audio_visual_captions": ["The people are speaking.", "Two elderly men and two elderly women are engaged in conversation.", "The man is speaking to the person.", "The entire family is spending time together, speaking and enjoying each other's company.", "Many people are sitting on the sofa and discussing interesting matters that others find enjoyable to listen to. They are also engaging in conversation with laughter."], "GPT_AV_captions": ["A man is speaking to his family, making them laugh and smile while discussing an important matter.", "The family, consisting of three women and two men, is having a lively conversation with laughter and enjoyment.", "The father is leading a discussion with the family, sharing his thoughts and stories, creating a good and healthy conversation."]}, "5042865125": {"audio_captions": ["This baby was laughing, enjoying the parents' cute, beautiful, interesting, and happy presence.", "It sounds like a game involving children shooting guns.", "The parent is talking to their child. The child's voice is sweet."], "visual_captions": ["A woman is carrying a large toy helicopter and walking towards a child who is playing with a small helicopter. She shows the helicopter to the child.", "Mom is helping her child arrange the toys.", "The mom is playing with her daughter."], "audio_visual_captions": ["The mother and son enjoy playing together, which is very fun, lovely, and caring.", "A woman is entertaining a young child by playing with him.", "The mother is playing with the baby.", "A mother and son were playing with toys.", "The kid and mother are playing a game."], "GPT_AV_captions": ["A mother is playing with her child, showing a large toy helicopter while the child plays with a small one.", "The mother and her son are enjoying a fun and lovely time together, arranging and playing with toys.", "The mom is engaging her baby in a playful and caring manner, making the child laugh and enjoy the moment."]}, "5049587564": {"audio_captions": ["There is a baby shouting and two children are talking loudly.", "The women and the baby are playing in the water.", "The ladies  are talking and shouting. They are very lively."], "visual_captions": ["A group of kids is holding a large ring and sitting down.", "The children are playing in a park.", "Six children were playing with the ring in front of their parents.", "Children played with a round tube.", "The children are playing in the playground and enjoying themselves. They are having a ring in their hands while sitting and playing."], "audio_visual_captions": ["A group of children is playing with a ring on the ground.", "Children are playing in the park with their parents' guidance.", "A group of children is playing in the ground.", "Children enjoy playing at the park.", "The group of kids is holding the circular ring with their fingers to balance it evenly while playing on the ground."], "GPT_AV_captions": ["A group of children is playing with a ring in the park, enjoying themselves while their parents watch.", "The children are lively and shouting as they play with a large ring on the playground.", "Six children are sitting and holding a circular ring, playing energetically while their parents are nearby."]}, "5050116958": {"audio_captions": ["The statements in this conversation are spoken by multiple people, including a sweet male voice.", "There are some conversations between them.", "Many people are talking about various matters and there are small noises in the background. One woman was speaking loudly about some argumentative matters and also laughing."], "visual_captions": ["A man is talking about his friend.", "A group of people are staying at home and enjoying themselves with friends, then engaging in conversation with everyone.", "The family is very happy/enjoying themselves."], "audio_visual_captions": ["People are talking and doing some activities.", "The friends are enjoying themselves.", "The people are having fun, they are friends. They are shooting a video for social media."], "GPT_AV_captions": ["A group of friends are at home, talking and enjoying themselves, with some background noises and laughter.", "People are having fun and engaging in conversations, with a woman speaking loudly at times.", "Friends are enjoying their time together, talking about various matters and shooting a video for social media."]}, "5056964274": {"audio_captions": ["Men and women are speaking in unintelligible sounds.", "A woman was discussing something.", "A woman is speaking to a child while people are walking in the background."], "visual_captions": ["A boy is currently drinking the juice.", "The child is consuming a soft drink.", "The child is drinking juice and eating bread.", "A boy is drinking the juice."], "audio_visual_captions": ["The child is drinking cold drinks and eating some food.", "There is one child drinking the juice. The child is having the snacks.", "The baby was drinking juice.", "A child was enjoying his juice.", "Someone gave juice and bread to a small baby."], "GPT_AV_captions": ["A child is drinking juice and eating bread while people are walking in the background.", "A boy is drinking juice and having snacks.", "A child is enjoying juice and some food."]}, "5064681723": {"audio_captions": ["The birds are making sounds in the park.", "The person is commenting on a picture of a wolf and expressing gratitude to the viewer.", "The woman speaks softly in moments of silence."], "visual_captions": ["In the early morning, people were walking with their baby and dog, and then they watched deer along with others.", "There are some deer standing in the forest.", "In a forest, there are two men, a baby, and a dog, all of whom are watching deer."], "audio_visual_captions": ["The man was capturing the video of deer.", "Deer are found in forest areas, and people visit them with their toddlers and pets.", "The deer are searching for food."], "GPT_AV_captions": ["In the early morning, people with their baby and dog are watching deer in the forest.", "The man is capturing a video of the deer while birds are making sounds in the park.", "The woman speaks softly in moments of silence as the deer search for food."]}, "5070310138": {"audio_captions": ["A little girl is speaking with another person.", "The baby was laughing a lot, and the father was discussing how cute the baby was. They were both happy and enjoying the baby.", "The baby is saying something and the man is responding.", "The person and the baby are speaking."], "visual_captions": ["The baby is playing with toys while taking a bath.", "A baby was playing with water.", "The father is watching the kid play in the bathtub.", "A child is playing in the bathtub."], "audio_visual_captions": ["A baby was having fun with his father in the tub.", "The child had fun with his father.", "The baby was playing with the water.", "A baby is playing in the bathtub in front of their dad."], "GPT_AV_captions": ["A baby is playing with water in the bathtub while the father watches and responds to the baby.", "The baby is having fun in the bathtub, interacting with the father who finds the baby cute and laughs along.", "A child is enjoying bath time, playing with toys and water, while the dad engages in conversation with the baby."]}, "5082198541": {"audio_captions": ["The baby is crying and making loud noises.", "The baby is making annoying sounds and there is some background noise.", "The baby is laughing and playing."], "visual_captions": ["A baby is playing with a cat. The baby is very happy with the cat. The baby and the cat are slowly going to another place.", "A little boy and a cat are playing.", "One child is playing with a cat.", "The baby boy is playing with a cat."], "audio_visual_captions": ["A baby is playing with a cat, pulling its tail and crawling on the floor.", "The child is playing with a cat.", "The child is playing with a cat."], "GPT_AV_captions": ["A baby is playing with a cat, pulling its tail and crawling on the floor.", "A baby is playing with a cat and making noises.", "A baby boy is playing with a cat and making sounds."]}, "5082890299": {"audio_captions": ["The baby was playing with his or her parents.", "A child is crying and people are laughing.", "Mom and the child are enjoying themselves."], "visual_captions": ["A father is playing with his child by letting the air out of the balloon.", "The baby is playing with her father, playing a balloon game.", "A man is playing with a child, and the child is laughing.", "A man is playing with his son with a balloon.", "The baby was playing with a balloon."], "audio_visual_captions": ["The man is blowing a balloon, and the baby is laughing loudly.", "A man is playing with a baby and a balloon.", "Dad shows the child a balloon game."], "GPT_AV_captions": ["A man is playing with his child using a balloon, and the child is laughing.", "The baby is playing with a balloon while the parents are enjoying themselves.", "A father is entertaining his baby with a balloon game, and the baby is laughing loudly."]}, "5096827532": {"audio_captions": ["The birthday party is currently happening and the process of cutting the cake has begun.", "A girl is singing a song.", "The party is for the baby's birthday."], "visual_captions": ["The children are excited about the birthday party.", "The little girl celebrated her birthday with her family.", "A child was enjoying his birthday cake.", "The baby blew out the birthday cake candle."], "audio_visual_captions": ["One child has a birthday, and their family is celebrating the birthday party. There is one mother and two children enjoying the party.", "He is celebrating his birthday with his family.", "The baby looked adorable while celebrating their birthday with this cake and seemed very happy and enjoyed eating it."], "GPT_AV_captions": ["A baby is celebrating their birthday with their family, and the children are excited about the party.", "The baby blew out the birthday cake candle and looked adorable while enjoying the cake.", "A girl is singing a song during the birthday party, and everyone seems very happy."]}, "5104115508": {"audio_captions": ["Playing a musical instrument while hearing people's sounds in the background.", "There is live music playing and people can be heard having conversations in the background.", "The music program is currently playing."], "visual_captions": ["A couple was cutting their wedding cake.", "The wedding anniversary cake is cut at  the party .", "The bride and groom are cutting the cake at their wedding reception.", "The people are celebrating anniversary by cutting cake.", "Married couple is cutting a cake at a function."], "audio_visual_captions": ["During a wedding ceremony, the couple cuts the cake while a guest takes a video.", "A newly married couple is cutting the cake while people are watching in the background.", "A birthday party is taking place where a man and a woman are cutting the cake.", "The couple is cutting the wedding cake and enjoying it.", "The couple is cutting the cake. The cake's color is black and white."], "GPT_AV_captions": ["A couple is cutting their wedding cake while live music plays and people converse in the background.", "The bride and groom are cutting the cake at their wedding reception with guests watching and music playing.", "During a wedding ceremony, the couple cuts the cake as guests celebrate and a musical performance is heard."]}, "5107014713": {"audio_captions": ["The people are making background noise.", "The noise of many people is loud.", "A woman is talking loudly, and people are shouting and making noise in the background."], "visual_captions": ["The elephant is walking and playing.", "The two elephants were eating the pumpkin.", "An elephant is holding a pumpkin with its trunk."], "audio_visual_captions": ["The elephants are walking out of the room and attempting to eat some fruits, while the crowd surrounding the elephants is shouting happily.", "The elephant comes out of the room and eats the pumpkin while all the people are shouting in the background.", "Two elephants came to the curve and ate the big fruit in the zoo. The people were encouraging it."], "GPT_AV_captions": ["Two elephants are walking out of the room and eating pumpkins while people are shouting and making noise in the background.", "The elephants are playing and eating pumpkins as the crowd surrounding them shouts happily.", "An elephant is holding a pumpkin with its trunk while people in the background are making loud noises and shouting."]}, "5107391081": {"audio_captions": ["Multiple adults are laughing and talking intermittently, while a young child laughs and makes noise occasionally in the background.", "The baby was playing in the water with daddy.", "A baby is shouting and people are talking around.", "The baby is shouting while people are talking in the background."], "visual_captions": ["The mom and dad teach the child swimming.", "His daughter is practicing swimming.", "Two people are playing with one child in the river.", "A baby is attempting to swim, and the baby's parents are helping the baby swim.", "A man helped the baby to swim."], "audio_visual_captions": ["Her husband cracked a joke and they were laughing.", "The baby and parents are playing in the pool.", "The family is enjoying themselves in a pond with a child."], "GPT_AV_captions": ["A baby is playing in the water while the parents help and laugh together.", "The family is enjoying themselves in a pond, with the baby attempting to swim.", "The baby is shouting and laughing as the parents teach swimming in the water."]}, "5107595441": {"audio_captions": ["It sounds like someone is talking.", "Someone is watching television.", "The man is engaging the audience."], "visual_captions": ["Cats and kittens are eating food.", "The cat was eating while two cats were watching.", "The cats were playing and eating food.", "The owner was playing with three cats.", "There are many cats on the bed. One small cat is eating, while another one is playing with a person. The big cat is sitting and eating while looking in another direction."], "audio_visual_captions": ["The boy is playing with three cats.", "There are many cats on the bed. One of them is a big cat, and another cat is eating. Another cat is playing with a person, and these cats are playing. The big cat is eating and sitting.", "There are three cats sitting and one cat eating the food. Next, another cat is playing with the man."], "GPT_AV_captions": ["A man is playing with three cats on the bed; one cat is eating, another is playing, and a big cat is sitting and eating while looking in another direction.", "There are many cats on the bed; one small cat is eating, another is playing with a person, and the big cat is sitting and eating.", "The man is engaging with the audience while playing with three cats; one cat is eating, another is playing, and the big cat is sitting and eating."]}, "5112223863": {"audio_captions": ["Friends enjoyed the birthday celebration party.", "Some people are singing in a group.", "People are enjoying the party with their friends.", "Friends and relatives are enjoying the party."], "visual_captions": ["The child is enjoying a lot at their birthday celebration.", "Mom is celebrating her kid's birthday.", "A baby is celebrating his birthday with his friends by blowing out sparkling candles.", "Three children are enjoying the birthday party."], "audio_visual_captions": ["The lady and three babies are celebrating the birthday, and they are blowing out the candle.", "The birthday baby was cutting cake.", "It was a birthday celebration for a baby!"], "GPT_AV_captions": ["A baby is celebrating their birthday with friends and family, blowing out sparkling candles.", "Friends and relatives are enjoying the birthday party, singing and celebrating together.", "A mother is celebrating her child's birthday, and the child is cutting the cake with friends."]}, "5112579753": {"audio_captions": ["A baby is making \"Owh\" sounds in a quiet environment.", "A baby is making some annoying sounds.", "The baby is playing a game with its mother."], "visual_captions": ["The baby plays and drinks the milk. It is so cute.", "One child is playing and drinking some milk from a bottle.", "The baby is drinking milk that her mom is feeding to him in a bottle.", "Feeding milk to the baby."], "audio_visual_captions": ["The baby is drinking a bottle of milk.", "The baby was drinking very well.", "The baby is drinking the milk more actively."], "GPT_AV_captions": ["A baby is making sounds while drinking milk from a bottle.", "The baby is being fed milk from a bottle by its mother.", "The baby is actively drinking milk and making noises."]}, "5116088152": {"audio_captions": ["A girl is speaking to someone.", "Two people had a conversation about their favorite fruits.", "The women and the man are sharing the fruits and eating."], "visual_captions": ["The baby is eating the apple, and it is very tasty.", "The baby was eating fruits, and the fruits are bananas. We are seeing something very beautiful.", "The kid is chewing the fruits."], "audio_visual_captions": ["The baby is eating fruits, and their parents are recording it.", "A baby tries to eat fruits like bananas.", "The cute baby is eating a banana.", "The baby is eating a banana.", "The child is eating a banana."], "GPT_AV_captions": ["A baby is eating a banana while their parents are recording it.", "The baby is enjoying a banana, and their parents are capturing the moment.", "A child is eating a banana, and their parents are filming the scene."]}, "5133435424": {"audio_captions": ["The baby was happy to talk to the father.", "A man is playing with a child, and both the child and the man are laughing. Then, a woman joins them, and she is also laughing.", "The man is playing with the child and laughing. The child is shouting and playing.", "A man is talking to the child."], "visual_captions": ["A man, who is wearing sunglasses, assists a blonde boy in putting on a pair of sunglasses. Afterward, they both laugh, take a selfie, and the man shows the boy the camera.", "The child is playing with their dad with camera.", "A baby is sitting and playing with his dad.", "Dad and son are wearing sunglasses.", "The dad and son were taking a picture on a camera."], "audio_visual_captions": ["A small boy and a man are wearing sunglasses and taking pictures with a camera.", "The dad is taking a selfie with his son while people are watching in the background.", "The father and child were playing on the bed."], "GPT_AV_captions": ["A man and a child, both wearing sunglasses, are laughing and taking selfies with a camera.", "A father and his son are playing and laughing together, with the father helping the son put on sunglasses.", "The dad and his son are enjoying their time together, taking pictures and playing on the bed."]}, "5139813648": {"audio_captions": ["The lady speaking to the baby and both enjoy it.", "A lady is talking with a baby in the background.", "The baby is shouting and people are talking."], "visual_captions": ["The two babies are playing.", "The children are playing with full of joy.", "A cute brother and sister are playing together."], "audio_visual_captions": ["Two children are playing at home.", "Two children are playing with the ball happily.", "Two children are playing in their house."], "GPT_AV_captions": ["Two children are playing joyfully at home.", "A lady is talking while two children play happily.", "Two children are playing together with a ball in their house."]}, "5144319075": {"audio_captions": ["A child is laughing while an adult periodically talks to the child.", "A baby is laughing here, and the father is playing with the baby.", "A child is laughing while people are walking in the background."], "visual_captions": ["The baby was walking step by step in their first attempt.", "The father was playing with the children.", "A boy is playing with his sibling."], "audio_visual_captions": ["A sister enjoys teaching her younger sibling how to walk.", "The man is holding the hand of the small baby, and another child is walking. Both children are playing and laughing loudly.", "The father and younger child gave some training to their baby on how to walk, and the baby was very happy to walk alongside their brother and father.", "Two kids are trying to walk, run, and enjoy themselves."], "GPT_AV_captions": ["A father is playing with his children, and the baby is laughing while trying to walk for the first time.", "A man is holding the hand of a small baby, and another child is walking and laughing in the background.", "A baby is happily taking their first steps with the help of their father and sibling, while everyone laughs and enjoys the moment."]}, "5145149014": {"audio_captions": ["The baby is crying and the mother is caring for him/her.", "The baby was crying, so a woman and a man were talking to the baby.", "A baby is crying and a person's voice is heard in the background."], "visual_captions": ["A baby is enjoying with his beloved family member.", "The father is playing with his young child.", "A baby is playing with man."], "audio_visual_captions": ["A man is playing with a baby while a woman is talking in the background.", "The baby was watching their mother speak.", "A mother is playing with the child in the room."], "GPT_AV_captions": ["A baby is crying while a man is playing with him and a woman is talking in the background.", "A baby is being cared for by a man while a woman speaks in the background.", "A baby is crying and being comforted by a man, with a woman talking nearby."]}, "5145526755": {"audio_captions": ["While starting the motor, some people are traveling in the background.", "There are women speaking in the background.", "This person is talking silently and motor sound, which is very loud, as there is starting trouble in this machine."], "visual_captions": ["Two lions are sitting in the forest.", "In the forest, there is one lion sleeping on one line, and two lions are simply sitting on another line.", "The lion is sleeping in the yard.", "Lions are resting in the forest.", "There are two female lions, one is sleeping and the other is sitting."], "audio_visual_captions": ["Two lions are sitting in the forest.", "The main focus is on animals, such as lions.", "Two female lions are sitting and tourists are visiting the lions."], "GPT_AV_captions": ["Two female lions are sitting in the forest while tourists are visiting.", "Lions are resting in the forest with the sound of a motor starting in the background.", "Two lions are in the forest, one is sleeping and the other is sitting, with people talking in the background."]}, "5148501793": {"audio_captions": ["Some people are enjoying the beach, and the children are playing very happily.", "The sound of the river and the sound of many people.", "The rain is very heavy, and the man and child are watching the rain and enjoying it very much."], "visual_captions": ["The baby is playing in the sand.", "The baby was playing games in the beach.", "The baby is playing in the beach and is very, very cute."], "audio_visual_captions": ["A child was playing on the beach.", "A girl is digging sand on the beach with a woman.", "A baby is playing on the beach while people are talking in the background.", "A child is playing at the beach and she is very happy."], "GPT_AV_captions": ["A baby is playing on the beach while people are talking in the background and the sound of the river can be heard.", "A child is happily playing in the sand at the beach, enjoying the moment despite the heavy rain.", "A girl is digging sand on the beach with a woman, surrounded by the sounds of many people."]}, "5149181269": {"audio_captions": ["A mother and baby are playing.", "The child is trying to talk to their mom and smiles and the mom speaks to the child.", "The mother and the baby are playing with a smile.", "When a baby tries to speak, the mother appreciates it and responds."], "visual_captions": ["A cute little baby boy is playing with his dogs in the house.", "A baby boy was playing with two pet dogs!", "The little baby is playing with the dogs and is very happy.", "The baby is playing with dogs and toys."], "audio_visual_captions": ["A baby is playing with the dogs.", "The baby is playing well with the dogs.", "The baby is playing with the dogs."], "GPT_AV_captions": ["A mother and her baby boy are playing with their dogs in the house.", "The baby boy is happily playing with the dogs while his mother talks to him.", "The mother smiles and responds as the baby boy tries to speak while playing with the dogs."]}, "5162562403": {"audio_captions": ["The dogs are barking at one another.", "The dog is barking loudly.", "A man is talking with a background of dog sounds."], "visual_captions": ["The black and white dogs are playing with the dog owner.", "The two dogs are shouting loudly.", "A boy is playing with a black dog and a white dog.", "Two dogs are playing with their owner."], "audio_visual_captions": ["A dog and a boy are playing with a big dog while another man is working on the laptop.", "The two dogs are barking loudly.", "The man was playing with the big dog and trying to save the small dog.", "A dog is continuously barking at another white dog. A boy attempts to play with the white dog, but the dog is clearly uncomfortable. Meanwhile, a man is working on his laptop."], "GPT_AV_captions": ["Two dogs, one black and one white, are barking loudly while playing with a boy.", "A boy is playing with two dogs, one black and one white, as a man works on his laptop in the background.", "The dogs are barking at each other while a boy tries to play with them, and a man is seen working on his laptop."]}, "5165840822": {"audio_captions": ["One person is speaking, and there is a lot of background noise.", "A baby's sounds can resemble crying or playing.", "The baby is playing and watching TV.", "People are talking in the background."], "visual_captions": ["The baby is playing with toys.", "A newborn baby is playing with toys.", "The baby is playing with toys and they are shouting with them, while the mother is playing with her baby.", "The baby starts crying and then plays with the toys."], "audio_visual_captions": ["The baby is playing with its mother and a toy.", "The baby is lying down and murmuring.", "The baby is playing with toys.", "The baby was sleeping on the bed."], "GPT_AV_captions": ["A baby is playing with toys while people are talking in the background.", "A baby is playing with its mother and making sounds that resemble crying or playing.", "A baby is lying down, murmuring, and then starts playing with toys."]}, "5166736368": {"audio_captions": ["The baby was playing while the mom was talking to the baby.", "The baby is shouting, and the mom is talking to the baby.", "A small baby is playing with toys, and then the mother talks to the child."], "visual_captions": ["The child was playing with toys.", "A baby is sitting on the ground, playing with multiple toys and drooling.", "The baby was playing with many different kinds of toys.", "The baby was playing."], "audio_visual_captions": ["A baby is playing with toys.", "A baby is playing with many children's toys.", "One child is playing with the ball."], "GPT_AV_captions": ["A baby is playing with toys while the mom talks to the baby.", "The baby is sitting on the ground, playing with multiple toys.", "A small baby is playing with toys, and the mother is talking to the child."]}, "5166753093": {"audio_captions": ["People are singing a song.", "A music album is playing on the electronic device, but it is being interrupted by some kids' voices.", "There is music playing in the background and a baby is laughing."], "visual_captions": ["The baby was riding a bicycle in the dining room, going around in circles.", "A child is playing with a bicycle.", "The baby is enjoying the ride while cycling.", "A small boy is riding a bicycle.", "The little boy is riding the cycle around the dining table."], "audio_visual_captions": ["A child is riding the bicycle and going around the dining table.", "The boy is playing with his mom and riding a bicycle around.", "The small boy is riding the bicycle around the dining table. The person says something, and the boy stops riding the cycle.", "A boy is playing with a bicycle in the dining area."], "GPT_AV_captions": ["A small boy is riding a bicycle around the dining table while music plays in the background and a baby laughs.", "A child is riding a bicycle in the dining room, going around in circles, with music playing and kids' voices interrupting.", "The boy is enjoying his ride on the bicycle around the dining table, accompanied by background music and laughter."]}, "5173216136": {"audio_captions": ["There are some people enjoying in the party with music.", "A lively, upbeat song sung by a female vocalist, accompanied by the sounds of clapping and cheering from the audience.", "The song party and some members of the audience are singing along with the song party. Some are singing loudly in the background."], "visual_captions": ["A small boy is jumping into his mom's hand.", "The child is attempting to walk with assistance.", "A child is practicing dancing and her mom teaches her.", "The mother is playing with her child. The lady is holding the younger boy's arms and practicing dancing with him, transitioning to walking.", "The mother is dancing with her child for fun."], "audio_visual_captions": ["A woman is playing with a baby. The baby is dancing to a song.", "The baby is dancing with mom and it is very funny.", "The child is playing with their mother."], "GPT_AV_captions": ["A woman is playing and dancing with her child to a lively, upbeat song sung by a female vocalist, with clapping and cheering from the audience.", "The mother is holding her child's arms, helping them dance and walk while enjoying the music and the party atmosphere.", "A child is dancing and playing with their mom, accompanied by a cheerful song and audience participation."]}, "5177755044": {"audio_captions": ["The people are talking about baby pictures.", "The baby is playing a game.", "The child is playing with toys and is very naughty.", "The baby is playing a game at home."], "visual_captions": ["A child is playing with the toy.", "A baby is playing with a toy car.", "The children played in front of their mother at home."], "audio_visual_captions": ["The baby is playing with the toys.", "The baby is playing with a toy while sitting.", "The baby is playing with the toys and also trying to eat the toy car.", "The baby is sitting and playing."], "GPT_AV_captions": ["A baby is playing with a toy car at home.", "The baby is sitting and playing with toys.", "The child is playing with toys and is very naughty."]}, "5178539050": {"audio_captions": ["A lady is saying something and remaining silent.", "Two people are discussing something.", "A girl is speaking with another person.", "The girl is both singing and speaking."], "visual_captions": ["She was working on her laptop and she loves her dog.", "A person is sitting near a dog while using a laptop.", "The dog was sleeping inside the house.", "A dog is playing with a girl while she is working on a laptop."], "audio_visual_captions": ["The woman was playing with the dog.", "The worker work with their pets.", "The woman who is working is playing with her dog.", "The person has a laptop and one dog, which brings them happiness.", "A dog is playing with a girl while the girl is working on a laptop."], "GPT_AV_captions": ["A woman is working on her laptop while playing with her dog.", "A girl is speaking and singing while interacting with her dog and using a laptop.", "Two people are discussing something while a dog is present in the house."]}, "5179297688": {"audio_captions": ["A baby and a person are talking in the house.", "The woman is speaking to her husband.", "A father, a mother, and a baby were engaged in conversation and enjoying themselves.", "The baby girl is speaking with her mother and father."], "visual_captions": ["The baby is playing with the mom, picking up the coffee cup, speaking to the mom, and walking.", "A woman is asking a child to choose a cup between two cups.", "The child is talking to the mother. The mother has two cups and asks which cup the child wants. They select one and go outside.", "The mother was playing with the child.", "The baby is choosing a cup from her mom and they are walking."], "audio_visual_captions": ["A mother is having a conversation with her child while holding tea cups.", "A baby girl is talking with her mother.", "Mom is playing with the kid and talking."], "GPT_AV_captions": ["A mother and father are talking with their baby girl in the house.", "The baby girl is choosing a cup from her mother and they are walking.", "The mother is playing with her baby girl and asking her to choose between two cups."]}, "5182578763": {"audio_captions": ["A few people are talking and laughing.", "Some people are talking and laughing.", "A person and his two friends were laughing having an interesting conversation"], "visual_captions": ["Two robots are fighting each other.", "A machinery was demonstrated, and three people saw it.", "The boy was testing a project with the machine."], "audio_visual_captions": ["A man and a woman are playing with a robot.", "Two men are playing with a device while others in the background are laughing and commenting.", "A person is playing with the toy.", "A group of students are conducting an experiment with their innovation."], "GPT_AV_captions": ["A group of people are talking and laughing while interacting with a robot.", "Two men are demonstrating a device as others in the background laugh and comment.", "A person and his friends are testing a project with a machine, engaging in conversation and laughter."]}, "5185070620": {"audio_captions": ["Two adults are talking to a child about a toy.", "A woman is speaking with a little baby.", "A mom and daddy are playing with their baby here."], "visual_captions": ["A baby is playing with their dad, and the baby is cute.", "A child is currently engaged in playing with toys.", "A baby is playing with toys.", "A child is playing with his father.", "A child is playing with his dad."], "audio_visual_captions": ["A man is playing with a small boy.", "The child is playing with their toy.", "The child is a boy who is playing with toys."], "GPT_AV_captions": ["A mom and dad are talking to their baby while the baby plays with toys.", "A child is playing with his dad and toys.", "A baby boy is playing with his father and toys."]}, "5192910012": {"audio_captions": ["The two children are speaking loudly.", "Two children are talking loudly.", "The sound of a cooker whistle can be heard as the baby girl and her mother engage in conversation.", "The children are playing while the background sound is of a train."], "visual_captions": ["A boy is playing a ride game.", "The little boy plays and drives the scooter.", "A small boy is playing with a toy in the garden.", "He was playing with a motorcycle."], "audio_visual_captions": ["The child is playing with the toy car.", "A little boy is driving his car and talking to his parent.", "A boy is riding the small bicycle."], "GPT_AV_captions": ["A little boy is playing with a toy vehicle in the garden while talking loudly.", "The sound of a cooker whistle can be heard as the boy plays and talks to his parent.", "Two children are playing and talking loudly, with background sounds of a train."]}, "5196883885": {"audio_captions": ["A baby is laughing and learning to talk with his or her mother and father.", "The child is smiling and playing.", "The people are talking to the babies with happiness."], "visual_captions": ["The father and son are playing happily and enjoying themselves.", "A young boy is trying to walk from one person to another with assistance.", "A baby is taking their first steps, so the parents are very happy and the baby is also happy. The baby is playing."], "audio_visual_captions": ["A baby boy is playing with his mother and father by walking to them.", "The baby is playing with his dad and mom.", "A child is playing with his mother and father, and they are encouraging the child."], "GPT_AV_captions": ["A baby boy is playing with his mother and father, learning to walk and talk while they encourage him with happiness.", "The baby is taking his first steps with assistance from his parents, who are very happy and enjoying the moment.", "The child is smiling and playing with his mom and dad, who are talking to him and celebrating his progress."]}, "5202829963": {"audio_captions": ["They are singing the song.", "A man is singing ABC rhymes while some children are talking loudly.", "They sang the song with the children, and after they finished, everyone clapped.", "A man is singing a song for a child."], "visual_captions": ["A man is playing the guitar with two kids on his lap, while two women and a few kids are enjoying the song.", "A baby is listening to our songs and playing with their mother and father.", "A man is playing the guitar and singing with his two kids."], "audio_visual_captions": ["A man is teaching rhymes while babies in the background are enjoying and clapping.", "A family of people and six children are playing and attending a music class in the background.", "The parents are teaching the children how to play musical instruments.", "The parents are teaching with their children. They teach how to play musical instruments."], "GPT_AV_captions": ["A man is playing the guitar and singing ABC rhymes with two kids on his lap, while other children and adults are enjoying and clapping.", "A man is singing a song and playing the guitar with his two kids, while a family and several children are attending a music class.", "A man is teaching rhymes and playing the guitar with his children, as other kids and adults enjoy and clap in the background."]}, "5202975055": {"audio_captions": ["The music was playing in the background.", "A girl is singing a song.", "The song is currently playing, and there is a significant amount of noise in the background.", "Playing music and enjoying the sound of the music.", "People are enjoying the songs."], "visual_captions": ["The friends are playing instruments and singing songs for the concert.", "Two girls and a man are playing the guitar and singing the song.", "Men and women are singing a musical song."], "audio_visual_captions": ["The two girls are singing on the stage with the music band.", "Some people are playing the guitar and others are enjoying themselves at the function.", "A live singing concert."], "GPT_AV_captions": ["Two girls are singing on stage with a music band, while people are enjoying the concert.", "A group of friends, including two girls and a man, are playing instruments and singing at a live concert.", "Music is playing in the background as people enjoy the live performance with guitars and singing."]}, "5206737488": {"audio_captions": ["Two people are talking to each other while other people are laughing in the background.", "A group of people were talking and the woman was laughing.", "Two or more people are talking loudly."], "visual_captions": ["Two women are sitting in the conference area and they are rotating the spring on the table while they talk about it.", "There is an object rotating on the table.", "All of the ladies are attending the meeting, but one lady is playing with some things."], "audio_visual_captions": ["The funny game in the office involves friends and the boss in fun activities.", "There is an object rolling on the table.", "The women are playing in their meeting hall while people are laughing in the background.", "There are two women in the meeting hall. One woman is speaking to the hall."], "GPT_AV_captions": ["Two women are sitting in the meeting hall, talking and laughing while rotating an object on the table.", "A group of people are talking and laughing in the background as two women play with an object during a meeting.", "In the conference area, two women are engaged in a conversation and playing with a rotating object, while others laugh in the background."]}, "5208873554": {"audio_captions": ["The two children are speaking.", "There are two people speaking in the background of the audio.", "A girl speaking in an unfamiliar language and some annoying sounds in the air."], "visual_captions": ["A man and a child are cycling in the forest.", "A father and his child are happily enjoying a bike ride in the forest. Another cyclist is joining them.", "The dad and baby boy ride a bicycle.", "The boy and the child are riding a bicycle."], "audio_visual_captions": ["A man is traveling on a bicycle with a child and a woman shooting that.", "A man is riding a bicycle with a child.", "The mother is shooting the camera. The children are riding bicycles. Then the elder boy drives while the younger boy sits in the back.", "A man is riding a bicycle with a cute baby sitting on the back, looking at the fresh area.", "here is one man driving the cycle and one child sitting on the back seat of the cycle."], "GPT_AV_captions": ["A man is riding a bicycle with a child in the forest, while a woman is filming them.", "A father and his child are enjoying a bike ride in the forest, with another cyclist joining them.\n", "A man is cycling with a child on the back seat, and there are sounds of children speaking in the background."]}, "5209164320": {"audio_captions": ["The people are talking and then they all start singing.", "Both of them are singing a song in a happy mood.", "The members play musical instruments and sing songs.", "This is a party and the mood is joyful."], "visual_captions": ["Some people are playing musical instruments.", "A group of people play musical instruments, such as the guitar, and sing songs to enjoy themselves.", "Four people are sitting, including one man and one woman who are playing the guitar. The lady on the left side is dancing while sitting, and they are all enjoying playing and singing happily."], "audio_visual_captions": ["Both the male and female were talking and singing eventually.", "A man and a woman were studying the guitar while another woman was playing the mouth horn, and the family members were enjoying it.", "The family is enjoying by playing music."], "GPT_AV_captions": ["A group of people, including a man and a woman, are playing musical instruments like the guitar and singing joyfully.", "The family members are talking, playing instruments, and singing together in a happy and joyful mood.", "Four people are sitting and enjoying themselves by playing music and singing, with one woman dancing while sitting."]}, "5211051388": {"audio_captions": ["The child is singing a song.", "A child is singing while the music is playing.", "A baby is singing a song."], "visual_captions": ["A girl is playing the piano.", "The baby is playing a toy piano.", "The baby was playing with a piano."], "audio_visual_captions": ["A girl is playing a toy piano and singing a song loudly.", "The child is watching TV and the child is singing music.", "A girl is singing in the house."], "GPT_AV_captions": ["A girl is playing a toy piano and singing a song.", "A child is singing while playing a toy piano.", "A baby is singing and playing a piano."]}, "5211277413": {"audio_captions": ["A lady is talking to another.", "Some people are talking among themselves.", "A woman is talking to someone."], "visual_captions": ["One team is discussing the meeting and coffee time, while the other team is playing a game.", "It is a family and friends gathering, and they are enjoying the day.", "A group of women is discussing at a table with a man. Three men at another table are arranging something on a table."], "audio_visual_captions": ["A group of people gathered in a house and some of them are finishing up a puzzle.", "Some people are sitting in a group and having snacks, while others are playing a game.", "Some people are playing with the puzzle blocks."], "GPT_AV_captions": ["A group of people gathered in a house, some discussing at a table while others are playing a game.", "A family and friends gathering where some are finishing a puzzle and others are having snacks.", "A group of people enjoying the day, with some talking and others arranging something on a table."]}, "5216965406": {"audio_captions": ["The mother spoke to one child.", "A little boy is shouting in the house, and then the mother speaks to the boy.", "Two children are speaking loudly.", "The babies are speaking in the scene."], "visual_captions": ["Two babies are playing with their toys.", "Four children are playing with toys.", "Three babies are playing with the toys and the babies are having a happy moment."], "audio_visual_captions": ["The children are playing with toys.", "The two children were playing.", "The two children are playing.", "Two babies are playing with the toys and assembling them."], "GPT_AV_captions": ["Two children are playing with toys and assembling them while the mother speaks to one child.", "Two children are playing with toys and the mother speaks to one of them.", "Two children are playing with toys and the mother speaks to one child."]}, "5219718493": {"audio_captions": ["Men and women are laughing, and I think they are playing.", "The friends are talking funny in the park while they are enjoying themselves.", "The women's conversations can be heard."], "visual_captions": ["A few women are hanging off the edge of a monument.", "Three girls are enjoying the play.", "A group of girls is playing in the park.", "They are hanging using the bar."], "audio_visual_captions": ["Three women are disrespecting the monument of St. Catherine by using it to perform pullups.", "The two ladies were playing to do pull-ups.", "There are three women hanging from a stick.", "Three girls are hanging and playing near the steel bar close to the statue.", "The ladies are hanging in the statue rod."], "GPT_AV_captions": ["Three women are laughing and talking while hanging from a bar near a monument in the park.", "A group of women is enjoying themselves, performing pull-ups on a bar close to a statue.", "Three girls are playing and talking near a monument, using a bar for pull-ups."]}, "5219728337": {"audio_captions": ["The women and man are talking and laughing very loudly.", "The people are happily laughing and playing a game.", "The mother and father were talking to their baby, and the baby was saying something but not intelligible."], "visual_captions": ["Two girls are playing with children.", "Two girls are attempting to play with two babies together.", "Two children were playing with their mother.", "Two ladies attempt to make their babies stand without their supports.", "Two children are playing on their mother's lap."], "audio_visual_captions": ["Many people are playing with two babies.", "Two children are laughing and two women are talking loudly, with people in the background also talking.", "Family members are taking their pictures."], "GPT_AV_captions": ["Two women are talking and laughing loudly while playing with two babies.", "Two children are laughing and playing on their mother's lap as people talk in the background.", "Family members are happily interacting and taking pictures with the babies."]}, "5223035448": {"audio_captions": ["This baby is very cute and brings joy to their parents by making sounds.", "A baby begins to talk with her mother.", "The baby is trying to speak."], "visual_captions": ["A baby is playing with its mom.", "A baby was playing and speaking for the first time.", "The baby is very cute and smiles a lot."], "audio_visual_captions": ["A child is with their mom and the child is making a sound.", "The toddler is murmuring one of her first words.", "A baby is with their mother and saying something.", "A child and her mother are in a video call."], "GPT_AV_captions": ["A baby is with her mother, making sounds and trying to speak.", "The baby is very cute, smiling a lot, and playing with her mom.", "A child is with her mom, murmuring one of her first words."]}, "5224502522": {"audio_captions": ["A man hears a playing guitar and sings a song.", "Someone is playing such good music on the guitar.", "The men were playing music and singing songs."], "visual_captions": ["A man is playing the guitar for his friends.", "A man sings a song for his girl.", "The man is singing and  playing the guitar."], "audio_visual_captions": ["A man is sitting on top of an armchair, playing the guitar and singing.", "The man plays music on the guitar.", "He plays the music with a guitar."], "GPT_AV_captions": ["A man is playing the guitar and singing a song.", "A man is sitting on an armchair, playing the guitar and singing.", "A man is playing the guitar and singing for his friends."]}, "5224805531": {"audio_captions": ["This baby's parents are happy and enjoying singing birthday song very much.", "Birthday wishes for some children.", "A group of people is singing the birthday song and going to the party."], "visual_captions": ["It is a birthday party, and all the family and friends have gathered to celebrate.", "A child is celebrating their birthday.", "The family members are enjoying the baby's birthday."], "audio_visual_captions": ["A group of people are celebrating the baby's birthday.", "Family and friends gather around a table to celebrate the birthday of a young boy.", "A group of family members is celebrating the baby's birthday."], "GPT_AV_captions": ["A group of people are celebrating a baby's birthday with singing and joy.", "Family and friends gather around a table to celebrate a child's birthday.", "The family members are enjoying the baby's birthday party together."]}, "5237219621": {"audio_captions": ["The people are all thinking and chatting in the same way.", "One lady is speaking while others in the background are speaking and laughing.", "The woman is talking with her friends and family.", "A woman is speaking with members of her family."], "visual_captions": ["The lady was speaking with her friends and family.", "Four people are speaking.", "Four members are speaking.", "Three girls and one boy are having a jolly conversation."], "audio_visual_captions": ["The women are talking with their family members.", "The youth group is discussing ways to assist young people in their locality.", "The lady is having a serious conversation with her family members.", "A woman is saying something.", "A group of people was discussing."], "GPT_AV_captions": ["A woman is speaking with her friends and family.", "Four people, including three girls and one boy, are having a conversation.", "The group is discussing ways to assist young people in their locality."]}, "5254195028": {"audio_captions": ["The people are talking there is background voice.", "The person is speaking.", "People are talking and playing a song in the background."], "visual_captions": ["The mom and son are funny.", "A baby is playing with things in the hospital.", "A mother was carrying a child who was trying to play.", "A mother and baby are talking."], "audio_visual_captions": ["A baby and her mom are playing.", "A baby and mother are playing together.", "The woman was playing and listening to the baby.", "The mother and baby were laughing in this video.", "The child was trying to take a spoon, and the mother took it and gave it to him."], "GPT_AV_captions": ["A mother and baby are playing and talking while a song plays in the background.", "The mother and baby are laughing and interacting, with the baby trying to play with objects.", "A woman and her child are enjoying each other's company, with background voices and music."]}, "5254866216": {"audio_captions": ["Some people are seriously talking to the other members.", "Many people are talking, but nothing can be heard due to the noise.", "Family members are talking."], "visual_captions": ["The grandfather is taking about his dogs.", "An old man is playing with his dogs.", "The two dogs enjoyed playing with the grandfather.", "There is an old man sitting on a sofa and playing with his dog."], "audio_visual_captions": ["A grandfather is playing with their dogs.", "The dog is playing at home.", "A man enjoying himself with a dog.", "The older man is playing with dogs."], "GPT_AV_captions": ["An old man is playing with his dogs while family members are talking in the background.", "A grandfather is sitting on a sofa, enjoying time with his dogs as people talk around him.", "The older man is interacting with his dogs at home amidst the noise of family conversations."]}, "5263195812": {"audio_captions": ["Two humans are speaking.", "A man was speaking to another person.", "One person is asking some questions to another person, who is answering.", "Two people are speaking and discussing a topic."], "visual_captions": ["Two men are speaking, one is a general.", "The police officer is speaking.", "Two officers are talking seriously.", "It was an official meeting with leaders."], "audio_visual_captions": ["A speech of two individuals.", "The president was interviewing an army man in his castle.", "Two officers are discussing something.", "The soldier and the man are talking to each other."], "GPT_AV_captions": ["Two men, one a general, are speaking and discussing a topic.", "Two officers are talking seriously in an official meeting.", "The president is interviewing an army man in his castle."]}, "5265004457": {"audio_captions": ["A man and a woman are talking to each other, while other people are talking in the background.", "Men and women are discussing cooking details.", "There is a conversation between one man and one woman."], "visual_captions": ["The little boy is eating the food while someone is watching.", "The boy is eating his food while speaking.", "The child is eating very well.", "The little boy is eating food."], "audio_visual_captions": ["The boy is eating food while his mother is recording it.", "The baby was eating with chopsticks.", "A boy is using a chopstick to eat."], "GPT_AV_captions": ["A boy is eating food while his mother is recording it, and a man and a woman are talking in the background.", "The boy is eating with chopsticks while a man and a woman discuss cooking details.", "A child is eating very well with chopsticks as a man and a woman converse nearby."]}, "5265614788": {"audio_captions": ["Some people are talking, and in between, there are sounds of a baby.", "A baby girl is speaking to her mother.", "A baby is crying and a little girl is speaking. The mother is also speaking."], "visual_captions": ["The baby is eating food, and the daddy is helping the baby eat.", "A Chinese child eats his food using chopsticks.", "The child is eating lunch."], "audio_visual_captions": ["The baby is getting used to eating with chopsticks.", "A baby is eating rice.", "The people are speaking loudly."], "GPT_AV_captions": ["A baby is eating food with chopsticks while people are talking loudly.", "A baby girl is eating rice with the help of her father, and her mother is speaking.", "A baby is eating lunch with chopsticks, and there are sounds of people talking and a baby crying."]}, "5267923023": {"audio_captions": ["A group of people is talking.", "The family made an order at the hotel.", "A person is talking with his wife."], "visual_captions": ["This family was enjoying dinner at a hotel.", "The friends met at the hotel and they were ordering the food.", "Many people are talking in the restaurant.", "There is a group of people having a party in the hotel."], "audio_visual_captions": ["The group of girls in the hotel is discussing ordering food.", "They are ordering some food and sandwiches.", "The friends met at the hotel to enjoy food and have a good time laughing.", "Friends are deciding on a suitable menu at a hotel and planning to have a great time."], "GPT_AV_captions": ["A group of people is talking and enjoying dinner at a hotel, deciding on a suitable menu.", "Friends met at the hotel to order food and have a good time laughing and discussing.", "The family and friends are at a hotel, ordering food and planning to have a great time."]}, "5273185164": {"audio_captions": ["A man and child are laughing and talking.", "Many people are talking in the background.", "A man and a woman were speaking. The man was shouting.", "The family is speaking very nicely."], "visual_captions": ["Daddy is carrying the baby while mommy is feeding food to the baby.", "The father and mother are interacting with each other while sitting in the dining area. The mother is feeding food to the baby.", "The mother was feeding food to the child, who was eating.", "The baby is eating lunch."], "audio_visual_captions": ["The mother feeds the baby.", "A child is eating the food.", "A woman is feeding her baby.", "The baby is sitting, and the baby's mother is feeding the baby."], "GPT_AV_captions": ["A mother is feeding her baby while the baby is eating.", "A man and a woman are talking while the baby is being fed.", "The family is interacting in the dining area with the baby eating."]}, "5278313911": {"audio_captions": ["The baby is playing and talking.", "The baby is playing with the toys and making loud sounds. The baby is talking with the mom and playing with even more sound.", "The baby was playing and trying to speak.", "A baby is practicing saying a word while an adult repeats the word to them a few times, and something is shuffling in the background."], "visual_captions": ["The mother is feeding her baby.", "The mom is feeding the food to her boy.", "The mother teaches the child how to eat.", "The mother is feeding her son food."], "audio_visual_captions": ["The mother is feeding the food to her son. The child is eating food with a spoon.", "The boy and mother are sitting on a chair. Then, the mother is feeding food to her son.", "A child was eating the food.", "The mother feeds her son and they take care of each other.", "A mother is feeding the baby."], "GPT_AV_captions": ["The mother is feeding her baby while the baby is playing and talking.", "The mother is feeding her son food as he tries to speak and play with toys.", "The mother and her son are sitting on a chair; she feeds him while he makes sounds and practices words."]}, "5284382213": {"audio_captions": ["It was raining and there were sounds of thunder. It was very loud.", "There is the sound of strong wind.", "The rain and wind are background sound."], "visual_captions": ["A person is taking a photo with the McDonald's toy.", "The boy was sitting on the bench, and then another boy clicked a photo.", "A man is taking photos in the snow."], "audio_visual_captions": ["The people take a photo of the doll.", "A person is sitting on the bench next to a statue while another person takes photos of them.", "A man is taking a photo with a statue.", "A man is playing with the MacDonald mascot."], "GPT_AV_captions": ["A person is sitting on a bench next to a statue while another person takes photos of them, with the sound of rain, thunder, and strong wind in the background.", "A man is taking photos with a statue amidst the sounds of rain and wind.", "A person is taking a photo with a McDonald's toy while it is raining and windy."]}, "5286758447": {"audio_captions": ["The female singer is singing the song.", "The girl is singing.", "A group of people are listening to the music and joining the family in singing and dancing."], "visual_captions": ["A mother and her young child are interacting with each other in the living room, with many people behind them.", "The family is watching TV.", "The child is singing the song and enjoying the family."], "audio_visual_captions": ["The family is watching TV programming and fully enjoying it.", "Two girls are singing in their home.", "They enjoy listening to a song and singing it together as a group.", "One child and one lady are singing at home. Another lady is watching, and one child is playing with a cap."], "GPT_AV_captions": ["A family is watching TV and enjoying the music together in their living room.", "A girl and a woman are singing while others join in and dance.", "A mother and her child interact while the family sings and enjoys the music."]}, "5287251474": {"audio_captions": ["Some people are talking and laughing with each other.", "The man and woman are discussing something.", "The man speaking is very happy."], "visual_captions": ["The man is video calling with the child.", "The people are speaking to someone.", "The man was talking to his son on the phone."], "audio_visual_captions": ["A man was having a conversation with his son during a video call.", "A man is on a video call with a child.", "A man is speaking with someone through a video call on his phone."], "GPT_AV_captions": ["A man is having a happy conversation with his son during a video call.", "The man is speaking and laughing with his son on a video call.", "A man and a child are discussing something happily over a video call."]}, "5293233413": {"audio_captions": ["A man is talking to another man while a woman is laughing.", "Two men are speaking very quietly.", "A man is asking something, then a woman is laughing about the speech."], "visual_captions": ["A dog is watching TV with its owner.", "The dog is watching television.", "The girl and the dog are watching the movie inside the house.", "A dog is watching the television."], "audio_visual_captions": ["A girl was watching TV with her dog.", "A woman and a dog were watching television.", "The dog is watching TV at home.", "The dog is watching another dog on TV, and the girl next to the dog is smiling at the dog.", "The dog was watching television."], "GPT_AV_captions": ["A girl and a dog are watching TV at home while two men are speaking quietly.", "A girl and her dog are watching TV, and a man is talking to another man while a woman laughs.", "A girl and her dog are watching TV, and a man is asking something, making a woman laugh."]}, "5295188880": {"audio_captions": ["The people are speaking loudly and talking.", "A man and a woman were laughing, and the background was very noisy.", "The girl is laughing loudly.", "People are speaking and laughing about something.", "People are talking and laughing loudly."], "visual_captions": ["The dog was playing very nicely.", "The dog is playing with its owner.", "The boy was playing with the dog.", "A dog is playing with one person.", "A dog is playing with a man. He is enjoying himself with the dog."], "audio_visual_captions": ["The dog plays and jumps with its owner.", "A dog is playing with one man.", "The owner and the dog are playing, another dog is watching."], "GPT_AV_captions": ["A dog is playing and jumping with a man while people are talking and laughing loudly in the background.", "The man and the dog are enjoying themselves, with another dog watching, amidst loud conversations and laughter.", "A man and a dog are playing together, surrounded by people speaking and laughing loudly."]}, "5296671076": {"audio_captions": ["Mom and her baby are talking loudly and laughing together.", "The couple is laughing, and their baby is also laughing.", "The parents in the discussion are happy and enjoying their good baby. They are speaking and laughing, enjoying their child."], "visual_captions": ["The father is teaching his child to dress in a careful and happy manner.", "A child is playing with his father.", "The father and child are playing with each other."], "audio_visual_captions": ["The little boy is dancing and playing around.", "The baby is playing with fake hair with their father.", "The baby is participating in the drama practice.", "The baby is playing with the father.", "The father dressed his son like a king, and their family is enjoying it."], "GPT_AV_captions": ["The father is playing and laughing with his baby, and the family is enjoying their time together.", "The baby is playing with his father, who is teaching him to dress and participate in a fun activity.", "The family is happy and engaged, with the father and baby laughing and playing, creating joyful moments."]}, "5303332305": {"audio_captions": ["A small baby was saying something.", "A little boy is singing the rhymes.", "A child is talking with his/her mom while a vehicle sound is playing in the background."], "visual_captions": ["A child is speaking on a toy phone while sitting in the dining area.", "A boy was speaking and playing.", "The child is playing with a walkie-talkie."], "audio_visual_captions": ["The boy set up a train track on the table and pretended to be a traffic man.", "The baby boy acts like an actor, speaking on the phone and playing with his mother and a toy train.", "A child is playing a train game.", "A young boy is speaking into a microphone while there are people talking in the background and the sound of a train.", "A boy is speaking with a walkie-talkie and giving commands to someone."], "GPT_AV_captions": ["A child is speaking on a toy phone while sitting in the dining area, with vehicle sounds in the background.", "A boy is playing with a toy train and speaking into a walkie-talkie, pretending to be a traffic man.", "A young boy is talking to his mother while playing with a toy train and a walkie-talkie, with background noise of people and a train."]}, "5305581718": {"audio_captions": ["The girl is talking.", "The parents asked the kid some questions, and the kid answered the questions while laughing.", "One woman is speaking with a baby while she is playing with a child."], "visual_captions": ["A mother and her child are cooking.", "A mother is making snacks for the child.", "The mother is preparing something, and the boy is helping her.", "A mother and son are in the kitchen, preparing food."], "audio_visual_captions": ["A mother and her son are cooking in the kitchen.", "The baby is cooking with the mother.", "A mother and child were preparing a dish and tapping the pan for cooking.", "The baby tried to cook with the mother."], "GPT_AV_captions": ["A mother and her child are cooking in the kitchen, with the child helping and laughing.", "The mother is preparing food while talking and playing with her child.", "A mother and her son are making snacks together, with the child tapping the pan."]}, "5306545201": {"audio_captions": ["This music had such a beautiful melody.", "A musical instrument is playing in the background.", "A musical instrument is played."], "visual_captions": ["Both men are playing a guitar and enjoying the music.", "Two boys are playing the guitar.", "Two people are playing the guitar and enjoying themselves.", "Two men are playing the guitar and singing."], "audio_visual_captions": ["Two men are playing the guitar.", "Two men are playing the guitar. It was very nice.", "The two men playing music.", "The musicians are playing the guitar.", "They play the guitar."], "GPT_AV_captions": ["Two men are playing the guitar and enjoying the music.", "Two men are playing the guitar with a beautiful melody in the background.", "Two people are playing the guitar and singing, enjoying themselves."]}, "5308844630": {"audio_captions": ["Two women are talking nicely to children.", "The girl is very happy.", "It sounded like waves."], "visual_captions": ["A man and a dog are walking on the road.", "The dog is walking around the street while its owner is feeding it dog food.", "The woman is taking the dog for a walk in the street and recording the dog.", "The woman was trying to take a selfie with her dog, and she gave a biscuit to her dog. The man was showing the dog's teeth.", "One woman is walking with a dog and giving some food to the dog."], "audio_visual_captions": ["A dog is playing with a toy and the girl was taking a selfie with the dog.", "A dog and its owner went for a walk.", "A dog and a person are walking on the road."], "GPT_AV_captions": ["A woman is walking with a dog on the road and giving it some food while recording a video.", "A dog and its owner are walking on the street, and the woman is taking a selfie with the dog.", "A dog and a person are walking on the road, and the woman is feeding the dog."]}, "5309902755": {"audio_captions": ["Some people are playing musical instruments.", "Some musical instruments are playing loudly.", "Someone is currently playing the violin."], "visual_captions": ["Two individuals are playing music.", "One person is playing the violin while the other is teaching how to play the violin.", "A small girl is practicing with the violin."], "audio_visual_captions": ["The kid plays the violin.", "A boy is playing a violin at a Christmas function.", "A girl is playing music with an instrument while another lady is holding notes.", "One lady and one girl are playing the violin at the Christmas function.", "A music teacher gives violin practice to her student."], "GPT_AV_captions": ["A girl is playing the violin while a lady is teaching her.", "A child is practicing the violin with guidance from a music teacher.", "A girl and a lady are playing the violin together."]}, "5310031663": {"audio_captions": ["The song is currently playing in the background.", "One person is working while background songs are playing.", "The person is singing and playing the instrument."], "visual_captions": ["Somebody was preparing a cup of tea.", "A person is pouring milk into the coffee and stirring it thoroughly.", "A person is preparing tea."], "audio_visual_captions": ["They made a coffee and stirred it with a spoon.", "The girl is preparing the tea, and it was very tasty.", "A lady is making tea with a teapot, and it is very clear.", "Someone is making coffee to drink."], "GPT_AV_captions": ["A person is preparing tea while a song plays in the background.", "A person is making tea and stirring it thoroughly while music plays.", "A person is preparing a hot beverage with background music."]}, "5311367704": {"audio_captions": ["The child is speaking to the father.", "The father and the child are having a conversation with each other.", "The baby is talking and someone is speaking about some related matters.", "Child talking to the dad."], "visual_captions": ["The boy is playing with his father.", "The father and the boy are sitting on the floor, and the father is taking some snacks and putting them in a bowl.", "The father is cutting the fruits while the boy is watching."], "audio_visual_captions": ["The father was cooking food for her son.", "The father and son were cutting fruit. The son was watching the father do the work.", "The dad and son are playing with the food.", "The boy and his father are cleaning a pumpkin."], "GPT_AV_captions": ["The father and the boy are sitting on the floor, having a conversation while the father prepares food.", "The father is cutting fruits and putting them in a bowl as the boy watches and talks to him.", "The father and son are interacting and playing with food, including cleaning a pumpkin."]}, "5312036289": {"audio_captions": ["The woman was clapping and enjoying the moment with loud sounds. She was talking to many people and clapping. At the end, the sound of a dog also appeared.", "People are happily playing an indoor game while a dog is barking in the background.", "People are speaking to each other, clapping and enjoying."], "visual_captions": ["Two children are playing with the toys.", "A child is playing with the toys, and another child is beside him. There are many toys beside them.", "A girl is playing with toys on the floor and speaking with her mom.", "Two babies are playing with toys."], "audio_visual_captions": ["Two little kids are playing together.", "Two children are playing with the toys in the house.", "A little boy and a girl are playing together with some toys.", "Two children are playing the game and one woman is encouraging them to play."], "GPT_AV_captions": ["Two children are playing with toys while a woman claps and encourages them.", "A little boy and a girl are playing with toys, and people are happily talking and clapping.", "Two kids are playing with toys indoors, and a dog barks in the background."]}, "5312870730": {"audio_captions": ["A young lady is mocking another guy for stealing her dessert, while making others laugh.", "A man and a boy are having a nice conversation.", "A man and some people are speaking and talking."], "visual_captions": ["The magician entertained the audience, and it was very interesting.", "Two boys are acting in a drama.", "Two boys are performing in a stage drama."], "audio_visual_captions": ["A small boy was talking to the man while people in the background were laughing.", "Two male students perform a scene on stage and elicit laughter from the audience at the end.", "Two people are acting on the stage."], "GPT_AV_captions": ["A young lady mocks a guy for stealing her dessert, making others laugh, while a man and a boy have a conversation in the background.", "Two boys perform a scene on stage, eliciting laughter from the audience.", "A small boy talks to a man while people in the background laugh, and two boys act in a stage drama."]}, "5317259686": {"audio_captions": ["Many people are speaking loudly and laughing very noisily.", "A man and a woman were talking.", "The group of friends was shouting and speaking with someone else.", "A lady and and a man are talking."], "visual_captions": ["The cat is sitting in the lap of the man while the dog is watching.", "The cat is sitting on the man.", "A puppy is walking out of the room, and a man is holding a kitten in his hand."], "audio_visual_captions": ["Two men were playing with the dog and the cat.", "A man was sitting on a chair at the house with his cat, and the place was very noisy.", "The two cats and the family are celebrating Christmas in the house.", "There are two men playing with the cat and the dog."], "GPT_AV_captions": ["A man is sitting with a cat in his lap while a dog watches, and people are talking and laughing loudly.", "Two men are playing with a cat and a dog in a noisy house.", "A group of friends is celebrating noisily while a man holds a kitten and a puppy walks out of the room."]}, "5319163326": {"audio_captions": ["The members of the band are playing the musical instruments.", "Musical instruments are being played in the room.", "Playing music and one person talks at the end.", "A man is enjoying the music while playing the drums.", "The young man is playing the music."], "visual_captions": ["The child plays the musical instruments.", "The boy is playing the drum instrument.", "The boy is learning to play music."], "audio_visual_captions": ["The mother and son are sitting in the room. The mom was playing the guitar and the son was playing the drums.", "The son is playing a drum, and the mother is playing a guitar.", "The boy is playing the drums, and his mom is playing the guitar.", "The sister and brother are playing music at home.", "The boy is playing an instrument."], "GPT_AV_captions": ["A boy is playing the drums while his mother plays the guitar in the room.", "The mother and son are playing musical instruments together.", "A young boy is learning to play the drums as his mom plays the guitar."]}, "5323209509": {"audio_captions": ["Men and women are talking to a child who is unwrapping a present.", "Three members are talking loudly, and a baby's voice is cute.", "A mother and child are speaking about something.", "People are talking and a baby is speaking loudly."], "visual_captions": ["A little girl is opening a present.", "A child is opening a gift that was given to her by her parents.", "The baby is opening a gift."], "audio_visual_captions": ["The child is opening a gift and is extremely delighted to find a kitchen set box.", "A girl baby is talking with a lady.", "A baby girl is opening the gift wrapping."], "GPT_AV_captions": ["A baby girl is opening a present while people are talking around her.", "A child is unwrapping a gift and is delighted to find a kitchen set box.", "A little girl is opening a gift and speaking with a woman."]}, "5323579442": {"audio_captions": ["A piano is being played.", "A man was playing the piano.", "The piano, a musical instrument, has started playing music."], "visual_captions": ["The girl is playing the musical instrument while others are watching.", "The girl is playing the musical instrument.", "A girl is playing the piano. A woman and a man are talking.", "The girl is playing the piano by using sheet music.", "The girl is playing the piano while the husband and wife are talking and drinking some liquor."], "audio_visual_captions": ["The girl is playing the piano very well.", "The girl is playing the music nicely.", "A young woman was playing the piano in her home.", "The young girl is sitting near the piano and playing music. Behind the girl, a young little boy is walking to the TV. There is a young couple sitting on the sofa. The young girl is smiling and has finished playing the music.", "A girl is playing music on the piano."], "GPT_AV_captions": ["A girl is playing the piano while a couple is talking and drinking.", "The girl is playing the piano using sheet music, and a young boy is walking to the TV.", "A girl is playing the piano very well, and a couple is sitting on the sofa."]}, "5328004991": {"audio_captions": ["A mother and son are talking.", "A woman is talking to someone while kids are shouting in the background.", "Two people are speaking with each other about a project and work.", "A mother is talking to her son while some sounds can be heard in the background."], "visual_captions": ["The mother and children are cooking in the kitchen.", "A baby plays with vessels in the kitchen with his mom.", "The baby is trying to cook, and mommy is teaching the child.", "The child is cooking in the kitchen."], "audio_visual_captions": ["The small boy is cooking on his own mom.", "A boy is cooking something with his mom.", "The kid is cooking at home."], "GPT_AV_captions": ["A mother and her son are cooking together in the kitchen while kids are shouting in the background.", "A woman is teaching her child to cook, and they are talking about a project and work.", "A mother and her son are cooking, and a baby is playing with vessels in the kitchen."]}, "5332054914": {"audio_captions": ["Someone is walking and breathing heavily. Occasionally, a beep sound can be heard. Additionally, there is the sound of a child talking.", "There was someone speaking with a low voice.", "There is some noise, with a baby shouting."], "visual_captions": ["A baby who is about five or six months old is crawling and playing with toys, and he also wants to play with the computer.", "A young child is crawling on the bedsheet and moving towards the laptop.", "The baby is practicing crawling across a mat and passes some toys in order to reach a laptop that is sitting on the corner of the mat."], "audio_visual_captions": ["The baby is playing on the floor and then going to play with the laptop.", "The baby is playing on the floor and crawling towards the laptop.", "The baby is playing games at home.", "The cute baby is playing with toys."], "GPT_AV_captions": ["A baby is crawling on the floor, passing toys, and moving towards a laptop while making noises.", "A baby is playing on the floor, occasionally making sounds, and heading towards a laptop.", "A baby is practicing crawling on a mat, surrounded by toys, and moving towards a laptop."]}, "5343144349": {"audio_captions": ["The young child is making noise while people are discussing in the background.", "The baby is shouting while people are talking in the background.", "Some children are playing and speaking."], "visual_captions": ["A boy is eating breakfast at the dining table.", "A boy is eating something while people are walking around him.", "One child is eating at the table.", "The boy is eating the food.", "A boy is sitting on the chair and eating cake while someone is watching in a room."], "audio_visual_captions": ["The child was eating food.", "The kid is eating the cake.", "The boy is eating cake with a spoon.", "A little boy is eating a cake.", "The boy is eating and making a sound."], "GPT_AV_captions": ["A boy is eating cake at the dining table while people are talking in the background.", "A child is eating cake with a spoon while others are discussing nearby.", "The boy is eating cake and making noise as people converse around him."]}, "5344655615": {"audio_captions": ["The piano is playing in the background.", "A pianist is playing the piano with some well-written lyrics.", "Someone is playing a keyboard musical instrument."], "visual_captions": ["The man is playing a piano.", "A person is playing the piano.", "The boy is using a musical instrument.", "A boy is playing the music keyboard."], "audio_visual_captions": ["A man is playing a keyboard and it sounds like nice music.", "A boy is playing his piano.", "The boy is playing the musical instrument."], "GPT_AV_captions": ["A man is playing the piano, creating nice music.", "A boy is playing a keyboard musical instrument.", "A person is playing the piano with well-written lyrics."]}, "5348154608": {"audio_captions": ["The parents are enjoying themselves with the baby and causing the baby to laugh.", "The people are speaking to someone.", "The baby and parents are playing small games."], "visual_captions": ["A woman and a man are playing with a little baby.", "A person is playing with her baby.", "The parents are playing with the baby and the baby is crawling around.", "The parents are playing with their baby."], "audio_visual_captions": ["There is a baby, and both his mother and father are present. The baby is adorable, and he is smiling and having a good time.", "The parents are enjoying watching their baby play and smile.", "The mother and father are watching their son playing on the bed.", "A mother is engaged in play with her child."], "GPT_AV_captions": ["The parents are playing with their baby, making the baby laugh and smile.", "A mother and father are enjoying their time with their adorable baby, who is crawling around and having fun.", "The parents are watching their baby play and smile, engaging in small games together."]}, "5349766264": {"audio_captions": ["A musical instrument is being played and both men and women are singing a song.", "The members of the music crew are performing together.", "The person plays musical instruments and sings songs.", "They are playing the music and singing a song."], "visual_captions": ["The group of friends is composing a music album and they are enjoying themselves.", "Some boys and one girl are singing together while someone is playing instruments.", "The group of friends is composing a music album and they are enjoying singing.", "A group of people is sitting in one room, playing musical instruments and singing songs."], "audio_visual_captions": ["A music team was playing the music, and it was very lovely. It feels good to hear.", "The group of friends is singing songs.", "A group is singing in the room.", "The person plays musical instruments.", "The men are playing a musical instrument."], "GPT_AV_captions": ["A group of friends is sitting in a room, playing musical instruments and singing songs.", "The music crew is performing together, enjoying themselves while composing a music album.", "Both men and women are singing a song, and the music being played is very lovely."]}, "5350306994": {"audio_captions": ["The mother is speaking to the baby and telling him something.", "A woman is speaking and enjoying herself with her children.", "The baby is making a noise.", "A person is speaking with a baby."], "visual_captions": ["A baby is playing with the cup.", "A child is eating food at the dining table and is also drinking water.", "The baby is eating and playing.", "A baby boy is sitting in the chair and playing with his bottle of water."], "audio_visual_captions": ["The baby is playing and shouting at her mommy or another person.", "The baby is sitting on the chair and drinking water from a water bottle. The mom asks the baby to clap. The baby also claps and shouts loudly, enjoying the moment with the mom.", "The baby is holding a bottle and following their mother's instructions.", "The boy was eating and playing with the water bottle."], "GPT_AV_captions": ["A baby is sitting on a chair, playing with a water bottle, and making noise while interacting with his mother.", "The mother is speaking to her baby, who is eating and drinking water, and the baby claps and shouts in response.", "A baby boy is enjoying himself, playing with a cup and bottle, while his mother talks to him and asks him to clap."]}, "5351925965": {"audio_captions": ["The people are talking and laughing.", "One woman is speaking with someone.", "All of the family members are talking and laughing."], "visual_captions": ["A woman is playing with a bird.", "A bird is playing with the woman.", "The person is enjoying the snowfall."], "audio_visual_captions": ["They are enjoying the snow and having tea.", "The people is visiting the snow and enjoying the moment.", "A person gave food to a bird, but the bird came and went."], "GPT_AV_captions": ["A family is talking and laughing while enjoying the snowfall.", "A woman is playing with a bird as everyone enjoys the snowy moment.", "They are having tea and enjoying the snow together."]}, "5352412169": {"audio_captions": ["There is a lot of simultaneous conversation happening.", "Many people are speaking something.", "There is a lot of chatter among people in a crowded place.", "A group of members is conversing with one another and having a good time.", "A group of people are having conversations with their friends and family."], "visual_captions": ["Three people are fighting in the kitchen.", "Three male friends are playing.", "Three boys are playing in the kitchen and punching each other in their shoulders.", "Three guys are playfully fighting with each other for fun.", "Three boys are playfully fighting in the room."], "audio_visual_captions": ["Three friends are playing at the kitchen.", "Three men were playing and kicking with each other.", "Three men are participating in a boxing match and laughing.", "Three boys are practicing fighting in the kitchen."], "GPT_AV_captions": ["Three friends are playfully fighting in the kitchen while having conversations with each other.", "Three boys are having a good time, playfully punching and kicking each other in the kitchen.", "A group of friends is in the kitchen, engaging in playful fighting and chatting simultaneously."]}, "5353485791": {"audio_captions": ["A person is speaking.", "The woman is laughing and speaking to somebody.", "Two women were talking and enjoying themselves with the kids. A baby was blabbering.", "A woman is speaking."], "visual_captions": ["A baby is playing with two women.", "One child is playing with his family.", "Two ladies are playing with the child."], "audio_visual_captions": ["Two ladies are playing with the baby and laughing.", "The child is playing with two women.", "Two women are playing with the baby, and the baby is walking towards them."], "GPT_AV_captions": ["Two women are playing with a baby and laughing.", "A baby is playing with two women who are enjoying themselves.", "The child is playing with two women, and the baby is walking towards them."]}, "5354842767": {"audio_captions": ["The baby is crying while the mother is laughing.", "The baby is laughing and the family members are in a happy mood.", "One woman is speaking with a baby."], "visual_captions": ["A baby and her mother were hugging and speaking joyfully.", "The child played with their mom, and she was very happy to play.", "A mother and baby were playing.", "It is a baby playing toy."], "audio_visual_captions": ["The mother and daughter are playing with each other.", "The baby is with their mother, who is caressing her, causing the girl to smile.", "A child is playing the game and laughing.", "The mother and baby are playing, smiling, and enjoying our happy life.", "A child is sitting on her mother's lap and they are both playing."], "GPT_AV_captions": ["A mother and her baby are playing and laughing together, enjoying their time.", "The baby is sitting on her mother's lap, and they are both smiling and interacting joyfully.", "The mother is caressing her baby, making her smile and laugh while they play."]}, "5356919058": {"audio_captions": ["The female is singing loudly with the accompaniment of playback music. The sound of drums and big crackers can also be heard. At the end of the song, there is also group singing.", "A song is being sung.", "Background music is played with a female voice singing."], "visual_captions": ["The girl is singing a song.", "The two girls are playing in the house and having fun singing like in a concert.", "There are two girls in one room. One girl is singing a song, and the other girl is playing in the room.", "A girl is singing and there is a white dog.", "The child is singing the song and the sister is enjoying it."], "audio_visual_captions": ["The children are singing the songs.", "A girl is singing in her home while her sister is playing.", "A girl was singing in the house while another girl was playing with her."], "GPT_AV_captions": ["A girl is singing loudly with background music while her sister plays in the room.", "A girl sings a song in the house, accompanied by playback music and the sound of drums.", "A girl is singing in her home, and her sister is enjoying it while playing."]}, "5363401248": {"audio_captions": ["A couple is talking to each other while driving in the rain.", "There is a sound of wind in the background and some people are talking.", "A man and a woman are having a conversation."], "visual_captions": ["The baby is playing on the beach and trying to collect shells.", "The baby and daddy are playing in the sand at the sea.", "The dad and little son are playing at the beach."], "audio_visual_captions": ["A small baby is playing on the beach.", "The baby boy was playing at the beach.", "The son was collecting beach stones, and the father was helping to take the stones.", "The boy is playing in the sand with his father.", "A baby is playing in the sand."], "GPT_AV_captions": ["A baby boy is playing in the sand at the beach with his father.", "The baby and his dad are collecting stones and playing in the sand.", "A man and a woman are talking while driving in the rain, with wind sounds in the background."]}, "5368243767": {"audio_captions": ["A group of people is talking and laughing together.", "The two or more people are talking and laughing.", "Some people are having a conversation.", "Many people are saying something."], "visual_captions": ["Two girls and one boy are talking, while one girl is sitting. They give flowers to the sitting girl and take a photo.", "The two people are taking a photo of the lady.", "The women and men are talking."], "audio_visual_captions": ["The woman was talking to someone in the office.", "A staff is giving flowers as a gift  to the manager.", "The team gifted flowers to their office mate.", "Two women are speaking and one of them is holding a flower."], "GPT_AV_captions": ["A group of people, including two girls and one boy, are talking and laughing together, while one girl is sitting and receiving flowers.", "The team is gifting flowers to their office mate and taking a photo.", "Two women are speaking, one of them holding a flower, as they converse and laugh with others."]}, "5379354799": {"audio_captions": ["A windy noise can be heard.", "A man is discussing his friend's outfit.", "The person is talking with their friends."], "visual_captions": ["The father and baby are looking at the flower in the garden.", "A father and child are enjoying the rainy season.", "A baby and father are walking to the garden park."], "audio_visual_captions": ["A baby and her father are walking in the garden during the rainy time with an umbrella.", "A baby is seeing the fruits with her mom or dad.", "A child and their father are looking at the flowers.", "The father and the baby were walking in the rain. The father has the umbrella.", "The baby is accompanying the elder to see the pumpkin. \n\nThe baby is going with the elder to see the pumpkin."], "GPT_AV_captions": ["A father and baby are walking in the garden during the rainy season with an umbrella.", "A father and baby are looking at the flowers in the garden.", "A father and baby are enjoying the rainy season while discussing the garden."]}, "5388595493": {"audio_captions": ["The child is playing with the mother.", "The baby was playing with her mother.", "A mother is speaking with her baby.", "A woman is talking to a girl.", "A baby is enjoying playing with his mother and making a sound."], "visual_captions": ["The child was playing the game and enjoying themselves.", "The baby is playing with the toys.", "A cute baby is happily playing with toys while someone is talking to the baby.", "A baby was playing on the floor."], "audio_visual_captions": ["The child is playing and is a very nice child.", "The baby is happily playing with the toys.", "A child was playing with her mom and the baby had a very smiley face.", "The baby is playing a game."], "GPT_AV_captions": ["A baby is happily playing with toys while the mother talks to her.", "The baby is enjoying playing with toys and interacting with the mother.", "A child is playing with toys and smiling while the mother speaks to her."]}, "5398268379": {"audio_captions": ["The children are singing the birthday song and making their birthday wishes.", "Two or more children are singing the Happy Birthday song, while a group of people is enjoying.", "The children are singing happy birthday."], "visual_captions": ["A group of children is celebrating a birthday party.", "All small girls are at the birthday celebration.", "Many babies celebrate a little baby's birthday.", "The celebration is for children on their sixth birthday."], "audio_visual_captions": ["A woman is singing the birthday song, and the children are enjoying the party.", "A small girl celebrated her birthday with her family and friends with a cake.", "Many children are celebrating a girl's birthday.", "The children are celebrating a girl's birthday.", "The children celebrate the birthday party."], "GPT_AV_captions": ["A group of children is celebrating a girl's birthday with a cake and singing the Happy Birthday song.", "Many children are enjoying a birthday party, singing and making birthday wishes.", "Children are celebrating a birthday party, singing the birthday song and having fun together."]}, "5398860552": {"audio_captions": ["The baby and the mom are talking.", "The baby is speaking with the lady.", "A young child is speaking to his mother."], "visual_captions": ["A baby girl drew a drawing and played with her mom.", "A little baby and her mom are drawing something on the board.", "There is a little girl drawing on the board.", "The child is drawing with her mom.", "The child is drawing happily."], "audio_visual_captions": ["A child is drawing.", "A child is drawing on the drawing paper, and her mother is teaching her how to draw.", "The baby draws the sheets very well.", "The baby boy was speaking and drawing on the drawing board.", "A mother and son were drawing the picture."], "GPT_AV_captions": ["A baby girl is drawing on the board with her mom.", "A young child is speaking to his mother while drawing.", "A child is drawing happily with her mother."]}, "5409193177": {"audio_captions": ["They are talking loudly in the room.", "People are talking, and someone is shouting in the background.", "Many people are talking loudly."], "visual_captions": ["Two people are experimenting with making a DJ mix.", "Two members are experimenting with the theremin.", "The two men are preparing the experiment."], "audio_visual_captions": ["A man is describing the electronic device.", "The man is playing music with the theremin.", "Two boys are standing and conducting a scientific experiment.", "There are two members in a room operating machines."], "GPT_AV_captions": ["Two people are talking loudly while experimenting with a theremin.", "Two men are in a room, preparing and describing an electronic device.", "Two boys are conducting a scientific experiment with a theremin, and there is shouting in the background."]}, "5427285434": {"audio_captions": ["The baby is speaking in a language or making sounds.", "The child is playing music loudly.", "A person is speaking and singing a song."], "visual_captions": ["The baby is playing with his father.", "The child is playing and dancing.", "A child is showing the funny dance to a women."], "audio_visual_captions": ["The child dancing while playing.", "A little boy wearing an orange hat is dancing in front of his parent.", "The kid is wearing a cap on his head.", "The boy and his father are dancing."], "GPT_AV_captions": ["A child is dancing and playing music loudly while wearing an orange hat.", "The baby is making sounds and dancing with his father.", "A little boy is dancing and showing a funny dance to a woman."]}, "5435156153": {"audio_captions": ["The baby is shouting while the woman is talking.", "A woman is talking and dogs are barking.", "The woman is speaking very slowly and the background is very calm."], "visual_captions": ["A cute baby is trying to pull the man's shoelace. A white dog is sitting nearby the man and biting a ball.", "The baby is playing with the dog.", "A child is playing with his dad."], "audio_visual_captions": ["The baby is playing with his parent's shoe.", "A baby is playing with his father's shoes, and the dog is near the baby.", "A baby is playing with his mother's shoes."], "GPT_AV_captions": ["A baby is playing with a parent's shoe while a woman is talking and a dog is nearby.", "The baby is interacting with a parent's shoe, and a dog is sitting close by.", "A baby is playing with a parent's shoe, and a dog is nearby, while a woman speaks slowly."]}, "5435506054": {"audio_captions": ["Two friends having a conversation about something.", "There are only two people talking and laughing in the background.", "Two girls are gossiping about another girl."], "visual_captions": ["A baby is playing with a dog.", "The baby is playing with a puppy dog.", "A baby and a dog are playing with toys."], "audio_visual_captions": ["A dog is playing with a boy.", "The kid was playing with the dog. It looks very adorable.", "The baby is playing with the dog."], "GPT_AV_captions": ["A baby is playing with a dog.", "A baby and a dog are playing together.", "Two friends are having a conversation while a baby plays with a dog."]}, "5449359673": {"audio_captions": ["A man frequently plays music for his wife before they have conversations.", "Men and women smile as their conversation ends.", "Two young people are talking."], "visual_captions": ["The baby is eating and the mom is happy.", "A baby was eating the food that her mother was feeding it.", "The baby is eating the food.", "A lady is feeding food to a cute baby."], "audio_visual_captions": ["The baby was eating alongside her mother.", "Mom is feeding the baby, but the baby refuses to eat it and is listening to music. Finally, the baby ate the food that mom gave.", "The baby is sitting while the mother is feeding.", "A baby is eating food from her mother, and it is very cute."], "GPT_AV_captions": ["A baby is eating food from her mother, and it is very cute.", "A lady is feeding food to a baby who is listening to music.", "The baby is eating the food that her mother is feeding her."]}, "5456274822": {"audio_captions": ["They are enjoying the music while playing musical instruments.", "Music is playing and all the people are singing songs. Some of them are shouting with joy while listening to the song.", "At the music concert, someone is playing the guitar and people are responding by making noise.", "Some people are playing music and dancing."], "visual_captions": ["They are singing a song on the stage.", "The gang was playing music.", "They are all singing and dancing."], "audio_visual_captions": ["The people are participating in a singing and dancing program.", "It was like a music concert.", "One boy is singing and two girls are dancing in the performance.", "On the stage, the man and the woman are singing.", "There is a young boy singing, as well as two girls singing and dancing. Additionally, there is an uncle playing background music on the keyboard."], "GPT_AV_captions": ["People are singing and dancing on stage during a music concert, with some playing musical instruments.", "A young boy is singing while two girls are dancing, and an older man is playing the keyboard in the background.", "The audience is enjoying the music, singing along, and making joyful noise in response to the performance."]}, "5459816888": {"audio_captions": ["A man is singing a song.", "A group of singers is singing a song with music.", "The song was extremely beautiful."], "visual_captions": ["The two boys are playing music.", "Two men are playing the guitar and making music.", "Two members are playing guitar. The music was something that I really enjoyed."], "audio_visual_captions": ["The two singers were singing the song.", "There are two people at a live concert.", "Two men are singing and playing musical instruments at a party while standing.", "The group of two men is playing music.", "There are two people and they play the guitar."], "GPT_AV_captions": ["Two men are singing and playing the guitar at a live concert.", "Two men are performing a beautiful song with guitars at a party.", "A group of two men is singing and playing musical instruments, creating enjoyable music."]}, "5460164242": {"audio_captions": ["The baby and the man are having a conversation while the song plays in the background.", "A man is singing the song in the background while a woman is talking with a boy.", "A woman is speaking while people are singing the song in the background."], "visual_captions": ["A young child is listening to the music and dancing on the floor.", "A baby and her father are dancing.", "A baby and father are dancing."], "audio_visual_captions": ["A girl is playing with a laptop.", "A baby girl saw a laptop and danced well.", "The little girl is enjoying the music while her dad is also happily dancing with her.", "A baby girl was enjoying the music and dancing well."], "GPT_AV_captions": ["A baby girl is enjoying the music and dancing while her dad happily dances with her.", "A baby girl and her father are dancing to the music playing in the background.", "A baby girl is dancing and playing with a laptop while her dad joins in the fun."]}, "5468020076": {"audio_captions": ["A woman is speaking in some other language.", "The women are talking about something.", "A woman is speaking while there is background noise.", "A woman is speaking to someone, explaining something."], "visual_captions": ["The man is working on the laptop and participating in a video call.", "A man wearing a dark long-sleeved shirt with a collar and glasses is sitting at a desk with multiple computer monitors.", "A man is working on his laptop despite his busy schedule.", "One person worked on the desktop and attended the video conference."], "audio_visual_captions": ["A man is working on his laptop and has a busy schedule.", "One person was working on his laptop.", "The man working on the computer works sincerely."], "GPT_AV_captions": ["A man wearing a dark long-sleeved shirt with a collar and glasses is sitting at a desk with multiple computer monitors, working on his laptop and participating in a video call.", "A man is working on his laptop and has a busy schedule while a woman is speaking in the background.", "One person is working on his laptop and attending a video conference, with a woman explaining something in the background."]}, "5476140602": {"audio_captions": ["Some people are talking in the background, as well as the sound of typing is heard. Additionally, someone is breathing loudly. Also music is playing in the background.", "Some music is playing in the background.", "The person is using the keyboard while a song is playing in the background."], "visual_captions": ["The cats are playing at home.", "Many cats are playing in the house.", "All of the cats are playing at home."], "audio_visual_captions": ["Many cats are playing in their house.", "The cats are happily playing all around in the background.", "Some cats are playing at home."], "GPT_AV_captions": ["Many cats are playing in the house while music is playing in the background.", "The cats are happily playing at home with the sound of typing and music in the background.", "All of the cats are playing at home as someone types and music plays."]}, "5479373398": {"audio_captions": ["There are three members speaking and background noises.", "The children are talking and their parent is interfering with them.", "A group of people is speaking in tense voices in some language."], "visual_captions": ["The mother and children were walking on the bridge. The boy was drinking a cold drink.", "They are walking on the bridge.", "The family is walking in the park."], "audio_visual_captions": ["Mom and two children were crossing the bridge.", "A family is taking a walk in the park.", "There are many people walking on the bridge.", "A family was walking on the bridge while they were speaking to each other."], "GPT_AV_captions": ["A family is walking on the bridge while speaking to each other.", "The mother and children are walking on the bridge.", "A family is taking a walk in the park."]}, "5482316216": {"audio_captions": ["The man was speaking and there were noises in the background.", "A man got stuck in dense air while driving.", "The man is inquiring about various situations that may not be very serious, and it is raining heavily late at night."], "visual_captions": ["A man is recording a video while holding something.", "There was an old man near the mountain castle, and he was admiring the beauty of the village. He also had a camera.", "On the mountain, a man is takin selfies and shows all the sides from the mountain. Another man is climbing up with a camera in hand.", "One man is talking about a mountain and a temple."], "audio_visual_captions": ["A man was taking a video at the tourist place.", "The man is taking a picture while the other man is hiking on the mountain.", "Two people enjoy the viewpoint and take photos.", "He is speaking about nature and taking photos."], "GPT_AV_captions": ["A man is recording a video and talking about nature while another man is hiking on the mountain.", "Two men are at a tourist place, one taking selfies and videos, and the other climbing with a camera.", "The men are enjoying the viewpoint, taking photos, and discussing various situations amidst background noises and rain."]}, "5489050159": {"audio_captions": ["A man is speaking at a meeting in the company.", "They are speaking louder to someone.", "The man is speaking loudly."], "visual_captions": ["Two humans are speaking in a room.", "A person is working on a laptop and talking about it.", "A man is recording a video of his friend while he is sleeping during work hours.", "One man is tired of our work, but the other man is very active.", "The men appeared sad and dull."], "audio_visual_captions": ["One person was working and fell asleep on the table because he was tired.", "The old man is looking at his laptop and worrying about his work. Then, the old man smiles and shuts down his laptop.", "A man was narrating his life story.", "Two people are talking and one person is working on the laptop."], "GPT_AV_captions": ["Two people are talking in a room, and one of them is working on a laptop.", "A man is speaking loudly at a meeting in the company while another man appears tired and falls asleep at the table.", "An older man looks at his laptop, worries about his work, then smiles and shuts it down."]}, "5494269389": {"audio_captions": ["A man is speaking loudly .", "One person was speaking as if it were a meeting.", "The person is addressing everyone."], "visual_captions": ["A man is giving a lecture and discussing the topic while others are watching it.", "An elderly man is delivering a lecture.", "The meeting is taking place in the seminar hall.", "A man is explaining to his employees."], "audio_visual_captions": ["It is a conference where one person explains in front of a group of people.", "A man is giving a lecture in Spanish in front of a classroom.", "The professor is teaching in the class room.", "The teacher is conducting a class and explaining something to the students."], "GPT_AV_captions": ["A man is giving a lecture in front of a group of people in a seminar hall.", "An elderly man is addressing everyone in a classroom setting.", "The teacher is conducting a class and explaining a topic to the students."]}, "5498241342": {"audio_captions": ["A mother talking to her kids first in english, then in spanish.", "A woman is speaking while some children are talking in the background.", "A woman is playing with a baby by having a conversation.", "There are some people talking in this scene."], "visual_captions": ["The kids are playing nicely and also fighting.", "The two babies are fighting and playing with each other.", "Two children are playing and enjoying themselves.", "Two children are playing in the bedroom."], "audio_visual_captions": ["The children were playing in the house.", "The two children were playing at home, and another child is drinking the water.", "A younger brother and an older sister are playing near the bed."], "GPT_AV_captions": ["A mother is talking to her kids in English and Spanish while they play in the house.", "Two children are playing and enjoying themselves near the bed, with another child drinking water.", "A woman is speaking while children play and talk in the background."]}, "5498668540": {"audio_captions": ["In this video, there is background noise consisting of a man shouting and children talking.", "The people are playing music.", "There is music playing in the room."], "visual_captions": ["The father and son are seeing something on a tab.", "A man is playing with his son on a tablet.", "A father and daughter are watching videos on a mobile phone."], "audio_visual_captions": ["A baby boy was playing a game with his father on a tablet.", "A man and children are scrolling on the tab.", "A child and his father are playing video games.", "A father and a child are playing with a tablet."], "GPT_AV_captions": ["A father and his child are playing with a tablet while music plays in the background.", "A man and his child are interacting with a tablet amidst background noise of shouting and children talking.", "A father and his child are engaged with a tablet, accompanied by background music and chatter."]}, "5502665217": {"audio_captions": ["People are enjoying the music very loudly.", "At the party hall, drums and other musical instruments are being played loudly, and a man is singing a rap song.", "Some songs are being played and enjoyed."], "visual_captions": ["One person is dancing in front of his friends.", "The man is wearing a white shirt and black pants. He is funny and dancing at a place where other people find it very interesting to watch.", "The girl is dancing."], "audio_visual_captions": ["The woman is dancing very cutely.", "A boy puts on a ghost show in front of his friends.", "Someone is dancing in the room"], "GPT_AV_captions": ["People are enjoying loud music at a party hall where drums and other musical instruments are being played, and a man is singing a rap song.", "A man in a white shirt and black pants is dancing in front of his friends, who find it very interesting to watch.", "Someone is dancing in the room, and people are enjoying the music."]}, "5503778096": {"audio_captions": ["The girl is making different sounds, and her mom is talking to her.", "Both a child's voice and a woman's voice can be heard.", "A young child is playing with his mother and having a great time.", "A baby is talking to its mother."], "visual_captions": ["A baby and a toddler are rolling around on a bed while looking at books.", "A girl and a boy are lying on the bed and playing.", "Two children are sleeping in the bedroom and playing.", "The two babies are playing on the bed."], "audio_visual_captions": ["A small girl is playing with her brother.", "The two children were playing on the bed. It was a very amazing and attractive moment, the child was playing with a book.", "There are two babies sleeping in the bed, while one of them is playing a video game."], "GPT_AV_captions": ["A young girl and her brother are playing on the bed, enjoying their time together.", "Two children are lying on the bed, interacting with books and having fun.", "A baby and a toddler are rolling around on the bed, with their mother talking to them."]}, "5504106604": {"audio_captions": ["Some people are enjoying the dancing and music at that moment.", "A song was playing in the background at a location.", "A man is singing while the background music is playing."], "visual_captions": ["The boys are enjoying playing music.", "Musicians are playing and singing music.", "The group of people is playing the music at the event."], "audio_visual_captions": ["The humans play the instruments.", "A group of boys are performing in the music show and enjoying themselves.", "People are playing the music at the event.", "People are enjoying playing the song at a concert with four members."], "GPT_AV_captions": ["A group of people is playing music and enjoying themselves at an event.", "Musicians are performing and singing while the audience enjoys the music.", "People are playing instruments and having fun at a concert."]}, "5504570766": {"audio_captions": ["A man is speaking to a woman, but there is noise in the surrounding area.", "Two people were talking while they were driving.", "A man and a woman are talking while a car is moving in the background."], "visual_captions": ["The rabbit was running in the snow, and the man was chasing the animal.", "The rabbit was playing in the snow.", "The dog enjoys the snow."], "audio_visual_captions": ["The man is playing in the snow with the rabbits.", "A rabbit wis playing with snow, and there is one cat.", "A rabbit is playing in the snow and being carried by a man."], "GPT_AV_captions": ["A man and a woman are talking while a car is moving in the background, and a rabbit is playing in the snow.", "A man is speaking to a woman with noise in the surrounding area, and a rabbit is being carried by a man in the snow.", "Two people are talking while driving, and a rabbit is playing in the snow."]}, "5511691883": {"audio_captions": ["It seems like the wind is blowing and there is a single animal sound heard.", "I think it's a hill station. There is a fast sound of air in the audio.", "The sound of rain was heavy and very noisy."], "visual_captions": ["The birds are eating on the ground.", "The birds are eating food.", "The birds are eating food."], "audio_visual_captions": ["The pigeons were eating grains on the street.", "Birds are walking around the tree  and observing.", "The group of birds were eating the food.", "The birds are eating food.", "The doves are walking around and eating something from the ground."], "GPT_AV_captions": ["The birds are eating food on the ground while the wind blows.", "The pigeons are eating grains on the street with the sound of heavy rain.", "Birds are walking around and eating food amidst the noisy wind."]}, "5521781780": {"audio_captions": ["People are discussing something in the background.", "Two friends are discussing a specific topic.", "This person is in a discussion and they are very happy to enjoy speaking with the child."], "visual_captions": ["They are shooting pictures of old places with the camera.", "The videographer is focusing on the taking photos of old places while two men are walking.", "Some people were visiting a tourist place with beautiful stone walls."], "audio_visual_captions": ["Two tourists visited an ancient city where people lived.", "The two tourists visited an ancient monument.", "Two tourists are touring popular destinations, including an ancient building."], "GPT_AV_captions": ["Two friends are discussing happily while visiting an ancient city with beautiful stone walls.", "Two tourists are enjoying a discussion as they tour an ancient monument and take photos.", "Two friends are visiting an ancient building, engaging in a lively conversation and capturing memories with a camera."]}, "5532742171": {"audio_captions": ["Someone is speaking and there is also music playing.", "Many people enjoy singing and dancing at the party.", "The baby is enjoying with their mother."], "visual_captions": ["The baby is playing with a ball.", "A boy is playing with the ball in the park.", "A child is playing with a ball in a park."], "audio_visual_captions": ["A young boy is playing on the ground with a ball.", "The baby was playing games and having fun in the garden.", "A baby boy is playing on the ground with grass. He is playing with a green ball. The mom is asking about the car, and there is a white car.", "The child played with the ball and suddenly started playing music, and the child began to dance."], "GPT_AV_captions": ["A child is playing with a green ball in the park while music plays in the background.", "A baby is enjoying time with their mother, playing with a ball and dancing to the music.", "A young boy is having fun in the garden, playing with a ball and dancing as music plays."]}, "5540466660": {"audio_captions": ["The mother and young child are playfully teasing their older sibling.", "The baby is playing with their parents and shouting. Both the father and mother are talking to the child and playing with them.", "A mother is talking to her child."], "visual_captions": ["The baby is holding a plastic bottle and walking smoothly.", "The baby is playing and moving around.", "The father is playing with his child.", "The baby is playing with the bottles."], "audio_visual_captions": ["A baby and their mother are talking, and the baby was playing with empty bottles, and is standing with the help of the sofa.", "The baby is playing and 'pa pa' sounds very fun to the baby. The baby then watches the mouse.", "The baby was playing and was very happy."], "GPT_AV_captions": ["The baby is playing with empty bottles and walking smoothly while the mother and father talk and play with the child.", "The baby is happily playing and moving around, making 'pa pa' sounds, and standing with the help of the sofa.", "The baby is interacting with both parents, playfully teasing and shouting, while exploring the surroundings."]}, "5541230874": {"audio_captions": ["A baby was talking, a girl was talking, and there was a song playing in the background.", "The baby is talking with their parents. A female voice is talking with the baby and playing, while some background music is present.", "The child asked something to the woman, and the woman responded happily.", "The kids and their mother are having a conversation.", "The two babies are speaking in the house."], "visual_captions": ["The babies are playing the game with toys.", "The baby is feeding the toy, and another baby is playing with the Spiderman toy.", "The kid is opening a toy and is very happy."], "audio_visual_captions": ["Two children are playing with toys, a Barbie doll and a spiderman toy.", "A girl is playing with her Barbie toy.", "Two babies are playing with toys.", "The two children are happily playing with the toys."], "GPT_AV_captions": ["Two children are happily playing with toys, including a Barbie doll and a Spiderman toy, while a woman talks to them and background music plays.", "A baby is feeding a toy while another baby plays with a Spiderman toy, and a female voice engages with them.", "The kids are having a conversation with their mother as they play with their toys."]}, "5551527400": {"audio_captions": ["The child is giggling and making playful sounds.", "A child is talking and there is background noise.", "The child is speaking to the father and the child is having fun."], "visual_captions": ["A cute baby is bathing in a bathtub and saying something to his mother.", "The baby is playing while bathing.", "A baby is currently taking a bath.", "The kid is playing while bathing."], "audio_visual_captions": ["A baby was playing in the water.", "A child was sitting in the bathtub, playing with the water, and talking to her mother.", "A baby is playing in the bathtub.", "The cute baby played in a bathtub while wearing a head mask and taken care by her mother."], "GPT_AV_captions": ["A baby is playing and giggling in the bathtub while talking to the mother.", "The child is having fun in the bathtub, making playful sounds and interacting with the mother.", "A cute baby is enjoying a bath, playing with water, and speaking to the mother."]}, "5552271623": {"audio_captions": ["There is a group of people talking loudly in the background.", "In the background, many people are talking.", "The sound of whistles are heard."], "visual_captions": ["He plays with a Rugby ball on the ground with another boy.", "Two boys are playing with a Rugby ball in the ground.", "The man is playing Rugby with his friend in the ground."], "audio_visual_captions": ["The two people are playing.", "Two men played Rugby.", "The boys are playing in the ground."], "GPT_AV_captions": ["Two boys are playing with a Rugby ball on the ground while people talk loudly in the background.", "The boys are playing Rugby on the ground with the sound of whistles and people talking in the background.", "Two boys play Rugby on the ground as many people talk loudly in the background."]}, "5554974582": {"audio_captions": ["The child was playing with their mother.", "The mother is talking to the baby.", "The child's parents are talking to the child and laughing.", "A mother and baby are speaking.", "A woman talks to the baby and the baby was laughing."], "visual_captions": ["The baby is sitting on a walker, and the baby has a cute smile on their face.", "The baby is playing with the things in the cradle.", "The baby was playing in the baby walker."], "audio_visual_captions": ["The baby was sitting in a chair, and there were some toys on the chair. The baby was laughing straight away.", "A child is playing with his toys.", "The baby is sitting in the walker, and someone is talking to the child."], "GPT_AV_captions": ["A baby is sitting in a walker, smiling and playing with toys while a woman talks to the baby.", "The baby is in a walker, laughing and interacting with their mother.", "A mother is talking to her baby who is sitting in a walker and playing with toys."]}, "5557455580": {"audio_captions": ["A woman is having fun with her baby.", "A lady and one child are shouting.", "The woman is talking to the baby."], "visual_captions": ["A woman and her baby are talking to each other and playing happily.", "A girl and a cute little baby are playing together.", "A woman is talking to her child."], "audio_visual_captions": ["A woman is interacting with her baby while the baby is looking at the camera.", "The mother was speaking to the baby.", "The woman was playing with her child."], "GPT_AV_captions": ["A woman is having fun with her baby while they play and talk to each other.", "A woman and her baby are interacting happily, with the baby looking at the camera.", "The woman is talking and playing with her child."]}, "5557751246": {"audio_captions": ["When a man began playing music and a baby started crying, the child remained silent and watched him.", "Somebody is playing the drums in the background.", "The man is playing the drums, and the baby is smiling."], "visual_captions": ["The child is playing with a ball.", "A child is playing with her ball.", "The baby is playing with the ball."], "audio_visual_captions": ["The little baby is playing with the ball.", "The baby is playing the ball game.", "The child is playing with a ball."], "GPT_AV_captions": ["A man is playing the drums while a baby is playing with a ball.", "The baby is playing with a ball and watching the man play the drums.", "The child is playing with a ball as the man plays the drums in the background."]}, "5558701375": {"audio_captions": ["People are talking and walking everywhere.", "There are some bird sounds otherwise it is very silent.", "The baby is making sounds."], "visual_captions": ["The child was walking alongside the mother.", "A mother and daughter are walking around the park, and the child is wearing a pink bag. Finally, there is a male peacock.", "A child is walking in the park with her mother and enjoying her days."], "audio_visual_captions": ["A woman and a little girl are walking somewhere, following the sound of a peacock and they see the peacock.", "The child is walking in the place and see the peacock.", " The baby and mother are walking."], "GPT_AV_captions": ["A mother and her child are walking in the park, and they hear the sound of a peacock.", "The child, wearing a pink bag, is walking with her mother and they see a peacock.", "A woman and her daughter are enjoying a walk in the park, accompanied by bird sounds and the sight of a peacock."]}, "5560177516": {"audio_captions": ["The child was playing with the car at home.", "It is a baby playing with a toy.", "The baby is shouting and playing with toys."], "visual_captions": ["A child is playing with a car and several dolls.", "A child is lying on the bed.", "A baby is playing with toys."], "audio_visual_captions": ["Newborn baby sees the toys and try to catch them.", "The baby was playing with his or her toy car.", "The kid was playing with the toys.", "The small baby is on the floor. The person starts moving the toy car while hearing the sound. The baby sees the toy and makes the sound."], "GPT_AV_captions": ["A baby is playing with a toy car and other toys.", "A child is playing with toys and making sounds.", "A baby is on the floor, interacting with a toy car and other toys."]}, "5563273949": {"audio_captions": ["The child is trying to talk with their parents.", "A woman is speaking, and there is some background noise.", "The family was playing with the child."], "visual_captions": ["The baby is playing with the ball.", "A baby is playing with a ball on the living room floor.", "The baby was playing and enjoying themselves."], "audio_visual_captions": ["One small child was playing.", "A baby is playing with a red ball and teether, while the baby's mom is talking to the baby.", "The baby plays with a ball and toys that make sounds."], "GPT_AV_captions": ["A baby is playing with a ball and toys while their mom talks to them.", "The child is playing with a ball on the living room floor as their parents interact with them.", "A baby is enjoying playing with a ball and other toys while a woman speaks in the background."]}, "5566028125": {"audio_captions": ["A woman is conversing with others.", "The woman is having a conversation with another person.", "Man and woman were talking.", "The father and mother are speaking to each other when suddenly the baby starts shouting in the background."], "visual_captions": ["The child is walking in the snow.", "The baby was playing at a park with her father.", "The father and baby are playing on the swings."], "audio_visual_captions": ["A man was playing with a child, and she feels very happy.", "The kids are playing in a park.", "The dad is happily playing with the daughter."], "GPT_AV_captions": ["A man and a woman are having a conversation while a baby starts shouting in the background.", "A father is playing with his daughter at the park, and she feels very happy.", "The father and baby are playing on the swings in the park."]}, "5569333947": {"audio_captions": ["The baby is laughing loudly and the background is noisy.", "The baby was smiling and playing a lot. There were also noise sounds, and the baby was laughing a lot.", "A baby is playing with other people while they are enjoying."], "visual_captions": ["The baby is playing in the water tub.", "The baby is taking a bath.", "The baby girl is playing while she bathes."], "audio_visual_captions": ["The baby was swimming happily in the bathroom.", "The child is playing while taking a bath.", "The baby was happily being bathed by his parents."], "GPT_AV_captions": ["The baby is laughing and playing while taking a bath in the water tub.", "The baby is enjoying a bath, surrounded by noise and laughter.", "The baby is happily playing in the water while being bathed by parents."]}, "5569974351": {"audio_captions": ["The man was teaching the classroom and children applauded.", "The person is loudly pronouncing the letters of the alphabet.", "A person is speaking about some letters.", "The baby was learning the alphabet and practicing reading and speaking in person."], "visual_captions": ["The baby is playing a puzzle game.", "A baby girl is playing a game on a mobile tablet.", "The baby is playing a game in their home.", "A baby girl is playing with the tablet.", "A cute baby is arranging letters using a mobile phone."], "audio_visual_captions": ["The baby is playing a game on a tablet, and the girl is playing the game very cutely.", "The baby is learning English.", "A baby is learning new things by using a tablet."], "GPT_AV_captions": ["A baby girl is playing a game on a tablet and learning the alphabet.", "The baby is practicing reading and speaking letters while using a mobile tablet.", "A cute baby is arranging letters and learning English through a game on a tablet."]}, "5570574289": {"audio_captions": ["A child is crying loudly while people are talking in the background.", "Some people are talking and a baby is crying.", "The child is not interested in listening to the song, but the mother is playing it."], "visual_captions": ["A baby girl is playing with her mother and is very happy.", "A toddler is playing with a tape measure and then begins to cry and run towards an adult seeking comfort.", "One child is playing with their mom at home."], "audio_visual_captions": ["The baby is crying because it injured its hand.", "A child was crying in front of his mother.", "A baby girl was crying."], "GPT_AV_captions": ["A baby girl is crying while people are talking in the background, and her mother is trying to comfort her.", "A toddler is playing with a tape measure, then begins to cry and runs towards an adult for comfort.", "A child is crying loudly, and the mother is playing a song to soothe her."]}, "5570785480": {"audio_captions": ["The parents are playing with a baby.", "They were playing music and laughing together.", "People are playing music and they are enjoying it."], "visual_captions": ["The child is dancing and enjoying with the family.", "A man is dancing with his daughter.", "The little girl is playing and dancing with her father and other family members.", "The child was playing with her father."], "audio_visual_captions": ["The child and father are playing.", "The baby girl is dancing with her parents.", "The parents are dancing for their child, and she is very happy to jump on the floor.", "The father and daughter were dancing."], "GPT_AV_captions": ["The parents are playing music and dancing with their baby girl, who is very happy and jumping on the floor.", "The father and mother are dancing and playing with their daughter, enjoying the moment together.", "The little girl is dancing and playing with her parents, who are laughing and having fun."]}, "5571838736": {"audio_captions": ["The music is playing at the party.", "The boys are playing music.", "People are enjoying the song and dancing."], "visual_captions": ["The old man is singing the song, and the boy is playing guitar while a woman plays the drums.", "A group of boys are playing some music.", "All members are composing music for television and are happy to collaborate with others."], "audio_visual_captions": ["Some boys are playing music.", "A man was singing a song while another man was playing a guitar, and a lady was beating a drum set in the house.", "The three members are playing instruments."], "GPT_AV_captions": ["A man is singing a song while a boy plays the guitar and a woman plays the drums at a party.", "People are enjoying the music and dancing as the group performs.", "The group is happy to collaborate and compose music together."]}, "5572234385": {"audio_captions": ["A woman was laughing and a baby boy was talking with the women.", "The mom and daughter are having a silent conversation.", "Somebody is laughing and speaking quietly.", "The baby is talking, and their mom is listening and laughing."], "visual_captions": ["The baby siblings are enjoying and playing with each other.", "Two children are playing and having cute and loving conversations.", "Two children are playing in the bedroom.", "The cute brothers enjoy playing on the bed."], "audio_visual_captions": ["The two children are playing on the bed.", "Two beautiful children are playing nicely on the bed.", "A toddler is embracing a baby."], "GPT_AV_captions": ["Two children are playing and laughing on the bed.", "The baby is talking while the mom listens and laughs.", "Two children are enjoying a playful moment together."]}, "5573667855": {"audio_captions": ["Three people are making noises when they speak.", "There are more people talking and there is a lot of background noise.", "The baby is shouting and people are speaking in the background."], "visual_captions": ["The members are happily swimming with others.", "Some people are playing in the swimming pool.", "The babies are swimming with their parents."], "audio_visual_captions": ["Four families enjoy swimming pool training, which is very interesting for the kids.", "The children are playing in the swimming pool.", "The people are playing in the swimming pool.", "The family members enjoy swimming."], "GPT_AV_captions": ["Families are enjoying swimming in the pool with their children, amidst background noise and conversations.", "People are happily playing and swimming in the pool, with babies shouting and parents talking.", "Children and their parents are having fun in the swimming pool, with lively background chatter."]}, "5581572407": {"audio_captions": ["A man is speaking to someone", "A cat is meowing loudly while two people are talking in the background.", "Two people were talking with each other."], "visual_captions": ["The cat was walking on the wood.", "The cat is walking on the bridge.", "A light brown cat is slowly walking onto the wooden wall that is located in the pond.", "A cat is walking on a bridge."], "audio_visual_captions": ["The cat is walking in the river.", "A cat was silently walking in the woods.", "The cat was walking on the bridge."], "GPT_AV_captions": ["A cat is walking on a bridge while two people are talking in the background.", "A light brown cat is slowly walking onto the wooden wall that is located in the pond as a man speaks to someone.", "A cat is walking on a bridge as it meows loudly and two people converse."]}, "5585306763": {"audio_captions": ["A baby is playing in the background, and it is making noise.", "The baby is playing a game.", "The man and the baby are playing, and the baby is laughing loudly."], "visual_captions": ["One man and two children are playing a ball game.", "A man and his sons are playing with their ball.", "Two little boys and their grandfather are playing with a ball.", "Two kids and their father are playing catch with a ball."], "audio_visual_captions": ["Dad is playing with the children. Two children are playing with a ball.", "The children are playing with a man by throwing the ball to each other.", "The two children are playing with their father and enjoying catching the ball.", "Grandfather is playing a game with his grandchildren, and they are very happy enjoying the game."], "GPT_AV_captions": ["A man and two children are playing catch with a ball, and the baby is laughing loudly.", "The children are playing with their father, throwing the ball to each other and enjoying the game.", "A man and his two kids are playing a ball game, and the baby is making noise in the background."]}, "5586292125": {"audio_captions": ["People are laughing in this audio.", "The children are talking loudly, and they are enjoying.", "The entire family is very happy and joyful."], "visual_captions": ["Five men are drinking with their friends.", "People are playing with glass and drinking some juices.", "They are playing while drinking.", "Some people are playing games and drinking."], "audio_visual_captions": ["There were six people in the living room, and there was a small game. Two people were drinking wine.", "The boys' gang enjoyed the party.", "The men are enjoying the party."], "GPT_AV_captions": ["A group of people are in the living room, laughing and talking loudly while enjoying a party.", "Some men are drinking and playing games, creating a joyful and happy atmosphere.", "The entire family is having a great time, with children and adults alike enjoying the festivities."]}, "5586394125": {"audio_captions": ["The girl and boy are discussing.", "A man and a woman are having a conversation while the voices of children can be heard in the background.", "Some people are speaking to somebody."], "visual_captions": ["Two dogs and two people are playing.", "The two ladies were playing with two dogs outdoors.", "Two humans and two dogs are walking on the ground."], "audio_visual_captions": ["The dogs are playing with people.", "There are two dogs and two women.", "Two dogs are eating some food or water while people are talking in the background.", "She is playing with dogs on the ground.", "The dogs were playing with the girls."], "GPT_AV_captions": ["Two women are playing with two dogs while talking in the background.", "Two dogs and two women are outdoors, engaging with each other.", "The dogs are interacting with the women as they converse."]}, "5591479226": {"audio_captions": ["A man is singing along with a band while a crowd is cheering in the background.", "Music is playing loudly and humans are speaking.", "Friends are happily singing songs loudly in the practice room."], "visual_captions": ["A man and a woman are practicing dance.", "They are dancing at home.", "Two people are dancing in her home or hall.", "There is a couple dancing and enjoying themselves over time."], "audio_visual_captions": ["There is one boy and one girl dancing.", "Two people are dancing to lively music in a living room, and then people cheer for them.", "A man is dancing with his partner.", "The man and girl were dancing."], "GPT_AV_captions": ["A man and a woman are dancing to lively music in a living room while a crowd cheers in the background.", "A couple is dancing and enjoying themselves as music plays loudly and people cheer.", "Two people are dancing happily to music in a living room, with cheering heard in the background."]}, "5597037980": {"audio_captions": ["A dad and mom are talking to their child, and the child is telling something to the parents.", "The baby is making sounds and there is background music playing.", "A woman is talking to someone, and there are people who are being very loud. Additionally, there is a baby talking in the background."], "visual_captions": ["The baby is being fed milk.", "A baby is playing with a feeding bottle.", "The child was playing with a feeding bottle.", "The baby is feeding from the milk bottle."], "audio_visual_captions": ["A baby boy is walking and drinking milk.", "The baby is playing in the room with the mother.", "The baby is holding her feeding bottle and walking around the table."], "GPT_AV_captions": ["A baby is walking around the room, holding and drinking from a feeding bottle, while the parents talk to each other and to the baby.", "The baby is playing with a feeding bottle, making sounds, and there is background music playing.", "The baby is interacting with the parents, who are talking to each other and to the baby, while the baby holds the feeding bottle."]}, "5599111348": {"audio_captions": ["A baby is playing music.", "The people are shouting loudly and playing music.", "Father played the drum, mother sang, and the baby enjoyed shouting and talking."], "visual_captions": ["The child is playing the drums instrument.", "The baby is playing music.", "The father and son are sitting while the daughter is playing the drums.", "The children are playing the instruments very well."], "audio_visual_captions": ["Two children play the piano and drums while their parents enjoy watching them. The family is very enjoyable.", "A girl is playing the drums and a boy is playing the piano, and they encourage their children by clapping.", "The two babies are playing the musical instruments and the daddy is enjoying.", "The baby was playing the drums."], "GPT_AV_captions": ["A baby is playing the drums while the father and mother enjoy watching and clapping.", "The baby plays the drums as the family enjoys the music together.", "The child plays the drums while the parents and sibling watch and encourage."]}, "5607360009": {"audio_captions": ["The birds are singing softly and the wind is making a gentle sound.", "The birds are singing in the peaceful breeze.", "The sound of air and birds can be heard in this audio."], "visual_captions": ["The man is teaching the boy how to ride a bicycle.", "The boy is playing with a bicycle.", "The boy practices cycling with the help of his dad.", "A father is teaching cycling to his son."], "audio_visual_captions": ["An older person is helping a child to ride a bicycle.", "A father was teaching his son how to ride a bicycle.", "The man is helping his son or grandson practice bicycle."], "GPT_AV_captions": ["A father is teaching his son how to ride a bicycle while birds sing softly in the background.", "The man helps his son practice cycling as the gentle sound of wind and birds can be heard.", "A father guides his son on a bicycle ride, accompanied by the peaceful sounds of nature."]}, "5608080109": {"audio_captions": ["The father was teaching the child, and the mother was together.", "The man was talking to someone.", "A man was speaking with someone and laughing."], "visual_captions": ["The mother and baby are playing with toys.", "The baby boy is happily playing with his mother.", "The baby is taking the paper and playing with it.", "One child is playing with the toys and one woman is sitting."], "audio_visual_captions": ["The child is playing with his parents, and they are very happy. A dog sees the child.", "The baby is very cute. A dog is playing. The baby's smiling is very nice.", "The mother and father are talking while the child is playing."], "GPT_AV_captions": ["The child is playing with his parents, and they are very happy. A dog sees the child.", "The mother and father are talking while the child is playing with toys.", "The baby boy is happily playing with his mother while the father talks and laughs."]}, "5608194207": {"audio_captions": ["There is a happy event being celebrated by people in the background.", "There are many people clapping on the stage.", "The event is being enjoyed by people in the background.", "Someone is attending the party or music carnival."], "visual_captions": ["A man is recording a video for a man and a woman.", "He is recording a video with a camera in the hotel.", "The bride and groom are walking on the floor."], "audio_visual_captions": ["There was a very clear photoshoot of the party, and two members participated in the party.", "The man and woman are coming to the welcome party, and the cameraman is taking photos.", "In a party the cameraman took a photograph of the couple, capturing them walking well.", "A couples' photo shoot, one couple is posing for the photographer.", "The man is recording the event, and the bride and groom are walking over there."], "GPT_AV_captions": ["A man is recording a video of the bride and groom at a happy event with many people clapping in the background.", "The bride and groom are walking on the floor while a cameraman captures the moment at a lively party.", "A couple is being photographed by a cameraman at a celebration, with people enjoying the event in the background."]}, "5614883965": {"audio_captions": ["The man is talking to the baby.", "The dad is talking to his little baby, and the baby responds using childlike language.", "The boy is speaking like a child."], "visual_captions": ["The little boy kept opening the door repeatedly.", "The little boy opens the cupboard and plays with his toys.", "A child was opening a cupboard."], "audio_visual_captions": ["The little kid opened and closed the storeroom door while dad called the little baby.", "The cute baby is playing with the door and enjoying the attention of the parents.", "The kid is playing with a toy car."], "GPT_AV_captions": ["A little boy is opening and closing the cupboard door while his dad talks to him.", "The dad is talking to his little baby, who responds in childlike language, while playing with the cupboard door.", "The child is enjoying the attention of his dad while playing with the cupboard door."]}, "5625120077": {"audio_captions": ["A person is speaking with someone.", "People are talking and one person is talking loudly.", "A man is engaged in a conversation with other individuals.", "The man is talking seriously about life."], "visual_captions": ["The chef is explaining the recipes to the students.", "The executive chef is explaining to other chefs how to cook the dishes deliciously.", "The chief is explaining to the student.", "People are doing something in the kitchen."], "audio_visual_captions": ["A chef was teaching a class to their students.", "The chef was talking to the junior chef about how to prepare cooked food.", "The chef is giving an explanation.", "He is teaching about cooking."], "GPT_AV_captions": ["A chef is explaining recipes to students in a kitchen.", "The chef is teaching a class about cooking to junior chefs.", "The chef is engaged in a serious conversation about how to prepare delicious dishes."]}, "5630978721": {"audio_captions": ["A father is feeding his picky baby while a television show plays in the background.", "The baby was crying while the father was talking to the baby in a very cheerful manner.", "A person is conversing with the child.", "Daddy asked the baby if they were hungry.", "A man is speaking to the child. The child is very active, and the people around them are listening to the man's speech."], "visual_captions": ["A father is feeding his baby milk from a bottle, and the baby is crying.", "The father is giving the baby a bottle of milk.", "The father is feeding milk to the baby while the baby is crying."], "audio_visual_captions": ["A father is feeding his baby.", "When a child is hungry and cries, the father feeds the youngster.", "Daddy is feeding milk to the baby, and he takes it out. Then the baby cries for the second time, and daddy feeds the milk again.", "Dad feeds his baby with a bottle for feeding.", "A man is feeding a baby using a feeding bottle. Finally, the man kisses the baby."], "GPT_AV_captions": ["A father is feeding his baby milk from a bottle while the baby is crying, and a television show plays in the background.", "The father is talking to the baby in a cheerful manner, asking if they are hungry, and the baby is very active.", "The father feeds the baby milk, takes the bottle out, and when the baby cries again, he resumes feeding, then kisses the baby."]}, "5644588422": {"audio_captions": ["The man is giving a speech to the group of people.", "In an auditorium, men receive applause for their speeches.", "There is a person talking in the hall."], "visual_captions": ["Two men were having a conversation on a stage.", "On stage, the men are delivering a speech to the audience.", "Two men are on stage and are speaking into a microphone. Some other people were sitting on the side of the stage."], "audio_visual_captions": ["There were two people standing on the stage, and one of them was speaking about the other. Throughout the function, there was a sound of applause until it ended.", "Two men are giving the some advice and introducing the same people on the stage.", "In a meeting hall, two people are talking one by one. Three judges are sitting on the stage. One judge goes to the audience side and asks a question. The audience is laughing.", "People are meeting in a hall."], "GPT_AV_captions": ["Two men are on stage giving speeches to an audience, with applause heard throughout the event.", "In an auditorium, two men are speaking into microphones while people sit on the side of the stage.", "During a function, two men take turns speaking on stage, and the audience responds with laughter and applause."]}, "5650441607": {"audio_captions": ["He is speaking to a lady.", "A man is talking to their baby.", "The woman is talking with her husband with love.", "Man and woman are discussing Easter."], "visual_captions": ["A mother is feeding her baby and playing with the baby.", "A girl is feeding a baby.", "A girl is feeding her baby."], "audio_visual_captions": ["The mother talks to her baby and shows the grocery items to her baby.", "Two parents give their newborn child their first Easter basket.", "The baby feeds the mom and is very cute.", "The mother is giving a gift to her baby while feeding.", "The child's parents are introducing new things to them."], "GPT_AV_captions": ["A mother is feeding her baby and talking to her husband about Easter.", "The parents are introducing new things to their baby while discussing Easter.", "The mother is showing grocery items to her baby and feeding them."]}, "5654616479": {"audio_captions": ["There is a man speaking and many women's voices can be heard in the background. Additionally, there is a lot of noise in the background.", "People are laughing and a mixer is running in the background.", "A group of people is talking and laughing while someone is blending something in the background.", "They are joking, speaking, and playing with each other."], "visual_captions": ["A man was playing with his friends with a gun.", "The man is playing with his coworkers using a toy gun.", "The man is playing with the gun in the office."], "audio_visual_captions": ["The man is playing with the gun along with others.", "A man is playing with a toy gun in the office.", "A man was shooting a gun in a funny manner while he was in the office."], "GPT_AV_captions": ["A man is playing with a toy gun in the office while people are talking and laughing in the background.", "The man is joking and playing with a toy gun along with his coworkers in the office.", "People are laughing and talking as a man plays with a toy gun in a lively office environment."]}, "5656360308": {"audio_captions": ["One music band was playing music. It was very good.", "There is a man who sings and plays music, and there is a woman who appreciates it.", "A man is currently singing a song."], "visual_captions": ["One person is playing with a child in the playground.", "A man is pushing a boy on a skate and running in the playground.", "A father is playing with his child on the ground."], "audio_visual_captions": ["The person and the baby are running.", "The father is playing with the child.", "The father and child are playing on the ground."], "GPT_AV_captions": ["A man is playing with his child on the playground while singing a song.", "A father is pushing his child on a skate and running in the playground.", "A man sings and plays music as he enjoys time with his child on the ground."]}, "5662041273": {"audio_captions": ["A woman is talking to a man while they are playing with a baby in the background.", "A father and son were talking about something.", "A woman is talking in the background and making a lot of noise."], "visual_captions": ["A baby is playing a game at home.", "The little boy is playing with a remote control plane and keeps playing with it repeatedly.", "A child was playing with a toy using a joystick."], "audio_visual_captions": ["The boy is playing with a remote-controlled helicopter game while his father motivates the baby with great enthusiasm.", "A boy was playing with a remote-controlled helicopter.", "The baby was playing with a joystick while the father was helping the child.", "A boy is sitting on the sofa, playing with a remote-controlled helicopter toy. His father appreciates the boy for becoming a good pilot. However, the helicopter falls down, but the boy picks it up and continues playing."], "GPT_AV_captions": ["A boy is playing with a remote-controlled helicopter toy while his father encourages him enthusiastically.", "A woman is talking in the background as a boy plays with a remote-controlled helicopter, and his father helps him.", "A boy is sitting on the sofa, playing with a remote-controlled helicopter, and his father appreciates his efforts."]}, "5662313254": {"audio_captions": ["The man is speaking and the other man is laughing.", "Some people are talking in this audio clip.", "This person is very likable, and the discussions between this person and their family members are quite funny."], "visual_captions": ["A man is knocking on the table, and there are also some foods on the table.", "Breakfast was packed and covered.", "There is bread and some types of dishes on the table.", "They explore food, such as bread.", "The table has snacks for friends' meeting, including buns, bread, biscuits, and chips. It is a joyful occasion."], "audio_visual_captions": ["The bread slices are placed on the table with proper covers for breakfast.", "The members are eating breakfast.", "They are having a dinner meeting at the hotel."], "GPT_AV_captions": ["A man is speaking and another man is laughing while they sit at a table with various foods like bread, buns, biscuits, and chips.", "The table is set with covered breakfast items, and the people are enjoying a joyful meal together.", "The group is having a lively discussion and sharing a meal, creating a warm and likable atmosphere."]}, "5671008554": {"audio_captions": ["The moments of celebration when the person won playing the game.", "People are speaking loudly in the background.", "Many people are laughing and talking, enjoying the parties very happily and loudly, saying something."], "visual_captions": ["A girl and her father are playing together.", "A baby girl is playing with a toy and smiling with a man.", "The father and daughter are playing."], "audio_visual_captions": ["The grandfather is playing with the child.", "The baby and grandfather are playing with vegetables.", "A girl is tapping the toy with her dad.", "A baby is playing with their father with balls."], "GPT_AV_captions": ["A baby girl is playing with a toy and smiling with her father while people are speaking loudly in the background.", "The father and daughter are playing together, enjoying the moment as many people laugh and talk happily around them.", "A girl is tapping the toy with her dad, celebrating and having fun amidst the lively party atmosphere."]}, "5681946487": {"audio_captions": ["A woman and children are clamoring with excitement while water splashes and a baby squeals.", "The baby has a very nice smile.", "They are currently engaged in water play."], "visual_captions": ["The mother and baby are playing with water.", "The baby was taking a bath with the mother.", "The child was bathed in water."], "audio_visual_captions": ["A baby is taking a bath in the bathroom.", "The mother is bathing the child while he plays in the water tub.", "The child is playing while taking a bath.", "The mother bathes her child in the restroom."], "GPT_AV_captions": ["A mother and her baby are playing with water while the baby squeals with excitement.", "The baby is taking a bath and smiling as the mother bathes him in the bathroom.", "The child is enjoying water play in the tub while the mother bathes him."]}, "5687893796": {"audio_captions": ["There is music playing in the background.", "Old classical music is often used as background music for comedy scenes.", "This person is very fond of music and enjoys it at a high volume.", "Some individuals were playing the piano."], "visual_captions": ["A lady turned on the music and joined the dance party with her friends, while one of the men started teaching her a dance move.", "A group of people are dancing in the room. A man is standing across from them and taking something from the cupboard.", "The boy and a group of girls are enjoying dancing to the song.", "Two men and three girls are dancing to party songs."], "audio_visual_captions": ["The boy and the girls are dancing.", "The song is playing and the four of them are dancing.", "The party is currently happening, and both the girls and boys are enjoying themselves by dancing.", "The people are dancing while the music plays in the background with others."], "GPT_AV_captions": ["A group of people, including boys and girls, are dancing to the music playing in the background at a party.", "A lady turned on the music and joined the dance party with her friends, while one of the men started teaching her a dance move.", "Two men and three girls are dancing to the music, enjoying themselves at the party."]}, "5694941758": {"audio_captions": ["The child is speaking  and playing.", "The person is speaking while there is a frequent bell sound.", "A woman is having a conversation while the sound of water can be heard in the background.", "A woman is speaking while the sound of water is being heard."], "visual_captions": ["The child played the game on a mobile phone.", "The baby is playing with a mobile phone.", "The child is watching something on the phone."], "audio_visual_captions": ["A child is watching stories on the mobile phone.", "The small child is watching a video on the phone and trying to move the picture. After that, they take a green ball and look upwards.", "A baby is watching a mobile phone.", "The child is watching the phone."], "GPT_AV_captions": ["A child is watching something on a mobile phone while a woman is speaking and the sound of water can be heard in the background.", "The child is playing with a mobile phone and there is a frequent bell sound while a woman is having a conversation.", "The child is watching a video on the phone and trying to move the picture, then takes a green ball and looks upwards."]}, "5697975018": {"audio_captions": ["The background music and sound.", "The music is enjoyable and has a pleasant melody.", "Playing music and enjoying this music."], "visual_captions": ["Two men are working in the system, and one is giving instructions to the other.", "Two men were seeing  the  computer system.", "Two gentlemen are working here on a computer."], "audio_visual_captions": ["Two men are working on computers while listening to loud music.", "The two boys are coding.", "The two men are very serious about our work. The work is going well, and the man working is very interesting."], "GPT_AV_captions": ["Two men are working on a computer while listening to music.", "Two men are focused on their work with pleasant background music playing.", "Two gentlemen are coding on a computer with enjoyable music in the background."]}, "5705234852": {"audio_captions": ["A group of friends is enjoying the match and cheering on the participants.", "The people in the background are making loud sounds.", "Many people are happily talking and laughing.", "A group of people enjoyed the party and were shouting all the time."], "visual_captions": ["Families spend time together at restaurants and enjoy each other's company.", "The mother was encouraging her child.", "The boy was eating at the restaurant."], "audio_visual_captions": ["A mother and her son are in a restaurant, and there is loud background noise playing.", "The children eat the dinner.", "The kids are eating at a restaurant.", "The friends have a party at a restaurant."], "GPT_AV_captions": ["A mother and her son are in a restaurant, enjoying their meal amidst loud background noise.", "Families are spending time together at a restaurant, with people happily talking and laughing.", "A group of friends is having a party at a restaurant, cheering and making loud sounds."]}, "5710270308": {"audio_captions": ["Some people are talking to and playing with the child.", "A man and a woman are having a conversation while the voices of children can be heard in the background.", "The family is interacting with each other, and the baby is shouting in the background."], "visual_captions": ["The child is playing with a ball.", "A small baby is playing with his toys.", "The baby is playing with balls.", "The baby is playing with the toys and enjoying them."], "audio_visual_captions": ["A baby is playing with balls while a television is playing in the background.", "The baby is playing with the balls.", "A little child is playing with his toys.", "The baby plays with a red ball, then takes a yellow ball, and finally takes the red ball again."], "GPT_AV_captions": ["A baby is playing with balls and toys while people are talking and interacting in the background.", "A small child is enjoying playing with a red ball, then a yellow ball, and then the red ball again, with family voices in the background.", "The baby is playing with toys and balls, and there is a conversation between a man and a woman with children\u2019s voices heard."]}, "5717610831": {"audio_captions": ["The boy is singing a song, playing the song, and dancing.", "Music is playing while the child sing a song.", "There is a small child energetically singing along with the song in the background.", "There is a song playing in the background.", "A child was singing a rhyming song."], "visual_captions": ["A baby girl was playing with her hand.", "The baby girl was looking at the laptop and dancing with her mother.", "The baby is playing and dancing."], "audio_visual_captions": ["A child was dancing in the home.", "A baby is singing a song and dancing.", "The baby sings the song and enjoys it."], "GPT_AV_captions": ["A child is singing a song and dancing energetically.", "A baby is dancing and singing along with the music.", "The baby is enjoying the song while dancing."]}, "5722872813": {"audio_captions": ["The music being played on the piano is very sad and eerie.", "Someone is playing the keyboard and people clap at the end.", "Someone is playing the piano in this auditorium.", "There is background music playing."], "visual_captions": ["Two kids are playing piano music.", "Two children were playing a piano.", "One woman and one girl are playing piano."], "audio_visual_captions": ["The girl is playing music while sitting.", "The baby is playing the piano superbly.", "A piano teacher and her student are playing the piano.", "She is playing the piano very nicely.", "The two children were playing the piano."], "GPT_AV_captions": ["Two children are playing the piano in an auditorium, and the music is sad and eerie.", "A piano teacher and her student are playing the piano, and people clap at the end.", "A girl is playing the piano very nicely while sitting, and there is background music playing."]}, "5728648619": {"audio_captions": ["Some people are having a conversation and laughing.", "The family is having a discussion with each other.", "There is a lot of chatter among people in a crowded place.", "A man and a woman had a funny conversation. Sometimes they spoke loudly and made each other laugh."], "visual_captions": ["A man is teaching the student how to draw the drawing.", "A man is writing and drawing on a pad of paper. A boy asks the man some questions.", "He is teaching the child.", "There is a class with a teacher and students present."], "audio_visual_captions": ["The teacher is writing on the board in class.", "The man is drawing a picture.", "A boy is attending a drawing class.", "A man is teaching something using a drawing."], "GPT_AV_captions": ["A man is teaching a boy how to draw, and they are having a lively conversation and laughing.", "The teacher is drawing on a pad of paper while the boy asks questions, and they both laugh at times.", "In a drawing class, a man and a boy are discussing and laughing as the man teaches using drawings."]}, "5729076991": {"audio_captions": ["A baby is crying while people are talking in the background and there is loud music playing.", "Some men and women were happily interacting with a baby while he or she was playing.", "A child is currently listening to music in the background."], "visual_captions": ["The child is playing at home.", "A baby is playing at home.", "The baby girl is very happy to see her parents and she moves towards her father.", "A baby is playing inside the house.", "The baby is playing with toys."], "audio_visual_captions": ["The baby is playing in the house.", "The little girl is playing with toys and moving out of the house.", "A baby girl is crawling on the floor and playing with objects."], "GPT_AV_captions": ["A baby is playing at home with toys while people are talking in the background and music is playing.", "The baby girl is happily interacting with her parents and crawling on the floor.", "A baby is playing inside the house, enjoying the company of adults and listening to music."]}, "5731927400": {"audio_captions": ["Someone is talking, playing in the background, and laughing joyfully.", "A girl is talking in the background and laughing.", "There appears to be a group of people walking, talking, and laughing in a small manner.", "There are people speaking and laughing in the background."], "visual_captions": ["The trainer trains the dog and the dog follows the trainer's instructions.", "Women and a dog are playing in a hall.", "The black dog is playing with its owner."], "audio_visual_captions": ["The dog is playing with the children.", "A dog was playing with a woman.", "The dog is chasing its tail and playing a game."], "GPT_AV_captions": ["A black dog is playing with a woman and children, following the trainer's instructions, while people are talking and laughing in the background.", "A group of people, including women and children, are in a hall where a black dog is being trained and playing joyfully.", "The dog is interacting with its owner and others, chasing its tail and engaging in playful activities, accompanied by background laughter and conversation."]}, "5732384406": {"audio_captions": ["There is background music and people are dancing.", "The music is wonderful and very nice.", "The people are singing a song."], "visual_captions": ["The boys are playing instruments.", "The four people play musical instruments and sing songs.", "The group of people is singing a song and playing music.", "The group of friends is playing instruments."], "audio_visual_captions": ["A group of boys are participating in the music show.", "The people are playing the music.", "The boys are playing the instruments and singing the song."], "GPT_AV_captions": ["A group of people is playing musical instruments and singing a song.", "The group of boys is participating in a music show, playing instruments and singing.", "The people are dancing to wonderful background music while playing instruments and singing."]}, "5738937644": {"audio_captions": ["A man is talking to someone around.", "A man is discussing the optimization and tuning of a mechanism.", "A person is explaining something to someone."], "visual_captions": ["The man is teaching something, and the boy is listening.", "The person operating the system is informing the student.", "One man was teaching a lesson on computers, and another man was listening."], "audio_visual_captions": ["A man is instructing his student.", "The boy is teaching the student and explaining the details.", "The people working at the company are using the computer.", "The man wearing a black t-shirt is explaining the project to his colleague."], "GPT_AV_captions": ["A man is explaining the optimization and tuning of a mechanism to his student.", "The man in a black t-shirt is teaching and informing his colleague about the project.", "A person is instructing and discussing details with a student while using the computer."]}, "5750799064": {"audio_captions": ["The baby is playing a game.", "A child is laughing loudly in our house.", "The baby laughs, giggles, and makes playful sounds upon hearing that his father and mother are enjoying themselves."], "visual_captions": ["The two children are playing with the toys.", "One boy's brother enjoys being with his brother.", "Two small boys are playing with a basket and going around in their house.", "The two children are playing very cutely."], "audio_visual_captions": ["The two children played a very funny game.", "Two children are playing in the room.", "Two children are playing at home."], "GPT_AV_captions": ["Two children are playing a game at home, laughing and giggling.", "The two children are enjoying themselves while playing with toys in the room.", "Two small boys are having fun playing together in their house."]}, "5757232720": {"audio_captions": ["The child is playing with their parents.", "A small child is playing with someone.", "A child is talking and laughing while their parents seem to be talking in the background."], "visual_captions": ["A small baby is playing with a toy while her father is at home.", "The child is extremely happy inside the house.", "A baby is playing with toys in the room.", "A girl is playing in the house.", "A baby is playing in the house with toys and running around."], "audio_visual_captions": ["The child is playing with the floor.", "The girl is playing with a man and a woman. She is running around the kitchen, and the man gives chips to the girl.", "The baby girl is moving in circles inside the room. Then she is playing with her parents."], "GPT_AV_captions": ["A baby girl is playing with toys and running around the house while her parents are talking in the background.", "The child is extremely happy, playing with her parents and moving in circles inside the room.", "A girl is playing with a man and a woman, running around the kitchen, and the man gives her chips."]}, "5759653927": {"audio_captions": ["A male performer is singing. He is playing with the table and singing a song with his family.", "They are speaking and singing.", "The man is singing a song, but the woman is laughing while listening to the song and also singing along with him.", "People in the room are talking and smiling."], "visual_captions": ["The friends are speaking in the office.", "Five members discussed the deal and cleared some doubts about the teamwork.", "A group of people is discussing and talking about something."], "audio_visual_captions": ["One boy is reading the text while the others are enjoying it and they are smiling together.", "One boy read the text and sang a song. His friends enjoyed it and they laughed at each other.", "In a conference hall, three boys and two girls were composing music, singing, and laughing."], "GPT_AV_captions": ["A group of people is in a room, talking, smiling, and enjoying a song together.", "A man is singing a song while a woman laughs and sings along; others in the room are smiling and talking.", "In a conference hall, a group of friends, including three boys and two girls, are composing music, singing, and laughing together."]}, "5765473409": {"audio_captions": ["The discussion with the child is very interesting, and they are happy and enjoy speaking.", "The baby is speaking happily.", "A man is talking to a woman, and the woman is laughing and talking to him."], "visual_captions": ["A baby is playing with a dog.", "A baby is playing with a dog and giving food to the dog.", "The child is playing with the dog while the father is smiling.", "The baby was playing with the dog.", "The baby was playing with her dog."], "audio_visual_captions": ["The baby is playing a game with the dog.", "The child is playing with the dog while her father is sitting nearby. The child is feeding food to the dog.", "The baby is playing with a dog and some food is being provided to the dog.", "A child is playing while a man is sitting nearby.", "A child is playing with the dog while its father is sitting beside the child, and the mother is recording the video."], "GPT_AV_captions": ["A baby is playing with a dog while the father is smiling nearby.", "The child is happily playing with the dog and feeding it while the father watches.", "A baby is playing with a dog and giving it food, with the father sitting close by."]}, "5766018720": {"audio_captions": ["A man and a woman are discussing while music is playing in the background.", "The man is engaged in a slow conversation with someone else.", "Music is playing on a device."], "visual_captions": ["A baby is playing with some toys.", "The baby boy is playing with toys at home.", "The baby is playing with toys in his bedroom.", "One child is playing with a toy.", "The baby was playing with toys."], "audio_visual_captions": ["The baby is playing with soft toys and a musical toy.", "The baby was playing with toys.", "The baby is playing with the toys while some music is playing.", "A child is seen playing with toys, specifically a toy dog.", "The baby plays with the dog toy first, then makes a sound to get the attention of the father and the baby. After that, the baby plays with a musical item and enjoys the movement."], "GPT_AV_captions": ["A baby is playing with toys while music is playing in the background.", "The baby is playing with a toy dog and a musical toy.", "A man and a woman are discussing while the baby plays with toys."]}, "5770462342": {"audio_captions": ["A father is playing with his young child.", "A man is playfully talking to the baby.", "A small child is speaking with their father.", "The father and his baby are having a conversation, and the baby is speaking in an adorable manner. There are also some noises coming from outside."], "visual_captions": ["The baby is cute and eating snacks.", "The baby girl is talking and has taken the cup in her hands.", "A cute girl is sitting on the sofa and eating something.", "The child is eating snacks from the bowl."], "audio_visual_captions": ["The child is eating while holding a cup.", "A girl is speaking to someone and she is very happy.", "The girl child is speaking with someone."], "GPT_AV_captions": ["A father is playfully talking to his young child who is eating snacks and holding a cup.", "A cute girl is sitting on the sofa, happily speaking with her father while eating from a bowl.", "The baby girl is having an adorable conversation with her father, holding a cup and eating snacks."]}, "5770740059": {"audio_captions": ["A man is playing music and singing a song while people are shouting and clapping.", "A singer is performing by playing the guitar in a public place, and people were applauding.", "The man is singing a song beautifully.", "The boy is singing and enjoying. Other people applaud and congratulate him."], "visual_captions": ["The man was engaged in music.", "The man is playing the guitar.", "The man is singing the song."], "audio_visual_captions": ["The human is playing an instrument.", "The man was playing music and singing a song on the stage.", "The man is playing a guitar and singing a song.", "The man is playing music.", "A person is singing a song with a guitar, and another person is taking a photo."], "GPT_AV_captions": ["A man is playing the guitar and singing a song while people are applauding and shouting.", "The man is performing music on stage with a guitar, and the audience is clapping.", "A man is singing and playing the guitar, and people are enjoying and congratulating him."]}, "5779635831": {"audio_captions": ["The horse is running, and the man is shouting.", "The sound of a running horse can be heard.", "The two people are running quickly and talking."], "visual_captions": ["The man was practicing horse riding.", "The person is riding a horse.", "A person is riding a horse from right to left and then from left to right continuously for two times."], "audio_visual_captions": ["The man is riding a horse, and there are dogs on the way.", "The cowboy is riding the horse, and the dogs are playing.", "A man was riding a horse.", "The man is riding a horse."], "GPT_AV_captions": ["A man is riding a horse, and there are dogs on the way.", "The man is riding a horse from right to left and then from left to right continuously.", "The sound of a running horse can be heard as the man rides."]}, "5787622236": {"audio_captions": ["The girl is speaking and the baby is being loud.", "A baby was playing with their daddy and mummy.", "A baby is shouting while people are talking in the background."], "visual_captions": ["A man is changing his baby's clothes while they walk around.", "A baby boy is playing with his father and dog.", "A baby is playing with a dog and wandering here and there. The dog is walking back to the baby. A man is taking care of the baby."], "audio_visual_captions": ["The baby is playing with the toy at home with their father.", "A child was moving in the room while his father was changing the child's shirt, and a dog was walking in the room.", "The baby is playing with his dad and walking alongside him. They are playing with many toys and having a great time.", "One child was playing and the child's father is changing a dress for the child."], "GPT_AV_captions": ["A baby is playing with his father and a dog while the father changes the baby's clothes.", "The baby is moving around the room, playing with toys, and making noise while the father takes care of him.", "A baby boy is interacting with his dad and a dog, enjoying their time together at home."]}, "5793991791": {"audio_captions": ["Two adults are engaged in conversation with a baby in a busy location.", "The mother is speaking to her young child.", "The father and mother were talking to their child."], "visual_captions": ["Two babies are playing a game on a seesaw.", "Two children are playing on a see-saw in a theme park.", "Two children are playing with some seesaw toys."], "audio_visual_captions": ["Two children are playing on a seesaw and exchanging their seats.", "Two babies are playing a seesaw game.", "Two children are playing on the seesaw."], "GPT_AV_captions": ["Two children are playing on a seesaw in a busy location.", "Two children are playing on a seesaw in a theme park.", "Two children are playing on a seesaw and exchanging their seats."]}, "5798851653": {"audio_captions": ["One woman was laughing while there were sounds of birds in the background.", "One girl is talking to her baby.", "The children and parents are playing."], "visual_captions": ["One little kid gave carrots to goat.", "The baby boy gave food to the goat.", "A child was on a farm with animals and happily fed them.", "He feeds the baby goats."], "audio_visual_captions": ["The baby is playing with the sheep.", "The child is playing with a cow and is very happy at that moment.", "A child is feeding a goat with a carrot.", "The baby was given snacks for the goats."], "GPT_AV_captions": ["A child is feeding a goat with a carrot while sounds of birds are in the background.", "A woman is laughing as children and parents play on a farm with animals.", "A baby is happily interacting with farm animals, including feeding goats."]}, "5799956920": {"audio_captions": ["The people are talking in the background.", "A group of friends are laughing and talking while waves are crashing on the beach.", "The family is playing with the child and making the child laugh."], "visual_captions": ["The child is playing in a swimming pool.", "The two babies are playing in the water with their toys.", "Two babies are playing in the water."], "audio_visual_captions": ["Two children are playing in the water and with toys outside, while their parents are standing nearby.", "The two babies are playing in the water with the toys.", "Two babies are playing with water and toys, and then family members join them to enjoy the activity.", "Two children are playing with water."], "GPT_AV_captions": ["Two children are playing in the water with toys while their parents are standing nearby.", "The family is enjoying time together as the children play in the water with their toys.", "A group of friends and family members are laughing and talking while the children play in the water with toys."]}, "5802161982": {"audio_captions": ["The group of members is talking loudly and the background is noisy.", "There are many girls talking and laughing.", "The background was noisy, and one man was talking with someone while some people were making noise."], "visual_captions": ["The couple cut the cake.", "A woman is hosting a birthday party.", "A group of people is celebrating something by cutting a cake.", "A couple is attempting to cut the cake at a function."], "audio_visual_captions": ["The couple is celebrating their marriage reception with friends and family.", "Some people are celebrating a birthday.", "A family was celebrating a birthday party.", "A new couple is cutting the cake while people are watching in the background.", "The couple's cake cutting celebration."], "GPT_AV_captions": ["A couple is cutting a cake while a group of people celebrates in a noisy background.", "A couple is celebrating a special occasion with friends and family, cutting a cake amidst laughter and talking.", "A group of people is gathered around a couple cutting a cake, with lively conversations and background noise."]}}