[{"frame_index": 1, "sentence_text": "The image depicts a man standing in a room filled with boxes and various items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 1, "sentence_text": "There are several chairs scattered throughout the room, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 1, "sentence_text": "A truck is visible in the room, and a couple of bottles are placed on surfaces.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 1, "sentence_text": "The man appears to be looking at the boxes, possibly organizing or unpacking them.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 1, "sentence_text": "The room seems to be a storage area or a place for sorting and packing items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 3, "sentence_text": "In the image, there are two people walking down a street.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 3, "sentence_text": "One person is wearing a white shirt and the other is wearing a black shirt.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 3, "sentence_text": "They are both carrying backpacks.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 3, "sentence_text": "The street is lined with various objects, including a chair, a dining table, and a couch.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 3, "sentence_text": "There are also several boxes and a truck parked on the side of the street.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 3, "sentence_text": "Additionally, there is a bottle and a cup visible in the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 3, "sentence_text": "The overall atmosphere suggests a casual, everyday setting.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 2, "sentence_text": "In the image, there is a man standing in front of a store, possibly a furniture store, with several boxes and chairs scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 2, "sentence_text": "The man appears to be looking at the boxes, possibly considering purchasing them.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 2, "sentence_text": "There are also two other people in the scene, one standing near the left side and the other on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 2, "sentence_text": "The store has a variety of items, including chairs, a dining table, and a refrigerator.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 2, "sentence_text": "Additionally, there is a car parked outside the store, and a bottle can be seen placed on a surface.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 8, "sentence_text": "In the image, a man is walking down a street, carrying a box in his hand.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 8, "sentence_text": "The street is lined with various objects, including a truck parked on the right side of the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 8, "sentence_text": "There are several chairs scattered throughout the area, with one near the center of the scene and another closer to the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 8, "sentence_text": "Additionally, there are two dining tables, one located in the middle of the scene and the other towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 8, "sentence_text": "A few bottles can be seen on the ground, with one near the center and another closer to the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 8, "sentence_text": "A bowl is also visible on the left side of the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 6, "sentence_text": "In the image, there are two people standing in a room filled with boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 6, "sentence_text": "One person is closer to the left side of the room, while the other is on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 6, "sentence_text": "They appear to be engaged in a conversation or activity involving the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 6, "sentence_text": "The room is furnished with a chair located near the center of the room and a dining table towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 6, "sentence_text": "There are also two bottles placed in the room, one near the left side and the other closer to the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 7, "sentence_text": "In the image, a man is walking down a street, carrying a box in his hand.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 7, "sentence_text": "There are several other people in the scene, some of whom are wearing backpacks.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 7, "sentence_text": "A truck is visible in the background, and a chair can be seen nearby.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 7, "sentence_text": "Additionally, there are multiple bottles scattered throughout the scene, and a clock is mounted on a wall.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 7, "sentence_text": "The overall atmosphere suggests a busy urban environment.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 5, "sentence_text": "In the image, there are two people standing in a room filled with boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 5, "sentence_text": "One person is positioned closer to the left side of the room, while the other person is standing more towards the center.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 5, "sentence_text": "They appear to be engaged in a conversation or activity involving the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 5, "sentence_text": "The room is furnished with a chair located near the center and a dining table towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 5, "sentence_text": "There are also two bottles placed in the room, one near the center and the other closer to the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 5, "sentence_text": "Additionally, a car can be seen in the background, parked on the right side of the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 4, "sentence_text": "In the image, there are two people walking down a street.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 4, "sentence_text": "One person is wearing a white shirt and the other is wearing a black shirt.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 4, "sentence_text": "They are both carrying backpacks.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 4, "sentence_text": "The street is lined with boxes and crates, some of which are stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 4, "sentence_text": "There is also a chair located near the center of the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 4, "sentence_text": "Additionally, there is a truck parked on the right side of the image.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 9, "sentence_text": "In the image, a man is walking down a street, carrying a box on his head.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 9, "sentence_text": "The street is lined with various objects, including a chair, a dining table, and a refrigerator.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 9, "sentence_text": "There are also several bottles scattered throughout the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 9, "sentence_text": "The man appears to be the main focus of the image, as he navigates the street with his box.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 14, "sentence_text": "In the image, a person is standing in a room with a red hoodie on, surrounded by various boxes and items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 14, "sentence_text": "There are multiple chairs in the room, with one near the person and another further away.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 14, "sentence_text": "A dining table is also present in the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 14, "sentence_text": "Outside the room, there is a truck visible in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 14, "sentence_text": "Additionally, there are two bottles in the scene, one near the person and the other further away.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 15, "sentence_text": "In the image, a person is standing in a room with boxes and a chair.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 15, "sentence_text": "The person is wearing a red jacket and appears to be looking at a piece of paper.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 15, "sentence_text": "There are several boxes scattered throughout the room, with some placed closer to the person and others further away.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 15, "sentence_text": "A chair is located in the middle of the room, and a truck can be seen outside the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 15, "sentence_text": "Additionally, there is a bottle placed on a surface in the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 17, "sentence_text": "In the image, there is a man standing in a room with boxes and crates scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 17, "sentence_text": "He is wearing a red shirt and appears to be unloading the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 17, "sentence_text": "There are several chairs placed around the room, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 17, "sentence_text": "Additionally, there are two bicycles in the room, one near the center and the other towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 17, "sentence_text": "A truck is visible in the background, and a clock can be seen on the wall.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 16, "sentence_text": "In the image, a person is standing in a room with a large number of boxes, some of which are stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 16, "sentence_text": "The person appears to be unpacking the boxes, possibly in a warehouse or storage area.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 16, "sentence_text": "There are several chairs scattered throughout the room, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 16, "sentence_text": "Additionally, there are a few bottles placed around the room, and a bowl is located near the center of the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 16, "sentence_text": "The overall setting suggests a busy and active environment.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 12, "sentence_text": "The image depicts a cluttered room with a variety of items scattered throughout.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 12, "sentence_text": "There are several boxes and crates, some of which are stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 12, "sentence_text": "A chair is located in the middle of the room, and a dining table can be seen towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 12, "sentence_text": "In the room, there are three people present.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 12, "sentence_text": "One person is standing near the left side of the room, another person is located in the middle, and the third person is standing closer to the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 12, "sentence_text": "Additionally, there is a bicycle parked in the room, and a truck can be seen outside the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 13, "sentence_text": "The image depicts a cluttered room with various boxes and items scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 13, "sentence_text": "There are several people in the room, some of whom are sitting on chairs while others are standing.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 13, "sentence_text": "A truck can be seen in the background, and a dining table is also present in the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 13, "sentence_text": "Additionally, there are multiple bottles and a bowl placed throughout the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 13, "sentence_text": "The overall atmosphere suggests a busy and disorganized environment.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 11, "sentence_text": "The image depicts a cluttered room with various boxes and items scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 11, "sentence_text": "There are several people in the room, some of whom are sitting on chairs while others are standing.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 11, "sentence_text": "A truck can be seen in the background, and a car is parked nearby.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 11, "sentence_text": "The room also contains a dining table and a refrigerator.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 11, "sentence_text": "There are multiple chairs placed throughout the room, and a few bottles are visible on surfaces.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 11, "sentence_text": "Additionally, a bowl is placed on a surface, and a cell phone can be seen in the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 10, "sentence_text": "The image depicts a cluttered room with various boxes and items scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 10, "sentence_text": "There are several people in the room, with one person standing near the center and two others located towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 10, "sentence_text": "A chair is situated in the middle of the room, and a dining table can be seen towards the right.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 10, "sentence_text": "In the room, there are multiple boxes of different sizes, with some placed on the floor and others stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 10, "sentence_text": "A few bottles are also visible in the scene, with one near the center and another towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 10, "sentence_text": "Additionally, there is a bowl located in the middle of the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 10, "sentence_text": "Outside the room, a car is parked on the left side, and a truck can be seen further back on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 18, "sentence_text": "In the image, a young boy is walking down a street, possibly in a foreign country.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 18, "sentence_text": "He is wearing a white shirt and sandals.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 18, "sentence_text": "The street is lined with various objects, including a truck parked on the right side of the street, a chair located in the middle of the scene, and a dining table towards the left side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 18, "sentence_text": "There are also several boxes scattered throughout the scene, some of which are stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 18, "sentence_text": "Additionally, there is a bottle placed on the ground near the center of the image.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 37, "sentence_text": "In the image, a group of people is standing outside in front of a store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 37, "sentence_text": "There are three individuals, with one person wearing a red hoodie and another wearing a black shirt.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 37, "sentence_text": "They are all holding bags, with one person holding a handbag and another holding a backpack.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 37, "sentence_text": "The scene also includes a chair and a dining table, suggesting that the store may have a seating area for customers.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 37, "sentence_text": "Additionally, there is a truck visible in the background, possibly delivering goods to the store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 19, "sentence_text": "In the image, a young boy is walking past a store with boxes and crates stacked outside.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 19, "sentence_text": "The store appears to be a furniture store, as there are multiple chairs visible in the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 19, "sentence_text": "The boy is wearing a white shirt and is walking on a sidewalk.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 19, "sentence_text": "There are also a couple of other people in the scene, one of whom is wearing a red hat.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 19, "sentence_text": "Additionally, there is a truck parked in the background, and a couple of bottles can be seen placed around the area.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 30, "sentence_text": "In the image, two people are walking in a store, possibly shopping for boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 30, "sentence_text": "One person is wearing a black shirt, while the other person is wearing a white shirt.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 30, "sentence_text": "They are surrounded by various objects, including a chair, a dining table, and a motorcycle.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 30, "sentence_text": "There are also several boxes scattered throughout the scene, possibly indicating that the store sells these items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 30, "sentence_text": "Additionally, there is a bottle visible in the background, and a clock on the wall.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 30, "sentence_text": "The overall atmosphere of the scene suggests a busy retail environment.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 40, "sentence_text": "In the image, there are two people standing on a sidewalk, one of them holding a cell phone.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 40, "sentence_text": "They appear to be engaged in a conversation or looking at something on the phone.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 40, "sentence_text": "The scene also includes a truck parked nearby, a chair, and a dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 40, "sentence_text": "There are several bottles scattered throughout the area, and a handbag can be seen close to one of the people.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 40, "sentence_text": "Additionally, there is a bird visible in the sky, adding a touch of nature to the urban setting.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 31, "sentence_text": "In the image, two people are working in a room filled with boxes and various items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 31, "sentence_text": "One person is standing near the center of the room, while the other is closer to the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 31, "sentence_text": "They appear to be engaged in a task, possibly unpacking or organizing the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 31, "sentence_text": "There are several chairs scattered throughout the room, with one near the center, another on the right side, and a third closer to the left side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 31, "sentence_text": "Additionally, there are two dining tables in the room, one located in the middle and the other towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 31, "sentence_text": "A truck can be seen in the background, possibly delivering or picking up the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 31, "sentence_text": "There are also two bottles in the room, one near the center and the other on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 34, "sentence_text": "In the image, two people are standing in a room, with one person wearing a red hood and the other wearing a black shirt.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 34, "sentence_text": "They appear to be engaged in a conversation or activity.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 34, "sentence_text": "The room is filled with various objects, including multiple chairs, a dining table, and a couple of bottles.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 34, "sentence_text": "There is also a car visible in the background, and a cell phone can be seen in the foreground.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 34, "sentence_text": "The scene seems to be set in an office or a similar indoor environment.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 35, "sentence_text": "In the image, a group of people is standing in a room, with one person holding a large white object.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 35, "sentence_text": "There are two people on the left side of the room, and three people on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 35, "sentence_text": "One person is wearing a red hoodie, and another person is wearing a black shirt.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 35, "sentence_text": "There are two chairs in the room, one near the center and the other on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 35, "sentence_text": "A truck can be seen outside the room, and a clock is mounted on the wall.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 35, "sentence_text": "Additionally, there are two bottles in the room, one near the center and the other on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 36, "sentence_text": "In the image, a group of people is standing in a room, possibly a warehouse or a store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 36, "sentence_text": "They are surrounded by various objects, including chairs, a dining table, and multiple boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 36, "sentence_text": "Some of the people are wearing ties, indicating a possible professional setting.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 36, "sentence_text": "There is also a truck visible in the background, suggesting that the room might be used for storage or transportation purposes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 36, "sentence_text": "Additionally, a clock can be seen on the wall, providing a sense of time to the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 22, "sentence_text": "In the image, a person is bending over to pick up a box in a room filled with boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 22, "sentence_text": "The person is wearing a white shirt and appears to be focused on their task.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 22, "sentence_text": "The room is filled with various boxes, some of which are stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 22, "sentence_text": "There is also a chair located in the room, and a truck can be seen outside the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 22, "sentence_text": "Additionally, there is a clock on the wall, and a bottle is placed on a surface.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 20, "sentence_text": "In the image, a person is bending over to pick up boxes in a room filled with various items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 20, "sentence_text": "There are multiple chairs scattered throughout the room, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 20, "sentence_text": "A truck is visible in the room, and a couple of bottles are placed on surfaces.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 20, "sentence_text": "Additionally, there are two bowls, a cup, and a vase in the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 20, "sentence_text": "A person is also present in the scene, possibly assisting with the task at hand.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 29, "sentence_text": "In the image, two people are standing in a room with various boxes and items scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 29, "sentence_text": "One person is standing closer to the left side of the room, while the other is standing more towards the center.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 29, "sentence_text": "There are several chairs placed throughout the room, with one near the center, another closer to the right side, and a third one near the left side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 29, "sentence_text": "A dining table can be seen in the background, and a refrigerator is located on the right side of the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 29, "sentence_text": "Additionally, there are two bottles placed in the room, one near the center and the other closer to the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 38, "sentence_text": "In the image, a group of people is standing in a room with various boxes and items scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 38, "sentence_text": "There are at least five people visible in the scene, with some of them carrying handbags.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 38, "sentence_text": "The room appears to be a storage area or a workspace, with a chair and a dining table present.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 38, "sentence_text": "Additionally, there is a surfboard in the room, which might suggest that the people are involved in sports or outdoor activities.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 38, "sentence_text": "A truck can be seen outside the room, possibly indicating that the room is connected to a larger space or a storage facility.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 24, "sentence_text": "In the image, there is a person wearing a red shirt and a red mask, standing in a room with a large number of boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 24, "sentence_text": "The person is surrounded by various objects, including a chair, a dining table, and a truck visible in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 24, "sentence_text": "There are also several other people in the scene, some of whom are wearing masks.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 24, "sentence_text": "The room appears to be a storage area or a warehouse, with numerous boxes stacked up and occupying a significant portion of the space.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 25, "sentence_text": "In the image, there are two people walking down a street.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 25, "sentence_text": "One person is wearing a red jacket, while the other person is wearing a white shirt.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 25, "sentence_text": "They are both carrying boxes, with one person holding a box in their hand and the other person carrying a box on their shoulder.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 25, "sentence_text": "The scene also includes a chair and a dining table, suggesting that the people might be moving items from a dining area to another location.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 25, "sentence_text": "Additionally, there is a clock visible in the background, indicating the time.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 28, "sentence_text": "In the image, there are two people standing in a room filled with boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 28, "sentence_text": "One person is closer to the left side of the room, while the other is on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 28, "sentence_text": "They appear to be engaged in conversation or organizing the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 28, "sentence_text": "The room is furnished with a chair located near the center of the room and a dining table towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 28, "sentence_text": "There are also two bicycles in the room, one near the left side and the other closer to the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 28, "sentence_text": "Additionally, there is a truck visible in the background, parked outside the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 39, "sentence_text": "In the image, a group of people is standing in a room filled with boxes and various items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 39, "sentence_text": "There are at least five people visible, with some of them wearing masks.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 39, "sentence_text": "One person is holding a handbag, and another is holding a bottle.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 39, "sentence_text": "The room is furnished with a chair and a dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 39, "sentence_text": "There are also multiple bicycles in the scene, with one near the center and another towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 39, "sentence_text": "Additionally, there is a truck visible in the background, and a clock can be seen on the wall.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 39, "sentence_text": "The overall setting appears to be a busy location with people engaged in different activities.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 27, "sentence_text": "In the image, a woman is standing in a room surrounded by boxes and crates.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 27, "sentence_text": "She appears to be looking at the boxes, possibly deciding what to do with them.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 27, "sentence_text": "There are several chairs in the room, with one near the woman and others scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 27, "sentence_text": "A dining table can also be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 27, "sentence_text": "Additionally, there is a car visible in the scene, parked outside the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 21, "sentence_text": "In the image, a person is standing in a room with a large number of boxes, some of which are stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 21, "sentence_text": "The person appears to be unpacking the boxes, possibly for a store or a delivery.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 21, "sentence_text": "There are several chairs in the room, with one near the person and others scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 21, "sentence_text": "A truck can be seen outside the room, possibly delivering the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 21, "sentence_text": "Additionally, there is a bottle located in the room, possibly for the person to drink from while unpacking the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 33, "sentence_text": "In the image, two people are standing on a sidewalk, one of them holding a ladder.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 33, "sentence_text": "They appear to be working on a project or task, possibly involving the use of the ladder.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 33, "sentence_text": "The scene also includes a truck parked nearby, a chair, and a dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 33, "sentence_text": "There are several boxes scattered around the area, which might be related to the ongoing work.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 33, "sentence_text": "Additionally, there is a bottle and a bowl visible in the scene, possibly indicating that the people are having a meal or drink during their work.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 41, "sentence_text": "In the image, two people are standing in a room, one of them wearing a red hoodie.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 41, "sentence_text": "They are engaged in a conversation, with one person holding a cell phone.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 41, "sentence_text": "The room is filled with various objects, including multiple chairs, a dining table, and a refrigerator.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 41, "sentence_text": "There are also several boxes scattered throughout the room, possibly containing items for storage or transportation.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 41, "sentence_text": "Additionally, a truck can be seen outside the room, possibly delivering goods or waiting for pickup.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 26, "sentence_text": "In the image, a woman is walking in front of a store with boxes and crates stacked outside.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 26, "sentence_text": "She is wearing a gray shirt and appears to be the main focus of the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 26, "sentence_text": "There are several chairs scattered around the area, with one near the center of the image and others towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 26, "sentence_text": "A dining table can be seen in the background, and a handbag is placed on the ground close to the woman.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 26, "sentence_text": "The overall setting seems to be an outdoor retail or storage area.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 23, "sentence_text": "In the image, a man is standing in a room, holding a box.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 23, "sentence_text": "The room is filled with various objects, including a chair, a dining table, and a potted plant.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 23, "sentence_text": "There are also several other people in the room, some of whom are wearing ties.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 23, "sentence_text": "Additionally, there is a truck visible in the background, and a clock on the wall.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 23, "sentence_text": "The scene appears to be a busy and lively environment.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 32, "sentence_text": "In the image, two people are working together in a room filled with boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 32, "sentence_text": "One person is standing closer to the left side of the room, while the other is positioned more towards the center.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 32, "sentence_text": "They appear to be unloading or organizing the boxes, which are scattered throughout the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 32, "sentence_text": "There are several chairs placed around the room, with one near the center, another closer to the right side, and a third one towards the left.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 32, "sentence_text": "Additionally, there is a truck visible in the background, likely used for transporting the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 77, "sentence_text": "In the image, a man is standing in a room with a variety of boxes and crates.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 77, "sentence_text": "There are several chairs placed around the room, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 77, "sentence_text": "A truck is visible outside the room, and a bicycle is parked nearby.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 77, "sentence_text": "The man appears to be wearing a white shirt and is possibly engaged in a conversation or activity related to the boxes and crates in the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 42, "sentence_text": "In the image, a man is bending over to pick up a box, possibly moving it into a truck.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 42, "sentence_text": "The scene takes place on a street with a truck parked nearby.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 42, "sentence_text": "There are several chairs scattered around the area, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 42, "sentence_text": "Additionally, there are multiple bottles and a bowl placed around the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 42, "sentence_text": "A backpack is also visible, possibly belonging to the man picking up the box.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 53, "sentence_text": "In the image, a person is standing on a sidewalk next to a building, possibly a store or a warehouse.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 53, "sentence_text": "The person is wearing a white shirt and appears to be looking at a box.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 53, "sentence_text": "There are several boxes scattered around the area, some of which are stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 53, "sentence_text": "Additionally, there is a chair located near the person, and a truck can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 53, "sentence_text": "The scene seems to be a busy urban environment with various objects and people present.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 84, "sentence_text": "The image depicts a store with a variety of items on display.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 84, "sentence_text": "There are several chairs placed throughout the store, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 84, "sentence_text": "A number of boxes are scattered around the store, with some placed on the floor and others on shelves.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 84, "sentence_text": "In the scene, there are three people visible.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 84, "sentence_text": "One person is standing near the center of the store, another is located closer to the right side, and the third person is situated near the left side of the image.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 84, "sentence_text": "Additionally, there is a bicycle parked in the background, and a car can be seen in the far right corner of the image.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 63, "sentence_text": "In the image, two people are standing on a sidewalk, engaged in conversation.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 63, "sentence_text": "One person is wearing a white shirt, while the other is wearing a grey shirt.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 63, "sentence_text": "They are both holding water bottles, with one person's bottle being red and the other's being blue.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 63, "sentence_text": "There is a chair nearby, possibly indicating an outdoor seating area.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 63, "sentence_text": "In the background, a car is parked, and a truck can be seen further away.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 63, "sentence_text": "Additionally, there is a sports ball visible in the scene, suggesting that the area might be used for recreational activities.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 64, "sentence_text": "In the image, two people are walking down a sidewalk, with one person closer to the left side and the other person more towards the center.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 64, "sentence_text": "They appear to be engaged in conversation.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 64, "sentence_text": "The sidewalk is lined with various objects, including a chair, a dining table, and a bicycle.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 64, "sentence_text": "There are also several boxes and a backpack placed along the sidewalk.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 64, "sentence_text": "A truck can be seen in the background, parked on the right side of the image.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 64, "sentence_text": "Additionally, there is a book visible in the scene, possibly placed on the dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 43, "sentence_text": "In the image, a man is walking down a sidewalk, carrying a box in his hand.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 43, "sentence_text": "The sidewalk is lined with various objects, including a chair, a dining table, and a potted plant.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 43, "sentence_text": "There are also several boxes scattered throughout the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 43, "sentence_text": "Additionally, there is a truck parked in the background, and a clock mounted on a wall.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 43, "sentence_text": "The man appears to be the main focus of the scene, as he navigates the sidewalk with his box.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 74, "sentence_text": "In the image, a man is standing in a room with several boxes stacked on the floor.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 74, "sentence_text": "He is wearing a white shirt and appears to be in the process of moving the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 74, "sentence_text": "There are also a few chairs in the room, one near the center and another towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 74, "sentence_text": "Additionally, there is a truck visible in the background, likely used for transporting the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 76, "sentence_text": "In the image, a man is standing in a room with a variety of boxes and crates.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 76, "sentence_text": "There are several chairs placed around the room, and a truck can be seen outside.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 76, "sentence_text": "The man appears to be in the process of moving items, possibly related to the boxes and crates.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 76, "sentence_text": "The scene also includes a dining table and a refrigerator, indicating that this room might be a part of a larger living space.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 47, "sentence_text": "In the image, a woman is walking on a sidewalk near a store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 47, "sentence_text": "She is wearing a gray shirt and appears to be looking at a box.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 47, "sentence_text": "The store has a variety of items displayed, including several chairs and a dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 47, "sentence_text": "There are also multiple boxes and a backpack visible in the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 47, "sentence_text": "Additionally, a car can be seen parked in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 71, "sentence_text": "The image depicts a cluttered room with various objects scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 71, "sentence_text": "There are several chairs placed throughout the room, and a dining table can be seen in the middle.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 71, "sentence_text": "A refrigerator is located on the left side of the room, and a microwave is placed above it.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 71, "sentence_text": "In the room, there are three people present.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 71, "sentence_text": "One person is standing near the left side of the room, another person is located in the middle, and the third person is standing closer to the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 71, "sentence_text": "Additionally, there are two bicycles in the room, one near the center and the other towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 71, "sentence_text": "A truck can be seen outside the room, partially visible on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 44, "sentence_text": "In the image, a man is standing on a sidewalk, holding a box in his hand.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 44, "sentence_text": "He appears to be a delivery person, possibly transporting goods to a nearby location.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 44, "sentence_text": "The scene also includes a truck parked in the background, which might be related to the delivery process.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 44, "sentence_text": "There are several chairs scattered around the area, possibly indicating an outdoor seating area or a temporary storage space.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 44, "sentence_text": "Additionally, there are a few bottles and a bowl placed on surfaces, suggesting that the location might be a place where people gather or eat.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 85, "sentence_text": "The image depicts a store with a variety of items on display.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 85, "sentence_text": "There are several boxes and crates scattered throughout the scene, some of which are stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 85, "sentence_text": "A chair is also visible in the store, placed near the center of the image.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 85, "sentence_text": "Additionally, there is a car parked outside the store, and a person can be seen standing near the left side of the image.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 85, "sentence_text": "The overall scene gives the impression of a busy store with various items for sale.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 59, "sentence_text": "In the image, a man is standing in a room with a cardboard box, possibly preparing to move items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 59, "sentence_text": "There are several chairs in the room, with one near the man and others scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 59, "sentence_text": "A truck can be seen outside the room, possibly for transportation purposes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 59, "sentence_text": "Additionally, there are multiple bottles and a bowl in the room, possibly indicating a recent gathering or event.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 61, "sentence_text": "In the image, two people are standing outside a store, possibly loading or unloading boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 61, "sentence_text": "One person is closer to the left side of the image, while the other is on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 61, "sentence_text": "They are surrounded by various objects, including a truck parked in the background, a chair, and a dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 61, "sentence_text": "There are also multiple boxes scattered around the scene, some of which are being loaded or unloaded by the people.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 61, "sentence_text": "Additionally, there is a bottle visible in the middle of the image, and a clock can be seen on the wall in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 66, "sentence_text": "In the image, a woman is standing on a sidewalk next to a street.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 66, "sentence_text": "She is wearing a white shirt and appears to be walking.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 66, "sentence_text": "There are several boxes and a chair placed on the sidewalk, possibly indicating a recent delivery or an ongoing outdoor event.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 66, "sentence_text": "A truck can be seen parked further down the street, and a bicycle is located closer to the woman.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 66, "sentence_text": "Additionally, there is a book visible in the scene, possibly left behind by someone or part of an outdoor reading event.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 49, "sentence_text": "The image depicts a store with a variety of items on display.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 49, "sentence_text": "There are several chairs placed throughout the store, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 49, "sentence_text": "A person is standing near the chairs, possibly browsing the items for sale.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 49, "sentence_text": "In addition to the chairs, there are multiple boxes and a backpack placed around the store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 49, "sentence_text": "A car is visible in the background, parked outside the store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 49, "sentence_text": "The scene is bustling with activity, showcasing the store's offerings and the people visiting the location.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 69, "sentence_text": "The image depicts a store with a variety of items on display.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 69, "sentence_text": "There are several chairs placed throughout the store, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 69, "sentence_text": "A refrigerator is also visible in the store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 69, "sentence_text": "In addition to the furniture, there are multiple bottles scattered throughout the scene, as well as a few bowls placed on surfaces.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 69, "sentence_text": "A person can be seen in the store, possibly browsing or working.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 69, "sentence_text": "The overall scene is a mix of retail and home furnishings, creating a cozy and inviting atmosphere.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 65, "sentence_text": "In the image, two people are walking down a street, with one person closer to the left side and the other person on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 65, "sentence_text": "They appear to be engaged in conversation.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 65, "sentence_text": "The street is lined with various objects, including a truck parked on the right side, a chair located near the center, and a backpack placed on the ground closer to the left person.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 65, "sentence_text": "There are also two bowls, one near the center and the other closer to the left person.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 65, "sentence_text": "Additionally, a bottle can be seen on the right side of the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 73, "sentence_text": "In the image, a man is walking down a street, carrying a large number of boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 73, "sentence_text": "The boxes are of various sizes and are stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 73, "sentence_text": "There are also several chairs scattered throughout the scene, with some placed near the man and others further away.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 73, "sentence_text": "Additionally, there is a truck visible in the background, possibly used for transporting the boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 73, "sentence_text": "The man appears to be the main focus of the scene, as he navigates the street with his boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 62, "sentence_text": "In the image, two people are standing on a sidewalk, one of them is holding a box.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 62, "sentence_text": "They appear to be in a store or a similar setting.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 62, "sentence_text": "The store has a variety of items, including several chairs and a dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 62, "sentence_text": "There are also multiple bicycles parked outside the store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 62, "sentence_text": "The scene also includes a car and a truck, with the car being parked further away from the store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 62, "sentence_text": "Additionally, there is a clock visible in the background, and a cell phone can be seen in the hands of one of the people.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 81, "sentence_text": "A man is walking down a sidewalk in front of a store, possibly a restaurant or a shop.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 81, "sentence_text": "He is wearing a backpack and appears to be the main subject of the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 81, "sentence_text": "There are several chairs and dining tables scattered around the area, suggesting that the store may have a seating area for customers.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 81, "sentence_text": "A motorcycle is parked nearby, and a truck can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 81, "sentence_text": "Additionally, there are multiple bottles and a bowl placed around the scene, possibly indicating that the store sells beverages or food items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 67, "sentence_text": "In the image, there is a person standing in a room with a red cord hanging from the ceiling.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 67, "sentence_text": "The room appears to be a store or a warehouse, as there are several boxes and crates scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 67, "sentence_text": "Some of these boxes are stacked on top of each other, while others are placed on the floor.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 67, "sentence_text": "Additionally, there is a chair located in the middle of the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 67, "sentence_text": "The person in the room seems to be observing the red cord hanging from the ceiling, possibly inspecting or fixing it.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 68, "sentence_text": "In the image, a person is standing in a room with a red cord hanging from the ceiling.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 68, "sentence_text": "The room appears to be a storage area, as there are several boxes and a chair present.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 68, "sentence_text": "A truck can be seen outside the room, and a bicycle is parked nearby.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 68, "sentence_text": "Additionally, there are two other people in the scene, one standing closer to the left side and the other near the center.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 68, "sentence_text": "A handbag is also visible in the room, placed near the person standing in the center.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 78, "sentence_text": "In the image, a man is walking past a store with boxes and crates on the sidewalk.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 78, "sentence_text": "There are several chairs and a dining table placed outside the store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 78, "sentence_text": "A truck is parked nearby, and a car is visible in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 78, "sentence_text": "The man is wearing a backpack, and there is a handbag placed on the ground.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 78, "sentence_text": "The scene appears to be set in an urban environment with various objects and vehicles present.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 48, "sentence_text": "In the image, a woman is walking past a store with boxes and crates outside.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 48, "sentence_text": "She is wearing a white shirt and a blue skirt.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 48, "sentence_text": "The store has a variety of items, including a chair, a dining table, and a refrigerator.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 48, "sentence_text": "There are also several bottles scattered around the area.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 48, "sentence_text": "Additionally, there is a car parked nearby, and a truck can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 48, "sentence_text": "The scene captures a moment of everyday life with people going about their daily activities.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 72, "sentence_text": "In the image, a woman is walking down a sidewalk with a handbag, while a truck is parked nearby.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 72, "sentence_text": "There are several chairs and a dining table in the scene, suggesting an outdoor dining area.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 72, "sentence_text": "Additionally, there are multiple boxes and a backpack, indicating that the area might be a storage or delivery location.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 72, "sentence_text": "A person is also present in the scene, possibly a worker or a customer.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 72, "sentence_text": "The presence of a car and a bicycle further adds to the diversity of transportation methods in the image.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 46, "sentence_text": "In the image, there are two people standing outside a store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 46, "sentence_text": "One person is closer to the left side of the image, while the other person is on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 46, "sentence_text": "Both individuals are wearing backpacks, with one backpack being larger and more prominent than the other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 46, "sentence_text": "The store appears to be a shop selling various items, as evidenced by the presence of multiple chairs and a dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 46, "sentence_text": "There are also several bottles scattered throughout the scene, possibly indicating that the store sells beverages.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 46, "sentence_text": "Additionally, a car can be seen in the background, parked near the store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 70, "sentence_text": "The image depicts a store with a variety of items on display.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 70, "sentence_text": "There are several chairs placed throughout the store, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 70, "sentence_text": "A large number of boxes are scattered around the store, with some placed on the floor and others stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 70, "sentence_text": "Additionally, there are multiple bottles and a bowl visible in the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 70, "sentence_text": "A person can be seen in the background, possibly browsing the store or attending to the items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 70, "sentence_text": "The overall atmosphere suggests a busy retail environment.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 54, "sentence_text": "In the image, a young boy is standing in a room with a red rope hanging from the ceiling.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 54, "sentence_text": "The room appears to be a storage area, as there are several boxes and a chair placed throughout the space.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 54, "sentence_text": "A truck can be seen outside the room, and a bicycle is parked nearby.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 54, "sentence_text": "Additionally, there are two other people in the room, one of whom is wearing a backpack.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 54, "sentence_text": "The scene also includes a dining table and a refrigerator, further indicating that this is a storage area or a similar space.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 85, "sentence_text": "The image depicts a store with a variety of items on display.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 85, "sentence_text": "There are several boxes and crates scattered throughout the scene, some of which are stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 85, "sentence_text": "A chair is also visible in the middle of the store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 85, "sentence_text": "In addition to the store items, there are two people present in the scene, one located towards the left side and the other towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 85, "sentence_text": "A truck can be seen in the background, parked outside the store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 45, "sentence_text": "In the image, a man is walking down a street, carrying a box on his head.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 45, "sentence_text": "The street is lined with various objects, including a truck parked on the right side, a chair located in the middle, and a bench on the left side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 45, "sentence_text": "There are also several bottles scattered throughout the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 45, "sentence_text": "Additionally, there are two other people in the background, one closer to the left side and the other near the center.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 45, "sentence_text": "The man carrying the box appears to be the main focus of the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 83, "sentence_text": "The image depicts a store with a variety of items on display.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 83, "sentence_text": "There are several chairs placed throughout the store, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 83, "sentence_text": "A large number of boxes are scattered around the store, with some placed on the floor and others stacked on top of each other.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 83, "sentence_text": "Additionally, there are multiple bottles and a bowl visible in the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 83, "sentence_text": "A person can be seen in the background, possibly browsing the store or attending to the items.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 83, "sentence_text": "The overall atmosphere suggests a busy retail environment.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 51, "sentence_text": "The image depicts a store with a variety of items on display.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 51, "sentence_text": "There are several chairs placed throughout the store, and a dining table can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 51, "sentence_text": "A bicycle is parked outside the store, and a truck is visible in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 51, "sentence_text": "There are multiple people in the store, some of whom are wearing ties.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 51, "sentence_text": "The store has a variety of items on display, including a vase and a clock.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 51, "sentence_text": "Additionally, there are several books scattered throughout the store, and a handbag can be seen on the floor.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 52, "sentence_text": "The image depicts a cluttered room with various objects scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 52, "sentence_text": "There are several chairs placed throughout the room, and a dining table can be seen in the middle.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 52, "sentence_text": "A refrigerator is located on the left side of the room, and a microwave is placed above it.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 52, "sentence_text": "In the room, there are three people present.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 52, "sentence_text": "One person is standing near the left side of the room, another person is located in the middle, and the third person is standing closer to the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 52, "sentence_text": "Additionally, there are two bicycles in the room, one near the center and the other towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 52, "sentence_text": "A truck can be seen outside the room, partially visible on the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 58, "sentence_text": "In the image, a man is standing on a sidewalk next to a building, possibly a store or a warehouse.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 58, "sentence_text": "He is wearing a white shirt and appears to be looking at a box.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 58, "sentence_text": "There are several chairs scattered around the area, and a truck is parked nearby.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 58, "sentence_text": "Additionally, there are multiple boxes and a backpack in the scene, suggesting that the man might be involved in some sort of delivery or transportation.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 75, "sentence_text": "A man is walking in front of a store, carrying boxes.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 75, "sentence_text": "The store has a variety of items, including a bicycle, a motorcycle, and a car.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 75, "sentence_text": "There are also several chairs and a dining table visible in the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 75, "sentence_text": "The man appears to be wearing a uniform, and there is a clock on the wall.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 75, "sentence_text": "Additionally, there are several bottles scattered throughout the scene, and a cell phone can be seen in the background.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 57, "sentence_text": "A man is walking down a sidewalk, passing by a store with boxes and crates stacked outside.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 57, "sentence_text": "There are several chairs and a dining table visible in the scene, suggesting an outdoor seating area.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 57, "sentence_text": "A truck is parked nearby, and a bottle can be seen on the ground.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 57, "sentence_text": "The man appears to be wearing a backpack, and there is a bicycle parked further down the sidewalk.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 55, "sentence_text": "In the image, a man is standing outside a store, possibly a restaurant or a shop, with a red rope hanging from the ceiling.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 55, "sentence_text": "He appears to be looking at the rope, possibly considering whether to enter the store or not.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 55, "sentence_text": "The store has a variety of items displayed, including several chairs and a dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 55, "sentence_text": "There are also a few bottles and a bowl visible in the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 55, "sentence_text": "The man is wearing a white shirt, and the overall atmosphere suggests a casual and relaxed setting.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 80, "sentence_text": "In the image, a man is walking down a sidewalk, possibly on a street, with a handbag in his hand.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 80, "sentence_text": "There are several chairs and boxes scattered around the area, possibly indicating a store or a market.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 80, "sentence_text": "A truck can be seen in the background, and a motorcycle is parked nearby.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 80, "sentence_text": "Additionally, there are a few bottles and a bowl placed around the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 80, "sentence_text": "The presence of these objects and the man's attire suggest that this could be a busy urban setting.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 82, "sentence_text": "In the image, a person is walking on a sidewalk near a store.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 82, "sentence_text": "The store has a variety of items displayed, including several chairs and a dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 82, "sentence_text": "There are also multiple boxes and a backpack visible in the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 82, "sentence_text": "A truck can be seen parked on the street, and a bicycle is located close to the person walking.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 82, "sentence_text": "The overall setting appears to be a busy urban environment with various objects and activities taking place.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 50, "sentence_text": "The image depicts a cluttered room with various objects scattered around.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 50, "sentence_text": "There are several chairs placed throughout the room, with one near the center and another towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 50, "sentence_text": "A dining table can be seen in the background, along with a refrigerator on the left side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 50, "sentence_text": "A person is standing in the room, possibly organizing the space.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 50, "sentence_text": "There are multiple boxes and bags placed around the room, with some near the center and others closer to the edges.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 50, "sentence_text": "A couple of bottles are also visible, one near the center and the other towards the right side.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 50, "sentence_text": "Additionally, a car can be seen in the background, parked outside the room.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 79, "sentence_text": "In the image, a young man is standing on a sidewalk near a store, possibly waiting for someone or just passing by.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 79, "sentence_text": "He is wearing a yellow shirt and a backpack.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 79, "sentence_text": "The store has a variety of items displayed outside, including several chairs and a dining table.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 79, "sentence_text": "There are also multiple boxes and a truck parked nearby.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 79, "sentence_text": "Additionally, there is a bicycle parked further back in the scene.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 79, "sentence_text": "The overall setting appears to be a busy urban area with various activities taking place.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 60, "sentence_text": "In the image, a man is standing on a sidewalk next to a box, possibly preparing to move it.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 60, "sentence_text": "There are several chairs and a dining table nearby, suggesting an outdoor dining area.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 60, "sentence_text": "A truck is parked in the background, and a couple of bottles can be seen on the ground.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 60, "sentence_text": "Additionally, there is a bird in the scene, adding a touch of nature to the urban setting.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 56, "sentence_text": "In the image, a young boy is walking down a sidewalk, possibly in a shopping area.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 56, "sentence_text": "He is wearing a white shirt and appears to be looking at something in his hand.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 56, "sentence_text": "There are several chairs and a dining table in the scene, suggesting a possible outdoor dining area.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 56, "sentence_text": "Additionally, there are multiple boxes and a backpack, indicating that the area might be a storage or delivery location.", "fps": 12, "skipFrameCount": 24}, {"frame_index": 56, "sentence_text": "A truck can be seen in the background, possibly delivering goods to the area.", "fps": 12, "skipFrameCount": 24}]