diff --git "a/Large/Gemini/CommonsenseQA.json" "b/Large/Gemini/CommonsenseQA.json" new file mode 100644--- /dev/null +++ "b/Large/Gemini/CommonsenseQA.json" @@ -0,0 +1,6392 @@ +[ + { + "question": "A revolving door is convenient for two direction travel, but it also serves as a security measure at a what?", + "gold_answer": "bank", + "os_answer": "Bank", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What do people aim to do at work?", + "gold_answer": "complete job", + "os_answer": "* Earn a living\n* Contribute to society\n* Develop their skills and knowledge\n* Achieve their goals\n* Make a difference", + "os_eval": "Correct", + "mcq_answer": "A. complete job", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find magazines along side many other printed works?", + "gold_answer": "bookstore", + "os_answer": "Library", + "os_eval": "Incorrect", + "mcq_answer": "B. bookstore", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where are you likely to find a hamburger?", + "gold_answer": "fast food restaurant", + "os_answer": "A fast-food restaurant", + "os_eval": "Correct", + "mcq_answer": "A. fast food restaurant", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "James was looking for a good place to buy farmland. Where might he look?", + "gold_answer": "midwest", + "os_answer": "- Real estate agent\n- Farm auctions\n- Online marketplaces\n- Agricultural magazines\n- Local farmers", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "In what Spanish speaking North American country can you get a great cup of coffee?", + "gold_answer": "mexico", + "os_answer": "Mexico", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do animals do when an enemy is approaching?", + "gold_answer": "listen to each other", + "os_answer": "* Run away\n* Hide\n* Attack\n* Play dead\n* Make themselves look bigger", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Reading newspaper one of many ways to practice your what?", + "gold_answer": "literacy", + "os_answer": "Reading comprehension", + "os_eval": "Incorrect", + "mcq_answer": "A. literacy", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do people typically do while playing guitar?", + "gold_answer": "singing", + "os_answer": "* Strumming or picking the strings\n* Using a pick or their fingers\n* Changing chords\n* Reading music or tabs\n* Singing or humming along", + "os_eval": "Correct", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you want harmony, what is something you should try to do with the world?", + "gold_answer": "make peace", + "os_answer": "Be understanding of others", + "os_eval": "Correct", + "mcq_answer": "D. make peace", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Aside from water and nourishment what does your dog need?", + "gold_answer": "lots of attention", + "os_answer": "- Exercise\n- Attention\n- Affection\n- Mental stimulation\n- Grooming\n- Health care", + "os_eval": "Correct", + "mcq_answer": "D. lots of attention", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A fencing thrust with a sharp sword towards a person would result in what?", + "gold_answer": "injury", + "os_answer": "Injury or death", + "os_eval": "Correct", + "mcq_answer": "E. puncture wound", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Unlike a spider and his many sight seers, people only have what?", + "gold_answer": "tongues", + "os_answer": "Two eyes", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do adults use glue sticks?", + "gold_answer": "office", + "os_answer": "Home improvement projects, crafting, scrapbooking, office work, sealing envelopes", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is someone who isn't clever, bright, or competent called?", + "gold_answer": "clumsy", + "os_answer": "Unintelligent", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Blue read material outside of his comfort zone because he wanted to gain what?", + "gold_answer": "new perspective", + "os_answer": "Knowledge and understanding", + "os_eval": "Incorrect", + "mcq_answer": "A. new perspective", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Committing perjury is a serious what?", + "gold_answer": "crime", + "os_answer": "Crime", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you are prone to postpone work what will you have to do in order to finish on time?", + "gold_answer": "hasten", + "os_answer": "* Prioritize tasks and focus on the most important ones first.\n* Break down large tasks into smaller, more manageable chunks.\n* Set realistic deadlines and stick to them.\n* Eliminate distractions and create a dedicated workspace.\n* Reward yourself for completing tasks on time.\n* Seek support from others if needed.", + "os_eval": "Incorrect", + "mcq_answer": "B. hasten", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "James wanted to find an old underground map from the 50s. Where might he look for one?", + "gold_answer": "library", + "os_answer": "- Antique stores\n- Flea markets\n- Historical societies\n- Local libraries\n- Online auction sites", + "os_eval": "Correct", + "mcq_answer": "A. library", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would a person be doing when having to wait their turn?", + "gold_answer": "stand in line", + "os_answer": "Queue or line", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "She was always helping at the senior center, it brought her what?", + "gold_answer": "satisfaction", + "os_answer": "Joy", + "os_eval": "Incorrect", + "mcq_answer": "A. satisfaction", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Who is a police officer likely to work for?", + "gold_answer": "city", + "os_answer": "Government", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you have leftover cake, where would you put it?", + "gold_answer": "refrigerator", + "os_answer": "Cake keeper or airtight container", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a doormat likely to be in front of?", + "gold_answer": "front door", + "os_answer": "An entrance", + "os_eval": "Correct", + "mcq_answer": "B. front door", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Bob the lizard lives in a warm place with lots of water. Where does he probably live?", + "gold_answer": "tropical rainforest", + "os_answer": "A desert", + "os_eval": "Incorrect", + "mcq_answer": "B. tropical rainforest", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "August needed money because he was afraid that he'd be kicked out of his house. What did he need money to do?", + "gold_answer": "pay bills", + "os_answer": "Pay rent", + "os_eval": "Incorrect", + "mcq_answer": "B. pay bills", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you put a picture frame when it's not hung vertically?", + "gold_answer": "art show", + "os_answer": "Horizontally", + "os_eval": "Incorrect", + "mcq_answer": "E. table", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "James knew that he shouldn't have been buying beer for minors. He didn't even get paid for it. Why was this bad?", + "gold_answer": "broken law", + "os_answer": "James' actions were bad because:\n\n* **It is illegal to sell or provide alcohol to minors.** Selling or providing alcohol to minors is a crime in most jurisdictions. James could face fines, jail time, or both if he is caught.\n* **It is dangerous to minors.** Alcohol can have harmful effects on the developing brains and bodies of minors. It can lead to alcohol poisoning, accidents, and other health problems.\n* **It sets a bad example.** James is an adult, and minors may look up to him. By buying alcohol for minors, he is sending the message that it is okay to drink underage.\n* **It can lead to addiction.** Alcoholism is a serious problem that can ruin lives. By providing alcohol to minors, James is increasing the risk that they will develop an addiction.", + "os_eval": "Correct", + "mcq_answer": "D. broken law", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Because John was first violin, he had to bring something important to work ever day. What did he need to bring to work?", + "gold_answer": "music store", + "os_answer": "His violin", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can a human find clothes that aren't pants?", + "gold_answer": "dress shop", + "os_answer": "A store", + "os_eval": "Correct", + "mcq_answer": "C. dress shop", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When a person is beginning work, what are they building?", + "gold_answer": "momentum", + "os_answer": "Experience", + "os_eval": "Incorrect", + "mcq_answer": "D. momentum", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A child wants to play, what would they likely want?", + "gold_answer": "play tag", + "os_answer": "Toys or games", + "os_eval": "Incorrect", + "mcq_answer": "C. play tag", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The teacher doesn't tolerate noise during a test in their what?", + "gold_answer": "movie theatre", + "os_answer": "Classroom", + "os_eval": "Incorrect", + "mcq_answer": "E. classroom", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If there is a place that is hot and arid, what could it be?", + "gold_answer": "lifeless", + "os_answer": "A desert", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you are in a bar in a glove shaped state where are you?", + "gold_answer": "michigan", + "os_answer": "Wisconsin", + "os_eval": "Incorrect", + "mcq_answer": "B. michigan", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Crabs live in what sort of environment?", + "gold_answer": "saltwater", + "os_answer": "Water", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you find a snake in tall grass?", + "gold_answer": "feild", + "os_answer": "Slithering", + "os_eval": "Incorrect", + "mcq_answer": "D. feild", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a human likely to go as a result of being hungry?", + "gold_answer": "eat in restaurant", + "os_answer": "Restaurant", + "os_eval": "Correct", + "mcq_answer": "A. eat in restaurant", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find a single shower curtain being used?", + "gold_answer": "bathtub", + "os_answer": "In a bathroom", + "os_eval": "Incorrect", + "mcq_answer": "D. shower stall", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a good idea but not required to have a fire extinguisher?", + "gold_answer": "house", + "os_answer": "Kitchen", + "os_eval": "Correct", + "mcq_answer": "C. house", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What continent has the most castles?", + "gold_answer": "europe", + "os_answer": "Europe", + "os_eval": "Correct", + "mcq_answer": "D. europe", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you have to read a book that is very dry and long you may become what?", + "gold_answer": "have time", + "os_answer": "Bored", + "os_eval": "Incorrect", + "mcq_answer": "E. bored", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Sally used a clipboard to hold her papers while she read off names at the beginning of the day. Where might she work?", + "gold_answer": "desk", + "os_answer": "- School", + "os_eval": "Incorrect", + "mcq_answer": "E. school", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Despite the name a pawn can be quite versatile, all the parts are important in a what?", + "gold_answer": "chess game", + "os_answer": "Chess", + "os_eval": "Correct", + "mcq_answer": "A. chess game", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What would not be true about a basketball if it had a hole in it but it did not lose its general shape?", + "gold_answer": "full of air", + "os_answer": "It would not be able to bounce.", + "os_eval": "Incorrect", + "mcq_answer": "C. full of air", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you are awaking multiple times throughout the night because a lot is on your mind, what is a likely cause?", + "gold_answer": "depression", + "os_answer": "Stress or anxiety", + "os_eval": "Incorrect", + "mcq_answer": "B. depression", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where does a wild bird usually live?", + "gold_answer": "countryside", + "os_answer": "In a nest", + "os_eval": "Incorrect", + "mcq_answer": "C. countryside", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you expect to find white mice?", + "gold_answer": "bell cat", + "os_answer": "Laboratory", + "os_eval": "Incorrect", + "mcq_answer": "E. laboratory", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "John felt that his actions were fate. Harry said that he could have always made a different what?", + "gold_answer": "choice", + "os_answer": "Choice", + "os_eval": "Correct", + "mcq_answer": "B. choice", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What could committing murder prevent someone from doing?", + "gold_answer": "find god", + "os_answer": "* Going to prison\n* Getting a job\n* Starting a family\n* Having a normal life", + "os_eval": "Incorrect", + "mcq_answer": "A. go to jail", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "George didn't have a car, but he still had his two feet. His socks were smelly and his soles were blistered, but that didn't matter. He could still do what?", + "gold_answer": "walk", + "os_answer": "Walk", + "os_eval": "Correct", + "mcq_answer": "B.", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you put uncooked crab meat?", + "gold_answer": "wharf", + "os_answer": "In the refrigerator", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The man had a fear of illness, so he never visited friends who were a what?", + "gold_answer": "sick person", + "os_answer": "Sick", + "os_eval": "Correct", + "mcq_answer": "A. sick person", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Which large land mass is home to the most monkeys?", + "gold_answer": "amazon basin", + "os_answer": "South America", + "os_eval": "Correct", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "You'll find a landing at the top of what?", + "gold_answer": "stairwell", + "os_answer": "Stairs", + "os_eval": "Correct", + "mcq_answer": "C. stairwell", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you find a number of wind instruments together in public?", + "gold_answer": "music store", + "os_answer": "At a concert band performance", + "os_eval": "Incorrect", + "mcq_answer": "E. symphony", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "A mountie got off at a subway stop. What city might he be in?", + "gold_answer": "urban area", + "os_answer": "Ottawa", + "os_eval": "Incorrect", + "mcq_answer": "E. toronto", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Billy set aside a block of time for having fun after work. Why might he do this?", + "gold_answer": "stress relief", + "os_answer": "To relieve stress, engage in enjoyable activities, and recharge for the next day.", + "os_eval": "Correct", + "mcq_answer": "B. stress relief", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The man in the white suit was very lazy. He did nothing useful. Meanwhile, the ban in the blue had put in effort and was very what?", + "gold_answer": "productive", + "os_answer": "Hardworking", + "os_eval": "Correct", + "mcq_answer": "D. productive", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What would you be unable to do if you have too much greed?", + "gold_answer": "make friends", + "os_answer": "Control your desires", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "I did not need a servant. I was not a what?", + "gold_answer": "rich person", + "os_answer": "Millionaire", + "os_eval": "Correct", + "mcq_answer": "C. hired help", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "How would you get from one side of a canal to another?", + "gold_answer": "bridge", + "os_answer": "There are several ways to get from one side of a canal to another:\n\n- Use a bridge: If there is a bridge crossing the canal, you can simply walk, cycle, or drive across it.\n\n- Use a ferry: If there is a ferry service operating on the canal, you can board the ferry and it will take you to the other side.\n\n- Use a boat or canoe: If you have access to a boat or canoe, you can row or paddle across the canal.\n\n- Swim across: If the canal is narrow enough and the water conditions are safe, you can swim across it.\n\n- Use a zip line: In some cases, there may be a zip line installed across the canal that you can use to cross.", + "os_eval": "Correct", + "mcq_answer": "D. bridge", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When learning about the world and different cultures, what is important if you are committed to eliminating preconceived notions", + "gold_answer": "open mind", + "os_answer": "Be open-minded and willing to challenge your own assumptions.", + "os_eval": "Correct", + "mcq_answer": "D. open mind", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "While washing clothes they became what when caught on the sharp object?", + "gold_answer": "torn", + "os_answer": "Torn", + "os_eval": "Correct", + "mcq_answer": "D. torn", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What would encourage someone to continue playing tennis?", + "gold_answer": "becoming tired", + "os_answer": "* Enjoyment of the sport\n* Competitive spirit\n* Desire for physical activity\n* Social interaction with other players\n* Improved physical and mental health\n* Goal-oriented mindset\n* Previous successes or accomplishments in tennis\n* External motivation (e.g., rewards, recognition)\n* Sense of community or belonging within the tennis community\n* Stress relief and mental well-being", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What regions of a town would you have found a dime store?", + "gold_answer": "small neighborhood", + "os_answer": "- Downtown area\n- Shopping malls\n- Neighborhood commercial districts", + "os_eval": "Incorrect", + "mcq_answer": "A. commercial building", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where might an unused chess set be stored?", + "gold_answer": "toy store", + "os_answer": "* In a closet\n* In a drawer\n* In a box\n* In a cabinet\n* Under a bed", + "os_eval": "Incorrect", + "mcq_answer": "D. attic", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "james told his son to settle down and be careful. There were many frogs mating in the area, and James didn't want his son to do what to them?", + "gold_answer": "disturb", + "os_answer": "Step on them", + "os_eval": "Incorrect", + "mcq_answer": "D. disturb", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A man wants air conditioning while we watches the game on Saturday, where will it likely be installed?", + "gold_answer": "house", + "os_answer": "Living room", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Sailors drive many different types of boats, what type of boat involves their namesake.", + "gold_answer": "coming home", + "os_answer": "Sailboat", + "os_eval": "Incorrect", + "mcq_answer": "E. sail boat", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where could a person avoid the rain?", + "gold_answer": "synagogue", + "os_answer": "1. Under an umbrella\n2. Inside a building\n3. Under a tree\n4. In a car", + "os_eval": "Incorrect", + "mcq_answer": "B. tunnel", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Why would a person like to have a large house?", + "gold_answer": "have choice", + "os_answer": "* **Status symbol:** A large house can be seen as a sign of wealth and success, which can boost a person's social status.\n* **Space:** A large house provides more space for a growing family, entertaining guests, or pursuing hobbies and interests.\n* **Privacy:** A large house can offer more privacy, as it provides more space between the occupants and their neighbors.\n* **Investment:** A large house can be a valuable investment, as it is likely to appreciate in value over time.\n* **Comfort:** A large house can provide more comfort, as it allows for more space and amenities, such as multiple bedrooms, bathrooms, and living areas.\n* **Legacy:** A large house can be a legacy that can be passed down to future generations.\n* **Aesthetics:** Some people simply prefer the look and feel of a large house.", + "os_eval": "Incorrect", + "mcq_answer": "E. lots of space", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Who do professors work with?", + "gold_answer": "school students", + "os_answer": "Students", + "os_eval": "Correct", + "mcq_answer": "B. teach courses", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Colorful anemone look somewhat like what object you find on window sills?", + "gold_answer": "flower bed", + "os_answer": "Flower pots", + "os_eval": "Incorrect", + "mcq_answer": "D. flower bed", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The hikers stopped to have a drink, simply put they what?", + "gold_answer": "were thirsty", + "os_answer": "Took a break", + "os_eval": "Incorrect", + "mcq_answer": "C. refreshment", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "When you get up in the morning before you begin work you should do what?", + "gold_answer": "shower", + "os_answer": "Make your bed", + "os_eval": "Incorrect", + "mcq_answer": "D. shower", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The kitten had nothing to dig it's claws into, so when it tried to stop it slid across what?", + "gold_answer": "floor", + "os_answer": "Smooth surface", + "os_eval": "Correct", + "mcq_answer": "D. carpet", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If a person is trying to keep something in their hand what should they do?", + "gold_answer": "complete collection", + "os_answer": "Squeeze or grip it tightly", + "os_eval": "Incorrect", + "mcq_answer": "E. have to hold", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Playing baseball is a lot like any other sport, there is always a risk of what?", + "gold_answer": "injury", + "os_answer": "Injury", + "os_eval": "Correct", + "mcq_answer": "D. injury", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If I want to watch a movie without leaving my home what might I use?", + "gold_answer": "television", + "os_answer": "Streaming service", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does a successful dog grooming session likely to make a owner feel?", + "gold_answer": "satisfaction", + "os_answer": "Happy and satisfied", + "os_eval": "Correct", + "mcq_answer": "D. satisfaction", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The runner was in third place, but he pushed harder and thought he might be able to reach second. What was beginning to do?", + "gold_answer": "gain ground", + "os_answer": "Accelerate", + "os_eval": "Incorrect", + "mcq_answer": "D. gain ground", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The tourist entered Mammoth cave, what state were they in?", + "gold_answer": "kentucky", + "os_answer": "Kentucky", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does someone typically feel when applying for a job?", + "gold_answer": "anxiety and fear", + "os_answer": "Nervousness, hopefulness, anticipation, uncertainty", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What kind of feelings does buying presents for others create?", + "gold_answer": "tears", + "os_answer": "Buying presents for others can create a variety of feelings, including:\n\n- Joy: Giving gifts can be a selfless act that brings joy to both the giver and the recipient. It can be a way to show someone that you care about them and appreciate them.\n- Love: Buying gifts for someone you love can be a way to express your affection and make them feel special. It can also be a way to show them that you are thinking of them.\n- Gratitude: Buying gifts for someone who has done something nice for you can be a way to show your gratitude and appreciation. It can also be a way to show them that you value their friendship or relationship.\n- Guilt: If you feel obligated to buy a gift for someone, it can create feelings of guilt. This can happen if you don't have the money to buy a gift, or if you don't know what to buy.\n- Stress: Buying gifts can be stressful, especially if you are trying to find the perfect gift. It can also be stressful if you are on a tight budget.", + "os_eval": "Incorrect", + "mcq_answer": "E. make happy", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What green area is a marmot likely to be found in?", + "gold_answer": "countryside", + "os_answer": "Alpine meadow", + "os_eval": "Incorrect", + "mcq_answer": "A. countryside", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Jan tested the current, and noticed that it was high. He thought that the wires might have too much what?", + "gold_answer": "resistance", + "os_answer": "Resistance", + "os_eval": "Correct", + "mcq_answer": "D. resistance", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does a kindergarten teacher do before nap time?", + "gold_answer": "lower expectations", + "os_answer": "Reads a story", + "os_eval": "Incorrect", + "mcq_answer": "E. tell story", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "To play sports professionally you must do what very often?", + "gold_answer": "practice", + "os_answer": "Practice", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What will a person going for a jog likely be wearing?", + "gold_answer": "comfortable clothes", + "os_answer": "Comfortable clothing, such as:\n- Jogging pants or shorts\n- T-shirt or tank top\n- Running shoes", + "os_eval": "Correct", + "mcq_answer": "C. comfortable clothes", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The child pretended he was reading newspaper, he couldn't actually do it without what?", + "gold_answer": "patience", + "os_answer": "Literacy", + "os_eval": "Incorrect", + "mcq_answer": "E. knowing how to read", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Jenny enjoyed helping people. It brought her a great deal of what?", + "gold_answer": "satisfaction", + "os_answer": "Satisfaction", + "os_eval": "Correct", + "mcq_answer": "A. satisfaction", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find a basement that can be accessed with an elevator?", + "gold_answer": "office building", + "os_answer": "A parking garage", + "os_eval": "Incorrect", + "mcq_answer": "D. office building", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "He was at the gym trying to build muscle, what is it called that he is trying to build muscle on?", + "gold_answer": "body of animal", + "os_answer": "Body", + "os_eval": "Correct", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The man was going fishing instead of work, what is he seeking?", + "gold_answer": "relaxation", + "os_answer": "Escape", + "os_eval": "Correct", + "mcq_answer": "B. relaxation", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find a large dining room containing a fancy chandelier?", + "gold_answer": "mansion", + "os_answer": "A ballroom", + "os_eval": "Incorrect", + "mcq_answer": "E. restaurant", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The extremely large cargo plane could only land at a specialized runway, these were only located at a what?", + "gold_answer": "military base", + "os_answer": "Military base or airport", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "How can someone be let into a brownstone?", + "gold_answer": "ring", + "os_answer": "* Using a key\n* Using a buzzer\n* Using an intercom\n* Being buzzed in by someone inside\n* Using a security code", + "os_eval": "Incorrect", + "mcq_answer": "B. ring", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would someone purchase an upright piano?", + "gold_answer": "music store", + "os_answer": "Music store", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Diving into backyard pools can be very dangerous and can lead to serious head and what?", + "gold_answer": "going somewhere", + "os_answer": "Neck injuries", + "os_eval": "Incorrect", + "mcq_answer": "E. spinal injuries", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would one find a snake in a cage?", + "gold_answer": "pet store", + "os_answer": "At a zoo or reptile park", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When you fail to finish something, you failed at doing what to it", + "gold_answer": "completing", + "os_answer": "Complete", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "John didn't care about style. He felt that form was less important than what?", + "gold_answer": "function", + "os_answer": "Function", + "os_eval": "Correct", + "mcq_answer": "C. function", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When you get together with friends to watch film, you might do plenty of this?", + "gold_answer": "have fun", + "os_answer": "Talking", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A supermarket is uncommon in what type of collection of shops?", + "gold_answer": "strip mall", + "os_answer": "A strip mall", + "os_eval": "Incorrect", + "mcq_answer": "E. vermont", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Before racers start to run they must do what at the starting line?", + "gold_answer": "learn to walk", + "os_answer": "Get set", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a person called who doesn't have immortality?", + "gold_answer": "mortal", + "os_answer": "Mortal", + "os_eval": "Correct", + "mcq_answer": "E. mortal", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If chewing food is difficult for you, what is a possible reason?", + "gold_answer": "sore mouth", + "os_answer": "Dental problems (such as cavities, gum disease, or a cracked tooth)", + "os_eval": "Correct", + "mcq_answer": "B. sore mouth", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can children play with animals?", + "gold_answer": "meadow", + "os_answer": "* Zoos\n* Aquariums\n* Farms\n* Petting zoos\n* Animal sanctuaries\n* Parks with animal exhibits\n* Homes of friends or family with pets\n* Animal shelters", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What kind of tale might feature a talking weasel?", + "gold_answer": "mulberry bush", + "os_answer": "A children's story", + "os_eval": "Incorrect", + "mcq_answer": "E. children's story", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What kind of status is the bald eagle given?", + "gold_answer": "protection", + "os_answer": "National bird of the United States", + "os_eval": "Incorrect", + "mcq_answer": "E. america", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Why do most people take a quick rest during the day?", + "gold_answer": "feel more energetic", + "os_answer": "To improve alertness and reduce fatigue", + "os_eval": "Correct", + "mcq_answer": "C. feel more energetic", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What could suddenly stop someone when he or she is running?", + "gold_answer": "falling down", + "os_answer": "* Obstacles like walls, fences, or objects in the path\n* Tripping over uneven surfaces or obstacles\n* Sudden pain or injury\n* Fatigue or exhaustion\n* Fear or shock\n* Physical exhaustion or lack of stamina\n* Slippery or unstable surfaces\n* A medical emergency, such as a heart attack or seizure", + "os_eval": "Incorrect", + "mcq_answer": "B. falling down", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find a monkey in the wild?", + "gold_answer": "zoo", + "os_answer": "Forest or jungle", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where could a sloth live?", + "gold_answer": "tropical jungle", + "os_answer": "In a rainforest", + "os_eval": "Correct", + "mcq_answer": "A. tropical jungle", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A gentleman is carrying equipment for golf, what is he likely to have?", + "gold_answer": "club", + "os_answer": "Golf clubs", + "os_eval": "Correct", + "mcq_answer": "A. club", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you take the risk buying a used car, you still hope it can what?", + "gold_answer": "go fast", + "os_answer": "Run well", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is the primary purpose of cars?", + "gold_answer": "move people", + "os_answer": "Transportation", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Alabama is full of different people, but they are all citizens of what?", + "gold_answer": "united states", + "os_answer": "United States of America", + "os_eval": "Correct", + "mcq_answer": "A. united states", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do airplanes do as they are arriving at the gate?", + "gold_answer": "slow down", + "os_answer": "Slow down and descend", + "os_eval": "Correct", + "mcq_answer": "A. slow down", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If a person with mental illness stops treatment what will likely happen?", + "gold_answer": "recur", + "os_answer": "The person's symptoms may return or worsen.", + "os_eval": "Correct", + "mcq_answer": "C. recur", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A loud machine is irritating, but many are expected where?", + "gold_answer": "museum", + "os_answer": "Construction site", + "os_eval": "Incorrect", + "mcq_answer": "E. industrial area", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If I have a modern light source in my living room, what is it likely to be?", + "gold_answer": "lamp", + "os_answer": "LED", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Who might wear dark glasses indoors?", + "gold_answer": "blind person", + "os_answer": "- Someone with a medical condition that makes their eyes sensitive to light\n- Someone who is trying to hide their identity\n- Someone who is trying to look cool or mysterious", + "os_eval": "Incorrect", + "mcq_answer": "D. ray charles", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What instrument can be played with an air of happiness?", + "gold_answer": "jump up and down", + "os_answer": "Wind instrument", + "os_eval": "Incorrect", + "mcq_answer": "E. fiddle", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What animal has quills all over it?", + "gold_answer": "feather", + "os_answer": "Porcupine", + "os_eval": "Incorrect", + "mcq_answer": "D. porcupine", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Why would you go to an office?", + "gold_answer": "work", + "os_answer": "* To work\n* To meet with colleagues\n* To attend meetings\n* To use office equipment\n* To access company resources\n* To collaborate on projects\n* To receive training\n* To socialize with coworkers\n* To network with other professionals\n* To build relationships with clients", + "os_eval": "Correct", + "mcq_answer": "A. work", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you spend all your time buying and not saving what is is likely to happen?", + "gold_answer": "using money", + "os_answer": "You will run out of money.", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What do they call the trash in Australia?", + "gold_answer": "dirt", + "os_answer": "Rubbish", + "os_eval": "Incorrect", + "mcq_answer": "E. dustbin", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Joan wants to cook a potato, where should she place it?", + "gold_answer": "boiling water", + "os_answer": "In a pot with water", + "os_eval": "Incorrect", + "mcq_answer": "A. boiling water", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A person with an allergy might be doing what if they awake suddenly?", + "gold_answer": "have fun", + "os_answer": "Sneezing", + "os_eval": "Incorrect", + "mcq_answer": "E. sneezing", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a ferret unlikely to be?", + "gold_answer": "classroom", + "os_answer": "Laboratory", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Immediately after peeing, a person's bladder is what?", + "gold_answer": "empty", + "os_answer": "Empty", + "os_eval": "Correct", + "mcq_answer": "A. collapsed", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "A car was hailed to chauffeur someone to the opera house, where was it heading?", + "gold_answer": "go downtown", + "os_answer": "The opera house", + "os_eval": "Incorrect", + "mcq_answer": "B. appear suddenly", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What do you go to see for live entertainment?", + "gold_answer": "show", + "os_answer": "* Concerts\n* Plays\n* Musicals\n* Stand-up comedy\n* Sporting events\n* Dance performances", + "os_eval": "Correct", + "mcq_answer": "E. theatre", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "A creek is a body of water found in what low land?", + "gold_answer": "valley", + "os_answer": "Valley", + "os_eval": "Correct", + "mcq_answer": "B. valley", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If I have a pet bird, what does it likely live in?", + "gold_answer": "forest", + "os_answer": "A cage", + "os_eval": "Incorrect", + "mcq_answer": "E. cage", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Joe and Mac were playing basketball. They did it every day in their back yard. Why were they playing basketball?", + "gold_answer": "have fun", + "os_answer": "Because they enjoyed it and it was a fun activity.", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What makes someone a nomad?", + "gold_answer": "have no home", + "os_answer": "A person who does not have a permanent home and moves from place to place", + "os_eval": "Correct", + "mcq_answer": "C. have no home", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a treat that you dog will enjoy?", + "gold_answer": "bone", + "os_answer": "A bone", + "os_eval": "Correct", + "mcq_answer": "D. bone", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Women used to be expected to wear a dress but it's now acceptable for them to wear what?", + "gold_answer": "pants", + "os_answer": "Pants", + "os_eval": "Correct", + "mcq_answer": "B. pants", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The fact that Joe was able to memorize the list in spite of his apparent state proved that part of his brain was what?", + "gold_answer": "awake", + "os_answer": "Functional", + "os_eval": "Incorrect", + "mcq_answer": "A. awake", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a wet person likely to do?", + "gold_answer": "catch cold", + "os_answer": "Dry off", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The painter started to edge the room with tape, he always took extra care to make the lines clean and crisp when working with an what?", + "gold_answer": "triangle", + "os_answer": "Expensive paint", + "os_eval": "Incorrect", + "mcq_answer": "C. corner", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "After high tide, where on the coast can you look to find a sea anemone?", + "gold_answer": "tide pool", + "os_answer": "In a tide pool", + "os_eval": "Correct", + "mcq_answer": "E. intertidal zone", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "People do many things to alleviate boredom. If you can't get out of the house you might decide to do what?", + "gold_answer": "listen to music", + "os_answer": "- Read a book\n- Watch a movie\n- Play a video game\n- Listen to music\n- Draw or paint\n- Write in a journal\n- Learn a new skill\n- Meditate\n- Do yoga\n- Play with a pet\n- Talk to a friend or family member\n- Take a nap", + "os_eval": "Correct", + "mcq_answer": "A. play cards", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "At a grocery store they sell individual potatoes, where does the grocery clerk likely put the potato?", + "gold_answer": "paper bag", + "os_answer": "Produce section", + "os_eval": "Incorrect", + "mcq_answer": "D. paper bag", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What room is a rubber bath mat usually kept?", + "gold_answer": "doorway", + "os_answer": "Bathroom", + "os_eval": "Incorrect", + "mcq_answer": "E. bathroom", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What would you put meat on top of to cook it?", + "gold_answer": "oil", + "os_answer": "Grill", + "os_eval": "Incorrect", + "mcq_answer": "E. frying pan", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Minerals can be obtained in what way for a person who avoids leafy greens?", + "gold_answer": "multivitamin", + "os_answer": "- Fortified foods (e.g., cereals, milk, orange juice)\n- Supplements\n- Foods high in minerals (e.g., beans, lentils, nuts, seeds, seafood)", + "os_eval": "Incorrect", + "mcq_answer": "A. multivitamin", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What might a couple have a lot of when they are deciding on stopping being married to each other?", + "gold_answer": "pleasure", + "os_answer": "Arguments", + "os_eval": "Incorrect", + "mcq_answer": "E. fights", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If a person is working a lot, what are they likely trying to earn?", + "gold_answer": "much money", + "os_answer": "Money", + "os_eval": "Correct", + "mcq_answer": "A. much money", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Billy hated using other people's toilets. He was only comfortable on his own. So whenever he needed to poop, he would go back to his what?", + "gold_answer": "house", + "os_answer": "Home", + "os_eval": "Correct", + "mcq_answer": "D. house", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "How can you let someone know about your anger without hurting him or her?", + "gold_answer": "write letter", + "os_answer": "* **Choose the right time and place.** Don't try to have this conversation when you're both tired, stressed, or in a public place. Find a private place where you can talk openly and honestly.\n* **Start by expressing your appreciation.** Let the person know that you value their relationship and that you're not trying to hurt them.\n* **Use \"I\" statements.** This will help you take ownership of your feelings and avoid blaming the other person. For example, instead of saying \"You always make me angry,\" you could say \"I feel angry when you...\"\n* **Be specific about what you're angry about.** Don't just say \"I'm angry.\" Instead, explain what the person did or said that made you angry.\n* **Avoid using generalizations.** Don't say things like \"You always...\" or \"You never...\" These kinds of statements will only make the other person defensive.\n* **Listen to the other person's perspective.** Once you've expressed your anger, give the other person a chance to share their perspective. Listen to what they have to say without interrupting.\n* **Try to find a solution together.** The goal of this conversation is not to blame the other person or to make them feel bad. It's to find a way to resolve the issue and move forward.\n* **Be willing to forgive.** If the other person apologizes and takes responsibility for their actions, be willing to forgive them. Holding on to anger will only hurt you in the long run.", + "os_eval": "Incorrect", + "mcq_answer": "D. write letter", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is one likely to find a brownstone?", + "gold_answer": "new york city", + "os_answer": "New York City", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What language type is someone from Iran likely to use?", + "gold_answer": "dard", + "os_answer": "Farsi", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The child wasn't allowed in the kitchen but still wanted to help, what could it do to help in the dining room?", + "gold_answer": "set table", + "os_answer": "Set the table, clear the table, wipe spills, hand out napkins, help carry light items to the table, or entertain younger siblings to keep them out of the kitchen.", + "os_eval": "Correct", + "mcq_answer": "A. set table", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "He was having a hard time expressing himself in a healthy way, the psychologist said he was mentally what?", + "gold_answer": "suffering", + "os_answer": "Blocked", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "How would you express information to a deaf person?", + "gold_answer": "write down", + "os_answer": "- Sign language\n- Lip reading\n- Written communication\n- Gestures\n- Visual aids (e.g., pictures, diagrams)\n- Technology (e.g., video relay services, text-to-speech apps)", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Printing on a printer can get expensive because it does what?", + "gold_answer": "use paper", + "os_answer": "Uses ink", + "os_eval": "Incorrect", + "mcq_answer": "B. use paper", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "One of the potential hazards of attending school is what?", + "gold_answer": "colds and flu", + "os_answer": "Bullying", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What could bring a container from one place to another?", + "gold_answer": "cargo ship", + "os_answer": "- A person\n- A vehicle\n- A conveyor belt\n- A crane\n- A boat\n- A plane", + "os_eval": "Incorrect", + "mcq_answer": "C. cargo ship", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is it called when you are talking to someone?", + "gold_answer": "communication", + "os_answer": "Conversation", + "os_eval": "Correct", + "mcq_answer": "A. communication", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The family finished dinner, the child's chore was to load the dirty dishes where?", + "gold_answer": "dishwasher", + "os_answer": "Dishwasher", + "os_eval": "Correct", + "mcq_answer": "B. dishwasher", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where could you find a bureau as well as many politicians?", + "gold_answer": "each city", + "os_answer": "Washington, DC", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "For some reason she was devoid of regular emotions, buying products was the only way she could feel what?", + "gold_answer": "pleasure", + "os_answer": "Joy", + "os_eval": "Correct", + "mcq_answer": "A. pleasure", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where are horses judged on appearance?", + "gold_answer": "fair", + "os_answer": "Cannot be answered due to inappropriate content", + "os_eval": "Incorrect", + "mcq_answer": "B. fair", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why do people read non fiction?", + "gold_answer": "learn new things", + "os_answer": "* To gain knowledge and expand understanding\n* To learn new skills or information\n* To satisfy curiosity\n* To stay informed about current events\n* To improve critical thinking and analytical abilities\n* To explore different perspectives and broaden horizons\n* To understand the world around them better\n* For entertainment or relaxation\n* To gain insights into human nature and society\n* To connect with others who share similar interests", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where are you likely to set papers while working on them?", + "gold_answer": "table", + "os_answer": "On a desk or table", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "John had a massive debt to 50 million dollars. Compared to that, Leo's 2000 dollar debt seemed what?", + "gold_answer": "insubstantial", + "os_answer": "Cannot be answered due to inappropriate content", + "os_eval": "Incorrect", + "mcq_answer": "B. inconsequential", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The man flew his airplane over the city and saw pollution visibly in the sky, what was polluted?", + "gold_answer": "air", + "os_answer": "The air", + "os_eval": "Correct", + "mcq_answer": "C. air", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a very unlikely side effect of becoming inebriated?", + "gold_answer": "fights", + "os_answer": "Gaining the ability to speak a foreign language", + "os_eval": "Incorrect", + "mcq_answer": "E. paralysis", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If not in a stream but in a market where will you find fish?", + "gold_answer": "refrigerator", + "os_answer": "Fish market", + "os_eval": "Incorrect", + "mcq_answer": "E. market", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What are people likely to want to do with their friends?", + "gold_answer": "own land", + "os_answer": "* Socialize\n* Spend quality time\n* Have fun\n* Engage in shared activities\n* Talk and share experiences\n* Support each other\n* Relax and de-stress\n* Explore new places or activities\n* Create memories\n* Bond and strengthen their friendship", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "During a shark filled tornado where should you not be?", + "gold_answer": "marine museum", + "os_answer": "In the water", + "os_eval": "Incorrect", + "mcq_answer": "E. outside", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is the likely result of buying products in excess?", + "gold_answer": "running out of money", + "os_answer": "* Financial strain\n* Clutter and disorganization\n* Waste and environmental impact\n* Reduced satisfaction and well-being\n* Increased stress and anxiety", + "os_eval": "Incorrect", + "mcq_answer": "E. overstocking", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a person trying to accomplish when taking analgesics?", + "gold_answer": "avoid pain", + "os_answer": "Reduce pain", + "os_eval": "Correct", + "mcq_answer": "B. avoid pain", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you put a glass after drinking from it?", + "gold_answer": "dishwasher", + "os_answer": "Cannot be answered due to inappropriate content", + "os_eval": "Incorrect", + "mcq_answer": "D. dishwasher", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you buy food?", + "gold_answer": "store", + "os_answer": "Cannot be answered due to inappropriate content", + "os_eval": "Incorrect", + "mcq_answer": "B. store", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When a person admits his mistakes, what are they doing?", + "gold_answer": "accident", + "os_answer": "Taking responsibility", + "os_eval": "Incorrect", + "mcq_answer": "D. feel relieved", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Donald is a prominent figure for the federal government, so in what city does he likely spend a lot of time?", + "gold_answer": "everything", + "os_answer": "Washington, D.C.", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Of all the sports, Billy enjoys football, but what does his concerned mother think of the sport?", + "gold_answer": "very entertaining", + "os_answer": "She thinks it's too dangerous.", + "os_eval": "Incorrect", + "mcq_answer": "E. violent", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What city will likely have many parking structures?", + "gold_answer": "chicago", + "os_answer": "A big city", + "os_eval": "Correct", + "mcq_answer": "A. chicago", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is the habitat of the fox?", + "gold_answer": "hen house", + "os_answer": "Forest, grasslands, woodlands", + "os_eval": "Incorrect", + "mcq_answer": "B. burrow", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "They children loved having a back yard, and the parents loved that it was a safe what?", + "gold_answer": "neighborhood", + "os_answer": "space", + "os_eval": "Incorrect", + "mcq_answer": "B. neighborhood", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "While people just throw coins down them now, what originally had a pail to be lowered for it's intended use?", + "gold_answer": "wishing well", + "os_answer": "Wishing well", + "os_eval": "Correct", + "mcq_answer": "D. wishing well", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When a human is earning money, where are they often found?", + "gold_answer": "place of work", + "os_answer": "Workplace", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why do people play chess on the weekends?", + "gold_answer": "have fun", + "os_answer": "* To engage in a challenging mental activity\n* To socialize and connect with others\n* To escape from daily routines and relax\n* To improve cognitive skills and strategic thinking\n* For the thrill of competition and the satisfaction of winning", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do you need energy to do in gym class?", + "gold_answer": "play sports", + "os_answer": "Exercise", + "os_eval": "Correct", + "mcq_answer": "A. work", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If a person were going to bed, what would be their goal?", + "gold_answer": "falling asleep", + "os_answer": "To fall asleep", + "os_eval": "Correct", + "mcq_answer": "C. rest", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What are candles good for eliminating?", + "gold_answer": "shelf", + "os_answer": "Odors", + "os_eval": "Incorrect", + "mcq_answer": "E. dark", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What room would you find many bookcases and is used for contemplation?", + "gold_answer": "study", + "os_answer": "Library", + "os_eval": "Incorrect", + "mcq_answer": "A. study", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do you head to travel to a star?", + "gold_answer": "outer space", + "os_answer": "A star is an astronomical object and cannot be reached through physical travel.", + "os_eval": "Incorrect", + "mcq_answer": "C. outer space", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The player lifted his cornet and walked in rhythm, what was the player a member of?", + "gold_answer": "marching band", + "os_answer": "A marching band", + "os_eval": "Correct", + "mcq_answer": "C. marching band", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When someone is talking and you missed something, what can you do to get them to repeat it?", + "gold_answer": "ask question", + "os_answer": "* Say \"Excuse me\" or \"Pardon me\" to politely interrupt.\n* Ask, \"Could you please repeat that?\" or \"I didn't catch that, can you say it again?\"\n* Rephrase your question to include the part you missed, such as \"I heard you say [what you remember], but what did you say after that?\"\n* Ask for clarification, such as \"I'm not sure I understand, could you explain it differently?\"\n* If the person is speaking in a group setting, you can raise your hand or wait for an opportunity to ask your question privately.", + "os_eval": "Correct", + "mcq_answer": "B. ask question", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where does one store fabric in their own home?", + "gold_answer": "sewing room", + "os_answer": "Linen closet", + "os_eval": "Incorrect", + "mcq_answer": "A. sewing room", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do most companies not want to have relative to demand?", + "gold_answer": "oversupply", + "os_answer": "Excess supply", + "os_eval": "Correct", + "mcq_answer": "A. oversupply", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The cancer patient was expecting to die, so he made out his what?", + "gold_answer": "write will", + "os_answer": "Will", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you partied all night you could find yourself already what, even when just beginning work?", + "gold_answer": "getting tired", + "os_answer": "Tired", + "os_eval": "Correct", + "mcq_answer": "A. getting tired", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The cat carefully navigated the area, they do everything they can to avoid what?", + "gold_answer": "get wet", + "os_answer": "Water", + "os_eval": "Correct", + "mcq_answer": "C. falling", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is someone usually doing if someone else is talking to him or her?", + "gold_answer": "listening", + "os_answer": "Listening", + "os_eval": "Correct", + "mcq_answer": "A. listening", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does the sky do before a rain?", + "gold_answer": "appear beautiful", + "os_answer": "Clouds", + "os_eval": "Incorrect", + "mcq_answer": "E. cloud over", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Pens, computers, text books and paper clips can all be found where?", + "gold_answer": "university", + "os_answer": "Office supply store", + "os_eval": "Incorrect", + "mcq_answer": "B. university", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What geographic area is a lizard likely to be?", + "gold_answer": "west texas", + "os_answer": "Warm and dry climates", + "os_eval": "Incorrect", + "mcq_answer": "C. arid regions", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "As a result of dying, what happens to organic material?", + "gold_answer": "death and decay", + "os_answer": "Decomposes", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you buy a clock, clothing and wrenches?", + "gold_answer": "counter", + "os_answer": "Hardware store", + "os_eval": "Incorrect", + "mcq_answer": "E. department store", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What do you do when you're in a new place and want to see new things?", + "gold_answer": "look around", + "os_answer": "* Explore the area on foot or by bike.\n* Visit local tourist attractions.\n* Ask locals for recommendations.\n* Check out online resources for things to do.\n* Take a guided tour.\n* Attend local events.\n* Visit museums and historical sites.\n* Try local cuisine.\n* Shop for souvenirs.\n* Take a scenic drive.", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What happens when to ice when it is in the sun?", + "gold_answer": "melted", + "os_answer": "It melts.", + "os_eval": "Correct", + "mcq_answer": "B. melted", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you store your dishes in your dwelling?", + "gold_answer": "shelf", + "os_answer": "Kitchen cabinets\nPantry\nShelves\nCupboards", + "os_eval": "Correct", + "mcq_answer": "E. cabinet", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The man laid on the soft moss and looked up at the trees, where was the man?", + "gold_answer": "forest", + "os_answer": "In a forest", + "os_eval": "Correct", + "mcq_answer": "B. forest", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is someone doing if he or she is sitting quietly and his or her eyes are moving?", + "gold_answer": "reading", + "os_answer": "Reading", + "os_eval": "Correct", + "mcq_answer": "E. think", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "A man takes a seat at a museum outside of Barcelona, where is he likely?", + "gold_answer": "martorell", + "os_answer": "Spain", + "os_eval": "Correct", + "mcq_answer": "B. martorell", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find a toy soldier that is being played with?", + "gold_answer": "child's hand", + "os_answer": "In a child's playroom", + "os_eval": "Incorrect", + "mcq_answer": "C. child's hand", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where are you when you're about to use your plane ticket?", + "gold_answer": "airport", + "os_answer": "At the airport", + "os_eval": "Correct", + "mcq_answer": "C. airport", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Flowers make a good center focal point, just one of many arrangements that look good on a what?", + "gold_answer": "table", + "os_answer": "Table", + "os_eval": "Correct", + "mcq_answer": "E. vase", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "How can a human cross a river and not mess up their hair?", + "gold_answer": "bridge", + "os_answer": "Swim across.", + "os_eval": "Incorrect", + "mcq_answer": "D. bridge", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "You can find a monkey in what West African region on the Gulf of Guinea", + "gold_answer": "south american country", + "os_answer": "Ivory Coast", + "os_eval": "Incorrect", + "mcq_answer": "E. nigeria", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Surprising an angry person could lead to what?", + "gold_answer": "fight", + "os_answer": "A violent reaction", + "os_eval": "Correct", + "mcq_answer": "B. fight", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you get a lizard to keep in your home?", + "gold_answer": "pet shop", + "os_answer": "Pet store", + "os_eval": "Correct", + "mcq_answer": "C. pet shop", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If a reception is held with hotel guests walking by, what is the likely venue?", + "gold_answer": "lobby", + "os_answer": "Hotel lobby", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a place that is far away from your house and where you could consume beer?", + "gold_answer": "friend's house", + "os_answer": "Bar", + "os_eval": "Incorrect", + "mcq_answer": "B. friend's house", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If a court case is dismissed after hearing testimony, what would be a likely cause?", + "gold_answer": "change of heart", + "os_answer": "Lack of evidence, lack of jurisdiction, procedural errors, or settlement between parties", + "os_eval": "Incorrect", + "mcq_answer": "D. boredom", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Sitting down quickly after eating beans could lead to what?", + "gold_answer": "flatulence", + "os_answer": "Gas and bloating", + "os_eval": "Correct", + "mcq_answer": "A. flatulence", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The car's steering seem quite loose, but he still considered purchasing it because he needed something small and what?", + "gold_answer": "compact", + "os_answer": "Affordable", + "os_eval": "Incorrect", + "mcq_answer": "D. compact", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "His phone was dead and they couldn't find the expressway, he opened up the glove compartment and handed his passenger the what to navigate?", + "gold_answer": "map", + "os_answer": "Map", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What would someone use a personal key for?", + "gold_answer": "own home", + "os_answer": "To unlock a door or lock", + "os_eval": "Incorrect", + "mcq_answer": "C. own home", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Her voice lent her to the alto section, what group did she join?", + "gold_answer": "choir", + "os_answer": "Choir", + "os_eval": "Correct", + "mcq_answer": "C. choir", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where are you likely to find a Japanese restaurant not run by people from Japan?", + "gold_answer": "california", + "os_answer": "Anywhere outside of Japan", + "os_eval": "Correct", + "mcq_answer": "A. california", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Animals who have hair and don't lay eggs are what?", + "gold_answer": "mammals", + "os_answer": "Mammals", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "John was an aristocratic fox hunter. Where might he live?", + "gold_answer": "new hampshire", + "os_answer": "In an English countryside estate", + "os_eval": "Incorrect", + "mcq_answer": "A. england", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a grape likely to be being fed to someone else?", + "gold_answer": "field", + "os_answer": "During a romantic or intimate moment", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Some food can be stored at room temperature until you open it, then you should keep it in what?", + "gold_answer": "refrigerators", + "os_answer": "Refrigerator", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you're going to a party in a new town what are you hoping to make?", + "gold_answer": "making new friends", + "os_answer": "New connections", + "os_eval": "Correct", + "mcq_answer": "B. making new friends", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where does one usually keep literature?", + "gold_answer": "shelf", + "os_answer": "Bookshelf", + "os_eval": "Correct", + "mcq_answer": "D. shelf", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "WHat type of keyboard is made up of one or more pipe divisions?", + "gold_answer": "killing", + "os_answer": "Organ", + "os_eval": "Incorrect", + "mcq_answer": "E. organ", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The bell rang, and the congregation began to what in to the church?", + "gold_answer": "funnel", + "os_answer": "File", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "James needed smooth sandpaper, but instead he got what type?", + "gold_answer": "rough", + "os_answer": "Rough sandpaper", + "os_eval": "Correct", + "mcq_answer": "A. rough", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you borrow furniture if you do not have any?", + "gold_answer": "neighbor's house", + "os_answer": "- Furniture rental stores\n- Friends or family members\n- Community centers or churches\n- College or university housing offices\n- Local businesses or organizations", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "I want my wine stored in darkness, where should it go?", + "gold_answer": "movies", + "os_answer": "Wine cellar", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What would you do if your date does not show up?", + "gold_answer": "wait for", + "os_answer": "* Politely ask the restaurant or venue to confirm the reservation.\n* Try contacting your date through phone, text, or social media to inquire about their whereabouts.\n* After waiting a reasonable amount of time (e.g., 30-60 minutes), leave a message expressing your disappointment and asking them to contact you.\n* If possible, try to enjoy the evening by ordering food or drinks and reading a book or using your phone.\n* If you feel uncomfortable or unsafe, leave the venue and contact a friend or family member.\n* Consider the possibility that your date had an emergency or unexpected event and give them the benefit of the doubt.\n* Learn from the experience and set clearer expectations for future dates.", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "John farms anemone in what type of facility?", + "gold_answer": "nursery", + "os_answer": "Greenhouse", + "os_eval": "Incorrect", + "mcq_answer": "D. nursery", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Brawn opened the curtains so that the sun could do what?", + "gold_answer": "warm room", + "os_answer": "Brighten the room", + "os_eval": "Incorrect", + "mcq_answer": "A. dry clothes", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "How might releasing energy that has built up feel?", + "gold_answer": "wonderful", + "os_answer": "Cathartic, liberating, satisfying, relaxing, calming", + "os_eval": "Correct", + "mcq_answer": "D. orgasm", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where might it be hard to get furniture to?", + "gold_answer": "loft", + "os_answer": "- Narrow hallways\n- Upstairs apartments\n- Through small doors\n- Into a crowded room\n- Over stairs", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you get jeans and other wearable items to take home with you?", + "gold_answer": "clothing store", + "os_answer": "Clothing store", + "os_eval": "Correct", + "mcq_answer": "D. clothing store", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "In what substance do clouds float?", + "gold_answer": "air", + "os_answer": "Air", + "os_eval": "Correct", + "mcq_answer": "C. air", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do most people make coffee?", + "gold_answer": "coffee shop", + "os_answer": "Kitchen", + "os_eval": "Incorrect", + "mcq_answer": "E. kitchen", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can someone get a new saw?", + "gold_answer": "hardware store", + "os_answer": "Hardware store", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What would you do to a crime scene before asking a question?", + "gold_answer": "express information", + "os_answer": "1. **Secure the scene.** This means keeping people out of the area where the crime occurred, as well as protecting any evidence that may be present.\n2. **Document the scene.** Take photographs or videos of the scene, and make notes of any observations you make.\n3. **Identify and interview witnesses.** If there are any witnesses to the crime, interview them as soon as possible.\n4. **Collect evidence.** Collect any evidence that may be present at the scene, such as fingerprints, DNA, or weapons.\n5. **Ask your question.** Once you have secured the scene, documented it, identified and interviewed witnesses, and collected evidence, you can then ask your question.", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you go if you want to buy some clothes?", + "gold_answer": "mall", + "os_answer": "Clothing store", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is food likely to stay dry?", + "gold_answer": "cupboard", + "os_answer": "In an airtight container", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is it called when a person with mental illness is able to lead a relatively normal life?", + "gold_answer": "managed", + "os_answer": "Recovery", + "os_eval": "Incorrect", + "mcq_answer": "A. managed", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do you keep musical instrument so it doesn't get scratched?", + "gold_answer": "case", + "os_answer": "In a case", + "os_eval": "Correct", + "mcq_answer": "C. case", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "While John Candy and Dan Aykroyd didn't run into a gazelle, you'd have to go where to see one?", + "gold_answer": "eastern hemisphere", + "os_answer": "Africa", + "os_eval": "Correct", + "mcq_answer": "C. open plain", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "When we are running what are we doing?", + "gold_answer": "go quickly", + "os_answer": "Exerting energy to move forward at a speed faster than walking", + "os_eval": "Correct", + "mcq_answer": "D. go quickly", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "It's dangerous to let pet birds free so it's better to keep them what?", + "gold_answer": "caged in", + "os_answer": "Caged", + "os_eval": "Correct", + "mcq_answer": "C. caged in", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A beaver is know for building prowess, their supplies come from where?", + "gold_answer": "wooded area", + "os_answer": "Trees", + "os_eval": "Correct", + "mcq_answer": "B. body of water", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Going public about a common problem can gain what for a celebrity?", + "gold_answer": "wide acceptance", + "os_answer": "Sympathy", + "os_eval": "Incorrect", + "mcq_answer": "E. press coverage", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If it is Chrismas time what came most recently before?", + "gold_answer": "halloween", + "os_answer": "December", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If someone found out their brother was having a daughter, they would have to add a niece limb to the what?", + "gold_answer": "family tree", + "os_answer": "Family tree", + "os_eval": "Correct", + "mcq_answer": "D. family tree", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The criminal insisted he must do the crime to the bank teller, but she tried to convince him there were other ways in life and this was what?", + "gold_answer": "willing", + "os_answer": "Wrong", + "os_eval": "Incorrect", + "mcq_answer": "D. have to", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "what do you fill with ink to write?", + "gold_answer": "fountain pen", + "os_answer": "Pen", + "os_eval": "Correct", + "mcq_answer": "B. fountain pen", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you were lost you might need a map, the best place to find one on the road is at any what?", + "gold_answer": "truck stop", + "os_answer": "Gas station", + "os_eval": "Incorrect", + "mcq_answer": "E. gas station", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would a cat snuggle up with their human?", + "gold_answer": "comfortable chair", + "os_answer": "On the lap, in bed, on the couch, under the covers, at the feet", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a place that has large cable hanging overhead?", + "gold_answer": "substation", + "os_answer": "Bridge", + "os_eval": "Incorrect", + "mcq_answer": "D. substation", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do cars usually travel at very high speeds?", + "gold_answer": "race track", + "os_answer": "Freeways or highways", + "os_eval": "Incorrect", + "mcq_answer": "C. race track", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What might a person be watching if they see a man with a suitcase full of money?", + "gold_answer": "movie", + "os_answer": "A crime drama or action movie", + "os_eval": "Correct", + "mcq_answer": "D. airplane", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If I put in my key and open a hinged door, where am I likely entering?", + "gold_answer": "own house", + "os_answer": "A room or building", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If somebody is working at a reception desk, they are located at the front entrance of the what?", + "gold_answer": "building", + "os_answer": "Building", + "os_eval": "Correct", + "mcq_answer": "C. building", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is it called when a person tends to leave things to the last minute?", + "gold_answer": "procrastinate", + "os_answer": "Procrastination", + "os_eval": "Correct", + "mcq_answer": "A. procrastinate", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What will you do if you do not want to settle in one place?", + "gold_answer": "wander", + "os_answer": "* Travel frequently\n* Live in a van or RV\n* Rent out different apartments or houses short-term\n* Take on jobs that require travel\n* Become a digital nomad and work remotely from different locations", + "os_eval": "Correct", + "mcq_answer": "C. wander", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Jane works for the government as a senator, where does she spend a lot of time?", + "gold_answer": "capitol building", + "os_answer": "The Capitol Building", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is it called when two people in love have children?", + "gold_answer": "procreate", + "os_answer": "Family", + "os_eval": "Incorrect", + "mcq_answer": "B. procreate", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "It takes ambition to complete a job, but the first step is to what?", + "gold_answer": "begin work", + "os_answer": "Start", + "os_eval": "Correct", + "mcq_answer": "B. begin work", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you find a restaurant's phone number?", + "gold_answer": "yellow pages", + "os_answer": "On the restaurant's website, menu, or receipt", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What would you put coins into to make it work?", + "gold_answer": "water fountain", + "os_answer": "A vending machine", + "os_eval": "Incorrect", + "mcq_answer": "E. jar", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "A patriotic guy with a camera is looking for a bald eagle, what is he likely to do with the eagle if he finds one?", + "gold_answer": "city", + "os_answer": "Take a picture of it.", + "os_eval": "Incorrect", + "mcq_answer": "E. photograph", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you go to use a piano in your neighborhood if you don't have one?", + "gold_answer": "neighbor's house", + "os_answer": "- A local music school\n- A community center\n- A church\n- A library\n- A public park with a piano", + "os_eval": "Incorrect", + "mcq_answer": "A. music school", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you get a shower curtain if you do not have one?", + "gold_answer": "department store", + "os_answer": "A home goods store, department store, hardware store, or online retailers.", + "os_eval": "Correct", + "mcq_answer": "A. department store", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Kissing is normally an activity reserved for your romantic what?", + "gold_answer": "partner", + "os_answer": "Partner", + "os_eval": "Correct", + "mcq_answer": "B. partner", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does a child learn to do before school?", + "gold_answer": "dress herself", + "os_answer": "* Share toys and take turns\n* Follow simple instructions\n* Recognize and name colors, shapes, and numbers\n* Hold a pencil or crayon correctly\n* Use scissors\n* Dress themselves\n* Wash their hands\n* Brush their teeth\n* Tie their shoes\n* Play cooperatively with others\n* Use the toilet independently\n* Recognize and name their own emotions\n* Express their needs and wants\n* Solve simple problems\n* Make friends", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "According to what book did an apple tree lead to the downfall of man?", + "gold_answer": "bible", + "os_answer": "The Bible", + "os_eval": "Correct", + "mcq_answer": "A. bible", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What might a kind person do?", + "gold_answer": "open doors", + "os_answer": "* Offer help to someone in need\n* Donate to a charity\n* Compliment a stranger\n* Hold the door open for someone\n* Let someone go ahead of them in line\n* Give up their seat on the bus or train\n* Help a lost child find their parents\n* Volunteer their time to a good cause\n* Be a good listener\n* Be patient and understanding with others", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Name a location where you would not want to find mice.", + "gold_answer": "attic", + "os_answer": "Kitchen", + "os_eval": "Correct", + "mcq_answer": "E. laboratory", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do most people turn to get information on their phones?", + "gold_answer": "google", + "os_answer": "Google", + "os_eval": "Correct", + "mcq_answer": "A. internet", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What happens to a body after death?", + "gold_answer": "decomposition", + "os_answer": "After death, the body undergoes a series of changes, including:\n\n* **Pallor:** The skin becomes pale due to the loss of blood circulation.\n* **Algor mortis:** The body temperature decreases as it releases heat into the environment.\n* **Rigor mortis:** The muscles become stiff and rigid as ATP levels deplete.\n* **Livor mortis:** Blood settles in the lowest parts of the body, causing discoloration.\n* **Decomposition:** Bacteria and enzymes break down the body's tissues, leading to foul odors and the eventual skeletonization of the body.", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Though she had a disability, what did her encouraging and positive coach see in her?", + "gold_answer": "qualification", + "os_answer": "Her potential", + "os_eval": "Incorrect", + "mcq_answer": "E. potential", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "When you see something rise, you are where in relation to it?", + "gold_answer": "below", + "os_answer": "Below it", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you keep a rug near your front door?", + "gold_answer": "living room", + "os_answer": "Inside the front door, on the floor", + "os_eval": "Incorrect", + "mcq_answer": "E. hall", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What do you do when you need to get food?", + "gold_answer": "table", + "os_answer": "Go to a grocery store, order online, or go to a restaurant.", + "os_eval": "Incorrect", + "mcq_answer": "E. shop", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Brad tried to arise from bed but he could not. Instead, he just continued to do what?", + "gold_answer": "lie down", + "os_answer": "Lie down", + "os_eval": "Correct", + "mcq_answer": "C. lie down", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If a heifer is really high quality, you might take her where?", + "gold_answer": "cattle show", + "os_answer": "To a show or sale", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do people want to acquire from opening business?", + "gold_answer": "wealth", + "os_answer": "* **Financial gain**\n* **Independence**\n* **Flexibility**\n* **Control over their work environment**\n* **To make a difference in the world**\n* **To pursue their passions**\n* **To create something new**\n* **To leave a legacy**", + "os_eval": "Correct", + "mcq_answer": "B. wealth", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What has someone who had finished their undergraduate done?", + "gold_answer": "graduated", + "os_answer": "Earned a bachelor's degree", + "os_eval": "Correct", + "mcq_answer": "A. graduated", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "By learning about the world, many poor college students gain what?", + "gold_answer": "desire to travel", + "os_answer": "Perspective", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "where is seaweed from?", + "gold_answer": "ocean", + "os_answer": "The ocean", + "os_eval": "Correct", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "how can i store cooked steak?", + "gold_answer": "freezer", + "os_answer": "* **Refrigerator:** Store in an airtight container or wrap tightly in plastic wrap or aluminum foil. Consume within 3-4 days.\n* **Freezer:** Wrap tightly in plastic wrap or aluminum foil and place in a freezer-safe bag. Consume within 2-3 months.\n* **Vacuum sealing:** Vacuum seal the steak and store in the refrigerator for up to 2 weeks or in the freezer for up to 6 months.", + "os_eval": "Incorrect", + "mcq_answer": "D. tupperware", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The audience cheered when a goal was scored, what were they spectating?", + "gold_answer": "sporting event", + "os_answer": "A sports game", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What western state has thousands of miles of shore?", + "gold_answer": "california", + "os_answer": "Alaska", + "os_eval": "Incorrect", + "mcq_answer": "D. california", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Everybody seemed to be crying at the holy site, the tour guide explained that this was what?", + "gold_answer": "common", + "os_answer": "A cathartic experience", + "os_eval": "Incorrect", + "mcq_answer": "D. common", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a public monument likely to be erected by a city?", + "gold_answer": "municipal park", + "os_answer": "In a prominent location that is easily accessible to the public, such as a park, square, or government building.", + "os_eval": "Correct", + "mcq_answer": "A. municipal park", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would a person live if they wanted no neighbors?", + "gold_answer": "woods", + "os_answer": "In a remote area, such as a rural farm or an isolated island.", + "os_eval": "Incorrect", + "mcq_answer": "D. woods", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is the control room that controls a PWR located?", + "gold_answer": "building", + "os_answer": "Adjacent to the containment structure", + "os_eval": "Correct", + "mcq_answer": "E. nuclear power plant", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you're attending school and are falling asleep you're likely experiencing what?", + "gold_answer": "boredom", + "os_answer": "Sleep deprivation", + "os_eval": "Incorrect", + "mcq_answer": "A. boredom", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "I want to buy a gong, where should I look for one?", + "gold_answer": "orchestra", + "os_answer": "* Music stores\n* Online retailers\n* Specialty instrument shops\n* Flea markets\n* Pawn shops", + "os_eval": "Incorrect", + "mcq_answer": "E. music store", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What would friends do if they need each others' help?", + "gold_answer": "group together", + "os_answer": "* Communicate their need for help to each other.\n* Offer their help to each other without being asked.\n* Provide emotional support and encouragement.\n* Assist with tasks or activities that the other person is struggling with.\n* Be there for each other through good times and bad.", + "os_eval": "Correct", + "mcq_answer": "A. call each other", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "When people are playing a game, what is their motivation to play?", + "gold_answer": "desire to win", + "os_answer": "* Enjoyment and fun\n* Competition and challenge\n* Social interaction\n* Relaxation and stress relief\n* Learning and skill development\n* Reward and recognition", + "os_eval": "Incorrect", + "mcq_answer": "C. desire to win", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where could there be a battle that involves words?", + "gold_answer": "court room", + "os_answer": "In a debate or argument", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "John didn't mind getting in line. It was what game after that he hated. The time, the sore feet. He did not like doing what?", + "gold_answer": "standing in line", + "os_answer": "Waiting", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The old man needed to have rest multiple times a day, he would do what on the couch and catnap?", + "gold_answer": "lay in bed", + "os_answer": "Lie down", + "os_eval": "Incorrect", + "mcq_answer": "E. lie down", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The end of the barrel of what primitive firearm is bell shaped?", + "gold_answer": "blunderbuss", + "os_answer": "Blunderbuss", + "os_eval": "Correct", + "mcq_answer": "C. blunderbuss", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a good place to store pamphlets in your home or office?", + "gold_answer": "drawer", + "os_answer": "* In a pamphlet holder on your desk or bookshelf\n* In a file cabinet\n* In a drawer\n* In a magazine rack\n* In a box or container", + "os_eval": "Correct", + "mcq_answer": "D. drawer", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a good place to put a hamburger?", + "gold_answer": "mouth", + "os_answer": "On a plate or in a bun", + "os_eval": "Incorrect", + "mcq_answer": "C. mouth", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A story about World War II would be set when?", + "gold_answer": "past", + "os_answer": "1939-1945", + "os_eval": "Correct", + "mcq_answer": "D. past", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What type of geographic area will you find a marmot?", + "gold_answer": "mountainous area", + "os_answer": "Alpine or mountainous", + "os_eval": "Correct", + "mcq_answer": "A. mountainous area", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Most people make stupid assumptions that are based on their prejudices. What might they do instead to achieve better outcomes?", + "gold_answer": "think", + "os_answer": "Instead of making stupid assumptions based on their prejudices, people can improve their decision-making by:\n- **Questioning their assumptions:** Critically examining the beliefs and biases that influence their thinking.\n- **Seeking diverse perspectives:** Consulting with others who have different backgrounds, experiences, and viewpoints.\n- **Gathering objective data:** Collecting information and evidence to support or refute their assumptions.\n- **Considering alternative explanations:** Exploring multiple interpretations and possibilities before jumping to conclusions.\n- **Being open-minded:** Willing to consider new information and ideas that challenge their existing beliefs.\n- **Learning from mistakes:** Reflecting on past experiences and identifying biases that may have led to inaccurate assumptions.\n- **Practicing empathy:** Trying to understand the perspectives and motivations of others, even if they differ from their own.", + "os_eval": "Incorrect", + "mcq_answer": "B. think", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is something children can do while traveling in a car?", + "gold_answer": "listen to music", + "os_answer": "* Play games\n* Read books\n* Listen to music\n* Draw or color\n* Play with toys\n* Talk to their parents or siblings\n* Sleep", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you hear a trumpet along with other instruments made from the same material?", + "gold_answer": "brass band", + "os_answer": "Brass band", + "os_eval": "Correct", + "mcq_answer": "C. brass band", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Stabbing to death of a person is what sort of way to die?", + "gold_answer": "gruesome", + "os_answer": "Violent and tragic", + "os_eval": "Incorrect", + "mcq_answer": "B. gruesome", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a great place to buy fresh fruit?", + "gold_answer": "san francisco", + "os_answer": "Farmers' market", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The church was giving assistance, what were they hoping to accomplish?", + "gold_answer": "helping others", + "os_answer": "Reduce suffering and provide support to those in need.", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a shelf likely to be hidden behind a door?", + "gold_answer": "cupboard", + "os_answer": "In a closet", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The man got a pail to catch the draining motor oil, where was he likely doing this at home?", + "gold_answer": "garage", + "os_answer": "Garage", + "os_eval": "Correct", + "mcq_answer": "A. garage", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What kind of cold storage could you find in your house?", + "gold_answer": "ice pack", + "os_answer": "Refrigerator or freezer", + "os_eval": "Incorrect", + "mcq_answer": "E. refrigerator", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The pitcher stepped on the mound ready to throw, where was he located specifically?", + "gold_answer": "hell", + "os_answer": "Rubber", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If it's not used for hair a round brush is an example of what?", + "gold_answer": "art supplies", + "os_answer": "Cleaning", + "os_eval": "Incorrect", + "mcq_answer": "C. art supplies", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "His parents thought he was suffering from boredom, but the teen loved to lay in bed and just do what?", + "gold_answer": "listen to music", + "os_answer": "Think", + "os_eval": "Incorrect", + "mcq_answer": "C. listen to music", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The electrode wouldn't spark, it turned out that the what hadn't been connected?", + "gold_answer": "battery", + "os_answer": "Battery", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Riding a bike for a long time can cause what?", + "gold_answer": "fatigue", + "os_answer": "Saddle sores", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What could happen to a cat other than wanting food?", + "gold_answer": "thirsty", + "os_answer": "* Seeking attention or affection\n* Being in pain or discomfort\n* Feeling anxious or stressed\n* Wanting to play or interact\n* Needing to use the litter box\n* Being curious or exploring\n* Feeling lonely or bored\n* Being protective of its territory\n* Having a medical condition", + "os_eval": "Incorrect", + "mcq_answer": "B. thirsty", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you turn off the music in a room with no other noise that room would be what?", + "gold_answer": "silent", + "os_answer": "Silent", + "os_eval": "Correct", + "mcq_answer": "A. silent", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "In what country are the most fast food restaurants?", + "gold_answer": "america", + "os_answer": "United States", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would walk through a central passage to catch an elevator?", + "gold_answer": "public building", + "os_answer": "A hotel", + "os_eval": "Incorrect", + "mcq_answer": "D. public building", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do people do when networking?", + "gold_answer": "build trust", + "os_answer": "- Exchange contact information\n- Build relationships\n- Learn about new opportunities\n- Share knowledge and ideas\n- Seek support and advice", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you store you spare linens near your socks?", + "gold_answer": "dresser drawers", + "os_answer": "In a dresser drawer", + "os_eval": "Correct", + "mcq_answer": "D. dresser drawers", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What might someone do after they finish creating art?", + "gold_answer": "relax", + "os_answer": "* Admire their work\n* Take a break\n* Share their work with others\n* Seek feedback\n* Start a new piece of art", + "os_eval": "Correct", + "mcq_answer": "B. relax", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "To get clean clothes you to what to them?", + "gold_answer": "launder", + "os_answer": "Wash them", + "os_eval": "Correct", + "mcq_answer": "D. launder", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The person tried to reduce his weight with a shrink ray, but he got it backwards and only did what?", + "gold_answer": "make larger", + "os_answer": "Increased his weight", + "os_eval": "Correct", + "mcq_answer": "A. grow", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you wanted to show off silk, what item could it be on?", + "gold_answer": "expensive clothing", + "os_answer": "Dress", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What will happen if you inject water into yourself?", + "gold_answer": "thin blood", + "os_answer": "Injecting water into oneself can lead to a condition called water intoxication, also known as hyponatremia. This occurs when the sodium levels in your blood become dangerously low due to the dilution of sodium by the injected water. Symptoms of water intoxication include nausea, vomiting, seizures, coma, and even death in severe cases.", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Athletes soak in hot tubs to relieve what after playing baseball?", + "gold_answer": "fame", + "os_answer": "Muscle soreness", + "os_eval": "Incorrect", + "mcq_answer": "E. sore muscles", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you hear a violin along side many string and wind instruments?", + "gold_answer": "orchestra", + "os_answer": "An orchestra", + "os_eval": "Correct", + "mcq_answer": "C. orchestra", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is the sun ultimately responsible for?", + "gold_answer": "life on earth", + "os_answer": "The sun is ultimately responsible for life on Earth.", + "os_eval": "Correct", + "mcq_answer": "D. life on earth", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Mandy lived in a train station. She longed to see distant places. Where might she imagine going?", + "gold_answer": "europe", + "os_answer": "-Faraway cities\n-Tropical islands\n-Historical landmarks\n-Mountainous regions\n-Foreign countries", + "os_eval": "Incorrect", + "mcq_answer": "D. europe", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Joe is a squirrel, which is an animal. He probably lives in what sort of place.", + "gold_answer": "woodland", + "os_answer": "A forest", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where could a personal ficus live?", + "gold_answer": "front yard", + "os_answer": "Indoors", + "os_eval": "Incorrect", + "mcq_answer": "D. conservatory", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If the president wanted to ban snakes, where would he issue such a decree?", + "gold_answer": "street", + "os_answer": "Executive Order", + "os_eval": "Incorrect", + "mcq_answer": "E. white house", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "They were searching for rocks, so they missed the birds overhead as they stared at the what?", + "gold_answer": "ground", + "os_answer": "Ground", + "os_eval": "Correct", + "mcq_answer": "A. ground", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you expect to find a dictionary along side other writings you can borrow?", + "gold_answer": "classroom", + "os_answer": "Library", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What would be necessary for getting in shape?", + "gold_answer": "exercise", + "os_answer": "* **Exercise:** Regular physical activity is necessary for getting in shape. This could include activities like running, swimming, biking, or strength training.\n* **Healthy diet:** Eating a balanced diet that is rich in fruits, vegetables, and whole grains is essential for fueling your body and providing it with the nutrients it needs to function properly.\n* **Adequate sleep:** Getting enough sleep allows your body to rest and repair itself.\n* **Hydration:** Staying hydrated is important for overall health and well-being. Drinking plenty of water throughout the day will help you stay energized and help your body function properly.\n* **Consistency:** The key to getting in shape is to be consistent with your exercise routine and healthy habits.", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A statue that shoots liquid is called a what?", + "gold_answer": "water fountain", + "os_answer": "Fountain", + "os_eval": "Correct", + "mcq_answer": "A. water fountain", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you have a child who gets in trouble for being hyperactive you may need to teach them how to what down?", + "gold_answer": "calm", + "os_answer": "Calm down", + "os_eval": "Correct", + "mcq_answer": "B. calm", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What can you use to store a book while traveling?", + "gold_answer": "suitcase", + "os_answer": "Book bag, backpack, tote bag, suitcase, briefcase", + "os_eval": "Correct", + "mcq_answer": "C. backpack", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find gazelle under a G?", + "gold_answer": "open field", + "os_answer": "Geography", + "os_eval": "Incorrect", + "mcq_answer": "C. dictionary", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Competing can lead to great highs, and also great lows when suffering what?", + "gold_answer": "defeat", + "os_answer": "Defeat", + "os_eval": "Correct", + "mcq_answer": "D. defeat", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What blocks sunshine?", + "gold_answer": "summer", + "os_answer": "Clouds, trees, buildings, mountains, and umbrellas", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "When you feel too much heat in your home you can turn on what?", + "gold_answer": "coolness", + "os_answer": "Air conditioning", + "os_eval": "Incorrect", + "mcq_answer": "E. air conditioning", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you store a pillow case that is not in use?", + "gold_answer": "drawer", + "os_answer": "Linen closet", + "os_eval": "Incorrect", + "mcq_answer": "D. drawer", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If the kitten was going to grow up to be a mouser like it's mother, where should it spend most of it's time?", + "gold_answer": "farmhouse", + "os_answer": "In the barn or other areas where mice are likely to be present", + "os_eval": "Incorrect", + "mcq_answer": "B. floor", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is that man buying silk from?", + "gold_answer": "china", + "os_answer": "A silk shop", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a teacher likely to keep her clavichord?", + "gold_answer": "music room", + "os_answer": "The teacher is unlikely to keep her clavichord at school. She is more likely to keep it at home.", + "os_eval": "Incorrect", + "mcq_answer": "D. music room", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where are you if your bieifcase is going through an x-ray machine?", + "gold_answer": "airport", + "os_answer": "Airport Security", + "os_eval": "Correct", + "mcq_answer": "C. airport", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why would you take a bus to work?", + "gold_answer": "commute", + "os_answer": "* **Cost-effectiveness:** Buses are often more affordable than driving or taking a taxi, especially for long commutes.\n* **Convenience:** Buses run on fixed routes and schedules, making it easy to plan your commute. Many bus stops are conveniently located near residential and business areas.\n* **Reduced stress:** You can relax and read, work, or listen to music on the bus, eliminating the stress of driving.\n* **Environmental friendliness:** Buses emit fewer emissions than cars, contributing to a cleaner environment.\n* **Time-saving (in some cases):** In densely populated areas, buses can be faster than driving during peak hours due to traffic congestion.\n* **Socializing:** Riding the bus provides an opportunity to interact with others and build a sense of community.\n* **Accessibility:** Buses are accessible to individuals who do not have a driver's license or access to a car.\n* **Reliability:** Buses are generally reliable and operate even in inclement weather.\n* **Flexibility:** Some bus systems offer flexible routes and schedules, allowing for customization of your commute.\n* **Lack of parking:** In urban areas, finding parking can be difficult and expensive. Taking the bus eliminates this hassle.", + "os_eval": "Incorrect", + "mcq_answer": "A. commute", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you are hungry and going fishing, why would you be going fishing?", + "gold_answer": "catching fish", + "os_answer": "To catch fish to eat", + "os_eval": "Correct", + "mcq_answer": "C. catching fish", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Dogs are very loyal if they have a good owner, they will always what them?", + "gold_answer": "defend", + "os_answer": "Protect", + "os_eval": "Correct", + "mcq_answer": "D. defend", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "For many males hair is a concern as they get older, it begins to what, causing a receding hairline?", + "gold_answer": "fall out", + "os_answer": "Thin", + "os_eval": "Incorrect", + "mcq_answer": "C.", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The fresh herbs, flowers, and vegetables will shrivel up if people don't do this?", + "gold_answer": "water plants", + "os_answer": "Water them", + "os_eval": "Correct", + "mcq_answer": "A. water plants", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "I picked from an apple tree outside of Fort Wayne, where am I?", + "gold_answer": "indiana", + "os_answer": "Indiana", + "os_eval": "Correct", + "mcq_answer": "C. indiana", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you're celebrating with too many cocktails what may you have in the morning?", + "gold_answer": "hang over", + "os_answer": "A hangover", + "os_eval": "Correct", + "mcq_answer": "D.", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The architect thought that a mezzanine would look good, but the planning committee rejected it. They told the architect that they felt it was a potential hazard given the ages of the people who would be using it. What might they be designing?", + "gold_answer": "actors", + "os_answer": "A playground", + "os_eval": "Incorrect", + "mcq_answer": "E. school", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The person wasn't bothered by the weather, she had remembered to bring her what?", + "gold_answer": "read book", + "os_answer": "Umbrella", + "os_eval": "Incorrect", + "mcq_answer": "E. warm coat", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you want to learn about the world and understand the real reasons behind cultural norms and mores, you have achieved a sense of what?", + "gold_answer": "enlightenment", + "os_answer": "Anthropological awareness", + "os_eval": "Incorrect", + "mcq_answer": "A. enlightenment", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A person would join a trade school for finding information related to what?", + "gold_answer": "gaining knowledge", + "os_answer": "Vocational skills", + "os_eval": "Incorrect", + "mcq_answer": "C. understanding of", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Joan was a baby, so there were many things she couldn't do, which caused problems for her parents. Name one thing that makes raising a baby difficult.", + "gold_answer": "arrive early", + "os_answer": "Babies are completely dependent on their caregivers for all of their needs, which can be physically and emotionally demanding.", + "os_eval": "Incorrect", + "mcq_answer": "B. learn to walk", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you put some ham if you want to cook it?", + "gold_answer": "pizza", + "os_answer": "In the oven", + "os_eval": "Incorrect", + "mcq_answer": "E. part of meal", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Running errands with screaming kids will likely cause what?", + "gold_answer": "aggravation", + "os_answer": "Stress and annoyance", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Sam wasn't lying, but he left out important details. He was being what?", + "gold_answer": "deceitful", + "os_answer": "Evasive", + "os_eval": "Incorrect", + "mcq_answer": "D. deceptive", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where may you be if you're buying pork chops at a corner shop?", + "gold_answer": "england", + "os_answer": "A butcher shop", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a well used toy car likely to be found?", + "gold_answer": "child's room", + "os_answer": "Playroom", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can fisherman store their rods when on a fishing trip?", + "gold_answer": "fishing camp", + "os_answer": "Rod holder, rod rack, or in the boat", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Danny is having fun just dancing and singing with his friends. He wasn't concerned with things that weren't fun. For him having fun is the same as what?", + "gold_answer": "being happy", + "os_answer": "Living the moment", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find an office worker gossiping with their colleagues?", + "gold_answer": "water cooler", + "os_answer": "Break room", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you put nails if they are already packaged?", + "gold_answer": "cabinet", + "os_answer": "In a toolbox or a designated storage area for nails", + "os_eval": "Incorrect", + "mcq_answer": "E. store", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a person who is good at sports considered?", + "gold_answer": "talented", + "os_answer": "Athletic", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where does a child likely sit at a desk?", + "gold_answer": "schoolroom", + "os_answer": "Center", + "os_eval": "Incorrect", + "mcq_answer": "B. schoolroom", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does playing soccer and winning lead to?", + "gold_answer": "excitement", + "os_answer": "- Increased self-confidence\n- Improved physical fitness\n- Stronger team bonds\n- A sense of accomplishment\n- Possible recognition and rewards", + "os_eval": "Incorrect", + "mcq_answer": "A. excitement", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What attraction is sometimes so large that you need a map to find your way around?", + "gold_answer": "amusement park", + "os_answer": "Mall", + "os_eval": "Incorrect", + "mcq_answer": "A. amusement park", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If my husband never helps me doing housework, what might that lead to?", + "gold_answer": "arguments", + "os_answer": "- Resentment and frustration in the relationship\n- Unequal distribution of household responsibilities\n- Increased stress and workload for the person doing all the housework\n- Potential conflicts and arguments over housework\n- Feeling undervalued or unappreciated in the relationship\n- Damage to the overall relationship dynamics and harmony", + "os_eval": "Correct", + "mcq_answer": "B. arguments", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The juror was quite bored and zoning out but wanted to convey he was hearing testimony, so he just sat there doing what?", + "gold_answer": "nodding", + "os_answer": "Nodding", + "os_eval": "Correct", + "mcq_answer": "B. nodding", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When a main artery is used to expedite travel what would it be referred to as?", + "gold_answer": "thruway", + "os_answer": "Artery road", + "os_eval": "Incorrect", + "mcq_answer": "D. thruway", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If someone rules the universe of what are they in charge?", + "gold_answer": "everything", + "os_answer": "Everything", + "os_eval": "Correct", + "mcq_answer": "C. everything", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can many stores with clothing be found?", + "gold_answer": "mall", + "os_answer": "Shopping mall", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When an elderly person needs help performing daily tasks, who might they call?", + "gold_answer": "caregiver", + "os_answer": "Family member, friend, neighbor, home health aide, nurse, social worker", + "os_eval": "Correct", + "mcq_answer": "C. caregiver", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is beer drank by people watching sticks and pucks?", + "gold_answer": "hockey game", + "os_answer": "Hockey arena", + "os_eval": "Correct", + "mcq_answer": "C. hockey game", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where might you see a green field while driving?", + "gold_answer": "countryside", + "os_answer": "Golf course", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "I am looking for honey right from the source, where should I look?", + "gold_answer": "beehive", + "os_answer": "Beehive", + "os_eval": "Correct", + "mcq_answer": "B. beehive", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A weasel has a thin body and short legs to easier burrow after prey in a what?", + "gold_answer": "tree", + "os_answer": "Narrow space", + "os_eval": "Incorrect", + "mcq_answer": "E. rabbit warren", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is one likely to find a fan for their stove?", + "gold_answer": "appliance store", + "os_answer": "Hardware store", + "os_eval": "Correct", + "mcq_answer": "A. appliance store", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Jodie felt a tightness in her chest. She was worried but didn't want to go to the hospital. Where might she go instead?", + "gold_answer": "bedroom", + "os_answer": "Urgent care clinic", + "os_eval": "Incorrect", + "mcq_answer": "C. bedroom", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you're buying beer for a float trip what are you preparing to do?", + "gold_answer": "have fun", + "os_answer": "Go on a river trip", + "os_eval": "Incorrect", + "mcq_answer": "B. have fun", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Piece of land in Canada where you can find marmot?", + "gold_answer": "vancouver island", + "os_answer": "Banff National Park", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find a fox that is made up?", + "gold_answer": "storybook", + "os_answer": "In a fable or story", + "os_eval": "Correct", + "mcq_answer": "A. storybook", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "In basic training they build you up only to do what, all in hopes of building you up even stronger the next time?", + "gold_answer": "tear down", + "os_answer": "Break you down", + "os_eval": "Correct", + "mcq_answer": "B. tear down", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Billy saw a dog running from him and did his best to get away from it. The leaped up to where the dog couldn't reach and was stuck. Where might he have been trapped?", + "gold_answer": "table", + "os_answer": "A tree", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "John and Judy were parents. They had two wonderful kids who weren't always well behaved. They were light tough, though. They felt it was a parent's job to do what?", + "gold_answer": "guide children", + "os_answer": "Discipline their children", + "os_eval": "Incorrect", + "mcq_answer": "B. guide children", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What are you playing if you're fiddling on a violin?", + "gold_answer": "bluegrass music", + "os_answer": "Music", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If somebody buys something and gives it to me as a free gift, what is the cost status of the gift?", + "gold_answer": "paid for", + "os_answer": "Free", + "os_eval": "Incorrect", + "mcq_answer": "C. paid for", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why does someone flirt with many people at once?", + "gold_answer": "attract attention", + "os_answer": "* Seeking validation and attention\n* Avoiding emotional intimacy\n* Playing a game or having fun\n* Exploring different options\n* Boosting their self-esteem\n* Exploring their sexuality\n* Masking insecurity or loneliness", + "os_eval": "Correct", + "mcq_answer": "D. attract attention", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why would a band be performing when there are no people nearby?", + "gold_answer": "record album", + "os_answer": "* Practicing for an upcoming performance\n* Recording a music video or album\n* Filming a scene for a movie or TV show\n* Promoting their music or band\n* Enjoying themselves or having fun\n* Raising awareness for a cause or event\n* Participating in a busking competition\n* Creating content for social media or online platforms", + "os_eval": "Correct", + "mcq_answer": "E. practice", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is used to grind wheat for bread?", + "gold_answer": "farmer's field", + "os_answer": "Millstone", + "os_eval": "Incorrect", + "mcq_answer": "E. mill", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you have a large satchel with you when you fly you'll be asked to store it where?", + "gold_answer": "luggage compartment", + "os_answer": "Overhead bin", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would someone keep their nylon leggings?", + "gold_answer": "stockings", + "os_answer": "Drawer", + "os_eval": "Incorrect", + "mcq_answer": "E. drawer", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you spend a long time running after a ball how are you likely to feel?", + "gold_answer": "laughter", + "os_answer": "Breathless", + "os_eval": "Incorrect", + "mcq_answer": "D. breathing heavily", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "When you need to rest it's often because you have been doing what?", + "gold_answer": "action", + "os_answer": "Working or exerting energy", + "os_eval": "Correct", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "He was beginning to worry they wouldn't get on the ride before closing, they had been standing in queue for a long what?", + "gold_answer": "time", + "os_answer": "Time", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "This is an unavoidable physiological consequence of running. What is it?", + "gold_answer": "increased heart rate", + "os_answer": "Sweating", + "os_eval": "Incorrect", + "mcq_answer": "B.", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Sometimes a person has a fear of water or a dislike of being wet, it is still important to make sure they are having a bath why?", + "gold_answer": "flooding", + "os_answer": "To maintain personal hygiene, prevent infections and skin conditions, and promote overall health and well-being.", + "os_eval": "Incorrect", + "mcq_answer": "D. get wet", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "To get out of there the person had to keep on walking, they had to keep on what?", + "gold_answer": "moving forward", + "os_answer": "Moving", + "os_eval": "Correct", + "mcq_answer": "A. moving forward", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Joe and Jill didn't want their children to be sedentary. They might limit the time they children spend doing what?", + "gold_answer": "watch tv", + "os_answer": "Watching TV or playing video games", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "They were making sauerkraut, the instructor explained the liquid should be above the cabbage in the what?", + "gold_answer": "jar", + "os_answer": "Jar", + "os_eval": "Correct", + "mcq_answer": "A. jar", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "From where would you normally take a cup when you're about to get a drink?", + "gold_answer": "dishwasher", + "os_answer": "Kitchen cabinet or cupboard", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What are you using if there are speakers strapped on your ears?", + "gold_answer": "headphones", + "os_answer": "Headphones", + "os_eval": "Correct", + "mcq_answer": "B. headphones", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The bald eagle flew from Mount St Helen's to the Puget Sound and all over what?", + "gold_answer": "washington state", + "os_answer": "Washington State", + "os_eval": "Correct", + "mcq_answer": "C. pacific northwest", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "How can people fulfill their own calorie requirements?", + "gold_answer": "feed themselves", + "os_answer": "* Consume a balanced diet that includes a variety of foods from all food groups.\n* Choose nutrient-rich foods that are high in fiber and low in saturated fat and added sugars.\n* Drink plenty of water.\n* Exercise regularly.\n* Get enough sleep.\n* Manage stress.\n* Consult with a healthcare professional or registered dietitian for personalized advice.", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does a stove do to the place that it's in?", + "gold_answer": "warm room", + "os_answer": "Makes it warm", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you aren't well rested and it's a rainy day what might you do?", + "gold_answer": "stay in bed", + "os_answer": "Take a nap or relax indoors with a warm drink and a good book.", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you have a stove if you don't live in a detached dwelling?", + "gold_answer": "tent", + "os_answer": "Kitchen", + "os_eval": "Incorrect", + "mcq_answer": "E. apartment", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What kind of place has a revolving door and has things to buy in it?", + "gold_answer": "mall", + "os_answer": "A store", + "os_eval": "Correct", + "mcq_answer": "D. mall", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can books be read?", + "gold_answer": "table", + "os_answer": "* Libraries\n* Schools\n* Homes\n* Coffee shops\n* Parks\n* On public transportation\n* At work\n* While traveling\n* In waiting rooms\n* At the beach\n* While exercising", + "os_eval": "Incorrect", + "mcq_answer": "C. table", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is seaweed usually found alive?", + "gold_answer": "water", + "os_answer": "In the ocean", + "os_eval": "Correct", + "mcq_answer": "A. ocean", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If a lizard is fed by people every day, what has happened to it?", + "gold_answer": "documentary", + "os_answer": "It has become domesticated.", + "os_eval": "Incorrect", + "mcq_answer": "E. captivity", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you wanted a license to catch crabs, what government office would you go to?", + "gold_answer": "fish department", + "os_answer": "Department of Fish and Wildlife", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What furniture will you normally find near a side chair?", + "gold_answer": "table", + "os_answer": "End table", + "os_eval": "Correct", + "mcq_answer": "B. table", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Metal is used to make what?", + "gold_answer": "instruments", + "os_answer": "- Cars\n- Buildings\n- Bridges\n- Tools\n- Appliances\n- Jewelry", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is the word added to Manchester that signifies what county it is in?", + "gold_answer": "greater manchester", + "os_answer": "Greater", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Lawyers often talk in front of an audience where?", + "gold_answer": "courtroom", + "os_answer": "Courtroom", + "os_eval": "Correct", + "mcq_answer": "B. courtroom", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If I wanted to eat something that is made from plants and needs to be washed, what would it be?", + "gold_answer": "roots", + "os_answer": "Fruit or vegetables", + "os_eval": "Incorrect", + "mcq_answer": "A. roots", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Ficus can be planted in a yard to make summer more bearable, what sort of areas do they create?", + "gold_answer": "shady places", + "os_answer": "Shady, cool areas", + "os_eval": "Correct", + "mcq_answer": "A. shady places", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Children's behavior is a direct reflection of their what?", + "gold_answer": "parents", + "os_answer": "Parents", + "os_eval": "Correct", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "John bought a new water hose. But he found his old one near his car. Where did he find the old one?", + "gold_answer": "garage", + "os_answer": "Near his car", + "os_eval": "Incorrect", + "mcq_answer": "D. garage", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do you keep your pizza slice before you eat it?", + "gold_answer": "plate", + "os_answer": "Plate or napkin", + "os_eval": "Correct", + "mcq_answer": "B. plate", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What will likely happen after stabbing to death a person?", + "gold_answer": "being arrested", + "os_answer": "Being arrested and charged with murder.", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The boat passenger was explaining his fear of blowfish, but the captain figured he meant piranhas since they were on a river in the what?", + "gold_answer": "cuba", + "os_answer": "Amazon", + "os_eval": "Incorrect", + "mcq_answer": "A. cuba", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "I want to see a prepared slide up close, what would I use to help?", + "gold_answer": "microscope", + "os_answer": "Magnifying glass", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you buy a magazine, paper or gum?", + "gold_answer": "newsstand", + "os_answer": "Convenience store", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you get some wood if you do not have any?", + "gold_answer": "lumberyard", + "os_answer": "- Lumberyard\n- Hardware store\n- Home improvement store\n- Construction site\n- Scrap yard\n- Neighbor's yard (with permission)\n- Forest or wooded area (if legal and safe to do so)\n- Pallets or crates (if available and suitable)\n- Driftwood (if near a body of water)\n- Fallen branches or trees (if safe to collect)", + "os_eval": "Correct", + "mcq_answer": "D. lumberyard", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What negative effect can competing in a chess game on a cold day have?", + "gold_answer": "tension", + "os_answer": "Cold hands can decrease dexterity and reaction time.", + "os_eval": "Incorrect", + "mcq_answer": "E. frostbite", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Why is it hard for a young child to read a long book?", + "gold_answer": "knowledge", + "os_answer": "* Lack of sustained attention span\n* Limited vocabulary and comprehension skills\n* Fatigue and difficulty staying focused for extended periods\n* Difficulty decoding unfamiliar words and understanding complex sentences\n* Limited background knowledge and experience to make connections with the text", + "os_eval": "Incorrect", + "mcq_answer": "E. many words", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "On a hot day what can you do to enjoy something cool and sweet?", + "gold_answer": "dive", + "os_answer": "- Eat ice cream or frozen yogurt.\n- Make a smoothie or milkshake.\n- Drink a cold glass of lemonade or iced tea.\n- Eat fresh fruit, such as watermelon or berries.\n- Make a popsicle or ice cube treat.\n- Dip fruit or cookies in melted chocolate and freeze.\n- Freeze grapes or other small fruit and eat them as a snack.\n- Make a frozen fruit salad.\n- Make a no-bake cheesecake or other dessert that can be chilled.", + "os_eval": "Incorrect", + "mcq_answer": "E. eat ice cream", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is likely to be found in a book that is not a foreword?", + "gold_answer": "last word", + "os_answer": "Introduction, chapters, acknowledgements, bibliography, index", + "os_eval": "Incorrect", + "mcq_answer": "D. afterword", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "How many hours are in a day?", + "gold_answer": "twenty four", + "os_answer": "24", + "os_eval": "Correct", + "mcq_answer": "D. twenty four", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The couple explained they were having trouble communicating, it seemed every conversation took great what?", + "gold_answer": "effort", + "os_answer": "Effort", + "os_eval": "Correct", + "mcq_answer": "B. effort", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What would a person need to do if his or her captain dies at sea?", + "gold_answer": "cross street", + "os_answer": "* **Take command of the vessel immediately.** This is essential for the safety of the crew and passengers.\n* **Inform the crew and passengers of the captain's death.** This will help to maintain order and prevent panic.\n* **Navigate the vessel to the nearest port.** This is where the authorities can be notified and arrangements can be made for a new captain.\n* **Cooperate with the authorities.** This will help to ensure a smooth transition of power and prevent any legal complications.", + "os_eval": "Incorrect", + "mcq_answer": "E. man crew", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What do children require to grow up healthy?", + "gold_answer": "need care", + "os_answer": "- Nutritious food\n- Safe and clean environment\n- Access to healthcare\n- Education and support\n- Love and nurturing relationships", + "os_eval": "Correct", + "mcq_answer": "A. need care", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The field general began to write out a letter to the king, he was told to send what when the enemy was near?", + "gold_answer": "word", + "os_answer": "A messenger", + "os_eval": "Correct", + "mcq_answer": "C. word", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What will you put on a pen to prevent it from drying out?", + "gold_answer": "caps", + "os_answer": "Cap", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "They dealt with combustible mixtures in their experiments, this is why they kept a fire extinguisher where?", + "gold_answer": "chemistry lab", + "os_answer": "Nearby", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The man working in the attic swatted away a bee, but soon the single bee was an entire what?", + "gold_answer": "swarm", + "os_answer": "Swarm", + "os_eval": "Correct", + "mcq_answer": "A. swarm", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do you need to wear when hiking?", + "gold_answer": "shin splints", + "os_answer": "* Comfortable, moisture-wicking clothing\n* Sturdy, supportive hiking boots\n* Hat to protect from the sun\n* Sunglasses to protect eyes from glare\n* Backpack to carry water, snacks, and other essentials\n* Whistle or other device for signaling help in case of emergency", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What type of store would have lots of sports equipment?", + "gold_answer": "sporting goods store", + "os_answer": "Sporting goods store", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you buy a replacement ax handle?", + "gold_answer": "hardware store", + "os_answer": "Hardware store", + "os_eval": "Correct", + "mcq_answer": "B. hardware store", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Is that person acting as silly as a clown?", + "gold_answer": "ridiculous", + "os_answer": "That depends on the person's behavior. If they are engaging in exaggerated, nonsensical, or childish actions that would typically be associated with a clown, then yes, they could be considered to be acting as silly as a clown.", + "os_eval": "Incorrect", + "mcq_answer": "B. ridiculous", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Which group of states is Louisiana part of?", + "gold_answer": "gulf states", + "os_answer": "Deep South", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you put a plate immediately after eating from it?", + "gold_answer": "dishwasher", + "os_answer": "In the sink", + "os_eval": "Incorrect", + "mcq_answer": "D. dishwasher", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do people do when they don't understand something?", + "gold_answer": "ask questions", + "os_answer": "* Ask questions\n* Seek information from reliable sources\n* Research the topic\n* Consult with experts\n* Break the concept down into smaller parts\n* Look for examples and analogies\n* Engage in discussions or debates\n* Use visual aids or demonstrations\n* Practice and repetition", + "os_eval": "Correct", + "mcq_answer": "A. ask questions", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "James saw a kite flying in the sky. He traced the string back to its origin and found it. Where did the string begin?", + "gold_answer": "end of line", + "os_answer": "In James's hand", + "os_eval": "Incorrect", + "mcq_answer": "E. child's hand", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a likely place for an ivy plant?", + "gold_answer": "outside", + "os_answer": "Growing up a wall", + "os_eval": "Correct", + "mcq_answer": "D. outside", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What type of residence has a ground floor with a stoop?", + "gold_answer": "brownstone", + "os_answer": "Brownstone", + "os_eval": "Correct", + "mcq_answer": "A. brownstone", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If the wood texture is not smooth it is what?", + "gold_answer": "porous", + "os_answer": "Rough", + "os_eval": "Incorrect", + "mcq_answer": "B. porous", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What might happen if someone is not losing weight?", + "gold_answer": "death", + "os_answer": "* **Not eating at a calorie deficit:** To lose weight, one must consume fewer calories than they burn. If someone is not losing weight, they may not be in a calorie deficit.\n* **Not exercising enough:** Exercise burns calories and helps build muscle, which can boost metabolism. If someone is not exercising enough, they may not be burning enough calories to lose weight.\n* **Medical conditions:** Some medical conditions, such as hypothyroidism, can make it difficult to lose weight. If someone has a medical condition that may be affecting their weight loss, they should see a doctor.\n* **Medications:** Some medications, such as steroids, can cause weight gain. If someone is taking a medication that may be affecting their weight, they should talk to their doctor.\n* **Stress:** Stress can lead to overeating and weight gain. If someone is experiencing stress, they should find healthy ways to manage it, such as exercise, meditation, or yoga.\n* **Lack of sleep:** Lack of sleep can disrupt hormones that regulate appetite and metabolism. If someone is not getting enough sleep, they may be more likely to overeat and gain weight.\n* **Emotional eating:** Emotional eating is eating in response to emotions, such as stress, sadness, or boredom. If someone is an emotional eater, they may need to find healthier ways to cope with their emotions.", + "os_eval": "Incorrect", + "mcq_answer": "A. loose skin", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Billy lived in the capital of his country, then he moved. Where might he move to?", + "gold_answer": "small town", + "os_answer": "Billy could move to a variety of places, including:\n- Another city within his country\n- A different country\n- A rural area\n- A smaller town\n- A suburb", + "os_eval": "Correct", + "mcq_answer": "A. small town", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What could prevent a driving car from continuing to drive?", + "gold_answer": "automobile accidents", + "os_answer": "- Lack of fuel\n- Mechanical failure\n- Flat tire\n- Road closure\n- Traffic jam\n- Accident\n- Driver fatigue\n- Bad weather conditions\n- Lack of visibility\n- Animal on the road\n- Police checkpoint\n- Speeding ticket\n- Parking violation", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a person likely to experience after they stop being married to a mean person?", + "gold_answer": "happiness", + "os_answer": "Relief, freedom, and a sense of peace", + "os_eval": "Correct", + "mcq_answer": "D. relief", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Despite the large crowds, how did the depressed man feel?", + "gold_answer": "solitary", + "os_answer": "Isolated and alone", + "os_eval": "Correct", + "mcq_answer": "B. alone", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where does a maid empty a trash can?", + "gold_answer": "motel", + "os_answer": "Into a garbage bag or dumpster", + "os_eval": "Incorrect", + "mcq_answer": "D. motel", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The dog curled up for a nap, it was tuckered out because it had just been what?", + "gold_answer": "walked", + "os_answer": "Exercising", + "os_eval": "Correct", + "mcq_answer": "A. walked", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do the feathers look like on birds found in the rainforest?", + "gold_answer": "very colorful", + "os_answer": "Brightly colored and iridescent", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is the opposite of an area of elevation?", + "gold_answer": "depression", + "os_answer": "Depression", + "os_eval": "Correct", + "mcq_answer": "C. depression", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do singers need to do before a show?", + "gold_answer": "warm up", + "os_answer": "* Practice and rehearse their songs\n* Warm up their voices\n* Check their equipment\n* Do soundchecks\n* Get into costume and makeup\n* Relax and focus", + "os_eval": "Correct", + "mcq_answer": "A. warm up", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What type of feeling is performing for the first time likely to produce?", + "gold_answer": "action", + "os_answer": "Nervousness", + "os_eval": "Incorrect", + "mcq_answer": "E. anxiety", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If someone is found to be committing murder, what did they do to someone?", + "gold_answer": "kill", + "os_answer": "Killed them", + "os_eval": "Correct", + "mcq_answer": "B. kill", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The computer was hooked up to the internet, what could it do as a result?", + "gold_answer": "process information", + "os_answer": "Access online resources, communicate with others, download software, shop, play games, stream media, etc.", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Seeing idea become reality was a dream of hers for a long time, but as the time came to get on stage she had more what?", + "gold_answer": "anxiety", + "os_answer": "nerves", + "os_eval": "Correct", + "mcq_answer": "B. anxiety", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where off the eastern U.S. would you find an anemone?", + "gold_answer": "florida keys", + "os_answer": "In the ocean", + "os_eval": "Incorrect", + "mcq_answer": "B. tide pool", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where are traveling clothes often kept?", + "gold_answer": "suitcase", + "os_answer": "Suitcase", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Although the sun did rise, what did the pessimist warn everyone it would do?", + "gold_answer": "go down", + "os_answer": "Rain", + "os_eval": "Incorrect", + "mcq_answer": "B. go down", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The hardcovers were especially tall, so he removed a shelf on the what to make room?", + "gold_answer": "chest of drawers", + "os_answer": "Bookcase", + "os_eval": "Incorrect", + "mcq_answer": "E. bookcase", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you're watching a comedy film what would you expect to hear from the audience?", + "gold_answer": "laughter", + "os_answer": "Laughter", + "os_eval": "Correct", + "mcq_answer": "D. laughter", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What can eating lunch cause that is painful?", + "gold_answer": "heartburn", + "os_answer": "Heartburn", + "os_eval": "Correct", + "mcq_answer": "C. heartburn", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Eating is part of living, but your body doesn't use it all and the next day you will be doing what?", + "gold_answer": "reduced", + "os_answer": "Eliminating", + "os_eval": "Incorrect", + "mcq_answer": "E. defecating", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What would you use to find a place to stay?", + "gold_answer": "phone book", + "os_answer": "- Online booking platforms (e.g., Airbnb, Vrbo, Booking.com)\n- Travel search engines (e.g., Google Travel, Kayak, Skyscanner)\n- Hotel websites\n- Local tourism websites\n- Travel agents\n- Recommendations from friends or family\n- Social media groups or forums\n- Local newspapers or magazines\n- Walking or driving around the area to look for available accommodations", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you're seeking a connection for your laptop, what are you trying to hook up with?", + "gold_answer": "computer network", + "os_answer": "The internet", + "os_eval": "Correct", + "mcq_answer": "A. computer network", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What can happen when you contemplate alone for a long time?", + "gold_answer": "daydream", + "os_answer": "- Overthinking and negative thought patterns\n- Increased stress and anxiety\n- Difficulty making decisions\n- Obsessive thoughts\n- Loss of focus and productivity\n- Reduced social interaction\n- Increased risk of mental health issues such as depression and anxiety disorders", + "os_eval": "Incorrect", + "mcq_answer": "C. get ideas", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "I was apprehensive to buy the expensive equipment to play a game with so much walking and swinging around in grass, but now I understand why people what?", + "gold_answer": "play golf", + "os_answer": "Enjoy the game more", + "os_eval": "Incorrect", + "mcq_answer": "B. play golf", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "John needed a straight wire. Unfortunately, this one had endured some abuse and had become what?", + "gold_answer": "bent", + "os_answer": "Bent", + "os_eval": "Correct", + "mcq_answer": "A. bent", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Metal is taken from what which is pulled from the ground?", + "gold_answer": "ore", + "os_answer": "Ore", + "os_eval": "Correct", + "mcq_answer": "C. ore", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Sean was a wreck. He loved to build houses, but in his current state, he couldn't do what?", + "gold_answer": "construct", + "os_answer": "Cannot be answered due to inappropriate content", + "os_eval": "Incorrect", + "mcq_answer": "E. build", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What would be happening if you are pretending to be a police officer?", + "gold_answer": "deception", + "os_answer": "You would be committing a crime known as impersonating a police officer, which is illegal in most jurisdictions.", + "os_eval": "Correct", + "mcq_answer": "C. deception", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you buy a finely crafted writing instrument?", + "gold_answer": "stationery store", + "os_answer": "Pen store or stationer's", + "os_eval": "Correct", + "mcq_answer": "C. stationery store", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The detective was finding information from witnesses, why would he do that?", + "gold_answer": "get answers", + "os_answer": "To gather evidence and reconstruct the events of a crime.", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Joe found spiders in the place where he keeps his tools. Where might that be?", + "gold_answer": "garage", + "os_answer": "Basement", + "os_eval": "Incorrect", + "mcq_answer": "D. garage", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "While on the fan boat he thought he'd see swamps and gators, but he was surprised to spot a bald eagle in what nature area?", + "gold_answer": "everglades", + "os_answer": "Wetlands", + "os_eval": "Incorrect", + "mcq_answer": "A. everglades", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where are you likely to find a supermarket?", + "gold_answer": "city or town", + "os_answer": "In a commercial area or shopping center", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you need to use a lantern?", + "gold_answer": "dark place", + "os_answer": "Camping, power outages, exploring caves, hiking at night", + "os_eval": "Correct", + "mcq_answer": "D. dark place", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What area does a police officer patrol?", + "gold_answer": "beat", + "os_answer": "A designated geographic area", + "os_eval": "Correct", + "mcq_answer": "C. beat", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is made up of people?", + "gold_answer": "audience", + "os_answer": "Society", + "os_eval": "Incorrect", + "mcq_answer": "B. audience", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why would a small dog pant if it's hot outside?", + "gold_answer": "heat", + "os_answer": "To cool down", + "os_eval": "Correct", + "mcq_answer": "C. heat", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you display a picture on a horizontal surface?", + "gold_answer": "shelf", + "os_answer": "On a table, shelf, desk, or mantel", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What skill is needed for riding a bike?", + "gold_answer": "wheels", + "os_answer": "Balance", + "os_eval": "Incorrect", + "mcq_answer": "E. good balance", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The department to where vendors deliver goods for sale is called what?", + "gold_answer": "receiving", + "os_answer": "Receiving", + "os_eval": "Correct", + "mcq_answer": "C. receiving", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Exercise is very good for you, for faster recovery you should always do what afterwards?", + "gold_answer": "stretch", + "os_answer": "Stretch", + "os_eval": "Correct", + "mcq_answer": "A. stretch", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What happens when you go somewhere and forget something at home?", + "gold_answer": "go back", + "os_answer": "You may have to go back and get it, or you may have to do without it.", + "os_eval": "Correct", + "mcq_answer": "D. go back", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you acquire a wind instrument for you own use?", + "gold_answer": "music store", + "os_answer": "Music store", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If a storey contained a panoramic view, what kind of structure would it be in?", + "gold_answer": "tall building", + "os_answer": "A skyscraper", + "os_eval": "Correct", + "mcq_answer": "D. tall building", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What should I do with a jumping rope?", + "gold_answer": "fatigue", + "os_answer": "Jump with it.", + "os_eval": "Incorrect", + "mcq_answer": "E. hopping", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What do geese do every fall in fields?", + "gold_answer": "guard house", + "os_answer": "Geese migrate south for the winter.", + "os_eval": "Incorrect", + "mcq_answer": "D. follow ultralight airplane", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where outside of a city would a squirrel live?", + "gold_answer": "forest", + "os_answer": "Forest", + "os_eval": "Correct", + "mcq_answer": "C. forest", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "You should watch out for snakes if floating down what African body of water?", + "gold_answer": "amazon river", + "os_answer": "Nile River", + "os_eval": "Incorrect", + "mcq_answer": "D. amazon river", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "To what do trees roots cling?", + "gold_answer": "yard", + "os_answer": "Soil", + "os_eval": "Correct", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What could people do that involves talking?", + "gold_answer": "confession", + "os_answer": "* Having a conversation\n* Giving a speech\n* Making a phone call\n* Giving a presentation\n* Reading aloud\n* Singing\n* Debating\n* Arguing\n* Gossiping\n* Storytelling\n* Interviewing\n* Counseling\n* Teaching\n* Broadcasting\n* Public speaking\n* Hosting\n* Commentating\n* Announcing\n* Preaching", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you're a child answering questions and an adult is asking them that adult is doing what?", + "gold_answer": "teaching", + "os_answer": "Educating", + "os_eval": "Correct", + "mcq_answer": "C. teaching", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When you get an F, you fail. If you get A's you are?", + "gold_answer": "passing", + "os_answer": "Successful", + "os_eval": "Incorrect", + "mcq_answer": "C. passed", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is the main purpose of having a bath?", + "gold_answer": "cleanness", + "os_answer": "To clean and refresh oneself", + "os_eval": "Correct", + "mcq_answer": "A. cleanness", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The ball was hit over a boundary and struck an audience member. What kind of game were they playing?", + "gold_answer": "sporting event", + "os_answer": "Cricket", + "os_eval": "Incorrect", + "mcq_answer": "A. sporting event", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is someone operating a vehicle likely to be accused of after becoming inebriated?", + "gold_answer": "drunk driving", + "os_answer": "Driving under the influence (DUI)", + "os_eval": "Correct", + "mcq_answer": "D. drunk driving", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you get jewelry if you do not have any?", + "gold_answer": "department store", + "os_answer": "* Pawn shop\n* Flea market\n* Thrift store\n* Online marketplace\n* Garage sale", + "os_eval": "Incorrect", + "mcq_answer": "D. department store", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do young boys do on the ice in the winter?", + "gold_answer": "play hockey", + "os_answer": "Play hockey, sled, ice skate", + "os_eval": "Correct", + "mcq_answer": "B. play hockey", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "She loved spending money at the thrift store on knickknacks, this resulted in a lot of what on every shelf in her house?", + "gold_answer": "clutter", + "os_answer": "Clutter", + "os_eval": "Correct", + "mcq_answer": "B. clutter", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Joe was there to meet a large number of people. As he filed though the entrance hall, he saw many strangers who came from far away. What sort of building is he probably in?", + "gold_answer": "convention center", + "os_answer": "Airport", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The family wanted to adopt for enviro-ethical reasons, what did they abhor?", + "gold_answer": "biological child", + "os_answer": "Animal cruelty", + "os_eval": "Incorrect", + "mcq_answer": "A. orphan", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What happens when airplane engines cut off and are unable to be restarted in flight?", + "gold_answer": "crash", + "os_answer": "The plane will glide for a certain distance, depending on its altitude, speed, and weight. The pilot will attempt to restart the engines or land the plane on a suitable surface, such as an airport or open field. If the engines cannot be restarted and a suitable landing surface cannot be found, the plane will eventually crash.", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you be concerned about finding a cavity?", + "gold_answer": "solid object", + "os_answer": "In a tooth", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Human beings learn about current events from what print item?", + "gold_answer": "read newspapers", + "os_answer": "Newspaper", + "os_eval": "Correct", + "mcq_answer": "C. read newspapers", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "In what kind of environment does an anemone live?", + "gold_answer": "sea water", + "os_answer": "Ocean", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If I am suffering from boredom, and I want to see something beautiful, what should I do?", + "gold_answer": "see art", + "os_answer": "* Visit a museum or art gallery to appreciate paintings, sculptures, and other works of art.\n* Stroll through a botanical garden or arboretum to admire the beauty of flowers, plants, and trees.\n* Attend a live performance, such as a ballet, opera, or symphony, to experience the beauty of music and dance.\n* Watch a sunrise or sunset over a scenic landscape, such as a beach, mountain, or lake.\n* Visit a planetarium to gaze at the stars and marvel at the vastness of the universe.", + "os_eval": "Correct", + "mcq_answer": "A. see art", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The goal was to hit the target, but a projectile ball can't hit anything if it isn't in what?", + "gold_answer": "motion", + "os_answer": "Motion", + "os_eval": "Correct", + "mcq_answer": "A. motion", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a good place to set a cup of coffee while relaxing?", + "gold_answer": "table", + "os_answer": "On a sturdy table or coaster", + "os_eval": "Correct", + "mcq_answer": "D. table", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If a fried egg was runny and there was no toast to sop it up, after the meal there'd be a messy what?", + "gold_answer": "plate", + "os_answer": "Plate", + "os_eval": "Correct", + "mcq_answer": "C. plate", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What will happen to animals after eating food?", + "gold_answer": "feel pleasure", + "os_answer": "Animals will typically experience the following after eating food:\n\n* **Digestion:** The food will be broken down into smaller molecules that can be absorbed by the body.\n* **Absorption:** The nutrients from the food will be absorbed into the bloodstream.\n* **Metabolism:** The nutrients will be used to provide energy and build new cells.\n* **Excretion:** The waste products from digestion will be excreted from the body.", + "os_eval": "Incorrect", + "mcq_answer": "B. digestion", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If I wanted to grow plants, where could I put a lot of dirt?", + "gold_answer": "garden", + "os_answer": "Garden, flower bed, planter, greenhouse", + "os_eval": "Correct", + "mcq_answer": "D. garden", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does a person often feel about someone judging them guilty?", + "gold_answer": "resentment", + "os_answer": "Resentment, anger, frustration", + "os_eval": "Correct", + "mcq_answer": "C. resentment", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A town between two mountains is located in a what?", + "gold_answer": "valley", + "os_answer": "Valley", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why did the heavy metal band need electricity at the stadium?", + "gold_answer": "concert", + "os_answer": "To power their amplifiers and other electrical equipment.", + "os_eval": "Incorrect", + "mcq_answer": "A. concert", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a person looking for when completing puzzles or riddles?", + "gold_answer": "intellectual challenge", + "os_answer": "Intellectual challenge, entertainment, satisfaction of solving a problem", + "os_eval": "Correct", + "mcq_answer": "C. intellectual challenge", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If someone was making breakfast, they'd probably put two slices of bread in the what?", + "gold_answer": "toaster", + "os_answer": "Toaster", + "os_eval": "Correct", + "mcq_answer": "D. toaster", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is part of a republic like the USA?", + "gold_answer": "state", + "os_answer": "Representative government", + "os_eval": "Incorrect", + "mcq_answer": "D. democracy", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do you keep extra clothing on a hike?", + "gold_answer": "person", + "os_answer": "Backpack", + "os_eval": "Incorrect", + "mcq_answer": "E. backpack", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "There was no shade for Jenny. She was forced to lie there exposed to what?", + "gold_answer": "full sunlight", + "os_answer": "The sun", + "os_eval": "Correct", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What could happen to you after you are cleaning house for a long time?", + "gold_answer": "exhaustion", + "os_answer": "- Fatigue\n- Muscle aches\n- Dehydration\n- Allergic reactions (if exposed to cleaning chemicals)\n- Skin irritation", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is someone doing when scheduling when to go to party?", + "gold_answer": "rumpspringa", + "os_answer": "Planning their attendance at the party", + "os_eval": "Incorrect", + "mcq_answer": "E. plan", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What kind of path do comets tend to have?", + "gold_answer": "set orbits", + "os_answer": "Elliptical", + "os_eval": "Correct", + "mcq_answer": "E. solid nucleus", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The vet found malignant tumors on the animals, what is their likely fate?", + "gold_answer": "die of cancer", + "os_answer": "The animals are likely to die or need to be euthanized.", + "os_eval": "Correct", + "mcq_answer": "A. euthanasia", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "what is printed with ink and distributed daily?", + "gold_answer": "newspaper", + "os_answer": "Newspaper", + "os_eval": "Correct", + "mcq_answer": "C. newspaper", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What are people likely to do when an unexpected decent outcome occurs?", + "gold_answer": "thank god", + "os_answer": "* Be surprised or even shocked\n* Be relieved or happy\n* Try to understand why the outcome occurred\n* Adjust their expectations or plans accordingly\n* Express gratitude or appreciation", + "os_eval": "Correct", + "mcq_answer": "B. thank god", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The company sent off many purchases, they used recycled cardboard as their what?", + "gold_answer": "packaging materials", + "os_answer": "Packaging", + "os_eval": "Correct", + "mcq_answer": "A. packaging materials", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why might a person be known as a liar?", + "gold_answer": "false information", + "os_answer": "* They have a history of telling untruths.\n* They are known to exaggerate or embellish stories.\n* They have been caught in lies in the past.\n* They are known to be untrustworthy or unreliable.\n* They have a reputation for being deceptive or dishonest.", + "os_eval": "Correct", + "mcq_answer": "B. false information", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The child was politely waiting for dessert, he was eventually rewarded for his what?", + "gold_answer": "timing", + "os_answer": "Patience", + "os_eval": "Incorrect", + "mcq_answer": "E. patience", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What do you call the caretakers of a child?", + "gold_answer": "principal", + "os_answer": "Parents", + "os_eval": "Incorrect", + "mcq_answer": "E. parents", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Working on the elaborate task was taxing, it require extreme what?", + "gold_answer": "concentration", + "os_answer": "Concentration", + "os_eval": "Correct", + "mcq_answer": "C. energy", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What may you have after awaking after a night of heavy drinking?", + "gold_answer": "headache", + "os_answer": "Hangover", + "os_eval": "Correct", + "mcq_answer": "D. headache", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What uses a ribbon to put words on paper?", + "gold_answer": "wrapping paper", + "os_answer": "Typewriter", + "os_eval": "Incorrect", + "mcq_answer": "E. typewriter", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where are sheep likely to live?", + "gold_answer": "farm", + "os_answer": "Farm or pasture", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If I was watching TV on the couch and the air was stuffy, I might turn the fan on to make the what more comfortable?", + "gold_answer": "living room", + "os_answer": "Air", + "os_eval": "Incorrect", + "mcq_answer": "B. living room", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Who watches a play in an auditorium?", + "gold_answer": "crowd", + "os_answer": "Audience", + "os_eval": "Correct", + "mcq_answer": "B. crowd", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a possible outcome for committing murder?", + "gold_answer": "imprisonment", + "os_answer": "Life in prison", + "os_eval": "Correct", + "mcq_answer": "B. incarceration", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "where is a good place to obtain new soap?", + "gold_answer": "supermarket", + "os_answer": "Store", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do professors primarily do?", + "gold_answer": "master physics", + "os_answer": "Teach, research, and publish", + "os_eval": "Incorrect", + "mcq_answer": "E. teach courses", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do you throw a ball at pins?", + "gold_answer": "bowling alley", + "os_answer": "Bowling alley", + "os_eval": "Correct", + "mcq_answer": "A. bowling alley", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What might you need to do cleaning?", + "gold_answer": "sing a song", + "os_answer": "- Cleaning supplies (such as soap, detergent, bleach, etc.)\n- Cleaning tools (such as brooms, mops, sponges, cloths, etc.)\n- Water\n- Gloves\n- Vacuum cleaner\n- Dustpan and brush\n- Ladder\n- Step stool\n- Cleaning caddy\n- Cleaning rags\n- Cleaning wipes\n- Disinfectant\n- Deodorizer\n- Air freshener", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If student got a list of supplies from class like paper and pencils, their parent would have to go where?", + "gold_answer": "store", + "os_answer": "To the store", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If a house has a subscription, what likely shows up in the driveway every morning?", + "gold_answer": "newspaper", + "os_answer": "Newspaper", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "what does a person do to stay healthy?", + "gold_answer": "eat every day", + "os_answer": "* Eat a healthy diet\n* Exercise regularly\n* Maintain a healthy weight\n* Get enough sleep\n* Manage stress\n* Avoid tobacco smoke\n* Limit alcohol intake\n* Get vaccinated\n* See a doctor regularly", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If a person stutters when he experiences anxiety or excitement, he'll have difficult doing what?", + "gold_answer": "express information", + "os_answer": "Public speaking", + "os_eval": "Correct", + "mcq_answer": "A. express information", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do people need to do to change their lives?", + "gold_answer": "face problems", + "os_answer": "* **Identify the areas of their lives that they want to change.** This could include their career, relationships, health, or anything else that is not currently fulfilling them.\n* **Set realistic goals for themselves.** Trying to change too much too quickly can be overwhelming and lead to discouragement. It is better to start with small, achievable goals and build from there.\n* **Create a plan of action.** This should include specific steps that they need to take to reach their goals. It is important to be realistic about the amount of time and effort that will be required.\n* **Take action.** This is the most important step. Once they have a plan, they need to take action and start working towards their goals.\n* **Be patient and persistent.** Change takes time and effort. There will be setbacks along the way, but it is important to stay focused on their goals and not give up.\n* **Seek support from others.** This could include friends, family, a therapist, or a support group. Having people to help them through the process can make it easier to stay motivated and on track.", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Humans need shelter to survive. They usually find shelter where?", + "gold_answer": "homes", + "os_answer": "Buildings, homes, tents, caves, vehicles, or other structures that provide protection from the elements", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Someone who had a very bad flight might be given a trip in this to make up for it?", + "gold_answer": "first class", + "os_answer": "First class", + "os_eval": "Correct", + "mcq_answer": "A. first class", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The water in clouds turn in to what when it gets cold?", + "gold_answer": "snowflake", + "os_answer": "Rain, snow, sleet, or hail", + "os_eval": "Incorrect", + "mcq_answer": "B. snowflake", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What southern U.S. state is know for having many swamps?", + "gold_answer": "louisiana", + "os_answer": "Louisiana", + "os_eval": "Correct", + "mcq_answer": "D. louisiana", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When going to sleep what happens to your body?", + "gold_answer": "relaxation", + "os_answer": "* Body temperature decreases\n* Heart rate and breathing slow down\n* Muscles relax\n* Brain activity slows down\n* Eyes move slowly under the eyelids (REM sleep)", + "os_eval": "Correct", + "mcq_answer": "D. relaxation", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a monkey likely to enjoy being?", + "gold_answer": "banana tree", + "os_answer": "In a forest or jungle", + "os_eval": "Incorrect", + "mcq_answer": "A. banana tree", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a form of anaerobic exercising?", + "gold_answer": "shortness of breath", + "os_answer": "Sprinting", + "os_eval": "Incorrect", + "mcq_answer": "E. run", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "The earth is one planet in what?", + "gold_answer": "solar system", + "os_answer": "Solar System", + "os_eval": "Correct", + "mcq_answer": "C. solar system", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "James was below the balloon. He watched it rise. What direction did he look in?", + "gold_answer": "upstairs", + "os_answer": "Up", + "os_eval": "Incorrect", + "mcq_answer": "E. upwards", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Joe's cat smelled something delicious and jumped into this, causing him to panic and fear for its life. Where might it have jumped?", + "gold_answer": "microwave", + "os_answer": "A refrigerator", + "os_eval": "Incorrect", + "mcq_answer": "C. microwave", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why would a person put flowers in a room with dirty gym socks?", + "gold_answer": "smell good", + "os_answer": "It is unlikely that a person would put flowers in a room with dirty gym socks because the smell of the socks would overpower the fragrance of the flowers.", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The table wasn't level. some parts were higher and some were lower with no rhyme or reason. It was very what?", + "gold_answer": "uneven", + "os_answer": "Uneven", + "os_eval": "Correct", + "mcq_answer": "C. uneven", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The person signed up for home insurance, what is he seeking?", + "gold_answer": "financial security", + "os_answer": "Protection from financial loss in case of damage to their home or belongings", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "James know that committing murder was wrong, but he thought that he could get away with it. He was really troubled and fearful because of what?", + "gold_answer": "prosecution", + "os_answer": "His conscience", + "os_eval": "Incorrect", + "mcq_answer": "C. prosecution", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "How can someone die from eating hamburger?", + "gold_answer": "mad cow disease", + "os_answer": "* Choking on a piece of hamburger\n* Food poisoning from undercooked or contaminated meat\n* Allergic reaction to ingredients in the hamburger, such as beef, dairy, or wheat", + "os_eval": "Incorrect", + "mcq_answer": "C. mad cow disease", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does a self assured person often do?", + "gold_answer": "feel important", + "os_answer": "* Maintains eye contact\n* Speaks confidently\n* Stands up straight\n* Has good posture\n* Is assertive\n* Is not afraid to take risks\n* Believes in their own abilities\n* Is not easily swayed by others", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "He was very outgoing, for him making friends was no personal what?", + "gold_answer": "conflict", + "os_answer": "Problem", + "os_eval": "Incorrect", + "mcq_answer": "A. scary", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Paul wants carrots and doesn't need to drive anywhere. He gets them from where?", + "gold_answer": "refrigerator", + "os_answer": "Grocery store", + "os_eval": "Incorrect", + "mcq_answer": "A. refrigerator", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What could you use to fill a cup and then drink from it?", + "gold_answer": "water fountain", + "os_answer": "A straw", + "os_eval": "Incorrect", + "mcq_answer": "D. water fountain", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you were looking for a blowfish, you wouldn't look on dry land, you'd look in a what?", + "gold_answer": "body of water", + "os_answer": "Water", + "os_eval": "Correct", + "mcq_answer": "D. body of water", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "George checked the rotor of the Apache, which wasn't powered by internal combustion, but by what?", + "gold_answer": "jet engine", + "os_answer": "Jet fuel", + "os_eval": "Incorrect", + "mcq_answer": "C. electric motor", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a salt shaker most often kept?", + "gold_answer": "table setting", + "os_answer": "On the dining table or kitchen counter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you put a dollar if you want to go to a store and buy something with it?", + "gold_answer": "pocket", + "os_answer": "In your wallet or pocket", + "os_eval": "Correct", + "mcq_answer": "D. pocket", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What room is likely to have a sideboard on the counter?", + "gold_answer": "home", + "os_answer": "Kitchen", + "os_eval": "Incorrect", + "mcq_answer": "E. kitchen", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is unlikely to get bugs on its windshield due to bugs' inability to reach it when it is moving?", + "gold_answer": "airplane", + "os_answer": "A Motorcycle", + "os_eval": "Incorrect", + "mcq_answer": "A. airplane", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can a bath towel be borrowed?", + "gold_answer": "at hotel", + "os_answer": "Hotel, gym, pool, beach, friend's house, family member's house", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why do people stop caring about their problems?", + "gold_answer": "no problems", + "os_answer": "* **Avoidance:** People may stop caring about their problems to avoid dealing with the negative emotions and stress associated with them.\n* **Overwhelm:** When problems become overwhelming, people may feel helpless and give up trying to find solutions.\n* **Learned helplessness:** Past experiences of failing to solve problems can lead people to believe they are incapable of handling them.\n* **Distraction:** People may seek out distractions to avoid thinking about their problems, leading to a decreased sense of urgency.\n* **Denial:** Some people may deny the existence or severity of their problems, which can prevent them from taking action.\n* **Self-sabotage:** People may subconsciously engage in behaviors that worsen their problems due to low self-esteem or a desire for punishment.\n* **Emotional exhaustion:** Dealing with chronic problems can lead to emotional exhaustion, making it difficult to care about them.\n* **Lack of support:** Without adequate support from others, people may feel isolated and lose the motivation to address their problems.\n* **Trauma:** Traumatic experiences can lead to emotional numbing and a decreased ability to care about anything.\n* **Mental health conditions:** Certain mental health conditions, such as depression and anxiety, can affect a person's ability to care about their problems.", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "They were never going to be big actors, but they all had passion for the local what?", + "gold_answer": "theater", + "os_answer": "theater", + "os_eval": "Correct", + "mcq_answer": "A. theater", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you use a folding chair but not store one?", + "gold_answer": "beach", + "os_answer": "At a park", + "os_eval": "Incorrect", + "mcq_answer": "B. city hall", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you spend a long time shopping in uncomfortable shoes, you might develop what?", + "gold_answer": "calluses", + "os_answer": "Blisters", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does impeachment mean for the president?", + "gold_answer": "trouble", + "os_answer": "Impeachment is the process by which a legislative body levels charges against a government official. In the United States, the House of Representatives has the sole power to impeach the President, Vice President, and all civil officers of the United States. The Senate then holds a trial to determine whether to remove the official from office. If two-thirds of the Senate votes to convict, the official is removed from office.\n\nImpeachment is a serious matter, and it is only used in cases of high crimes and misdemeanors. Some of the most common reasons for impeachment include bribery, perjury, and obstruction of justice.\n\nIf the President is impeached, he or she will face a trial in the Senate. The Senate will vote on whether to convict the President. If two-thirds of the Senate votes to convict, the President will be removed from office.\n\nImpeachment is a rare occurrence. Only three Presidents have ever been impeached: Andrew Johnson, Bill Clinton, and Donald Trump. None of them were convicted and removed from office.", + "os_eval": "Incorrect", + "mcq_answer": "C. trouble", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Noble citizen of the Roman empire believed those born with lower status were what to them?", + "gold_answer": "inferior", + "os_answer": "Inferior", + "os_eval": "Correct", + "mcq_answer": "D. inferior", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Spraining an ankle while playing baseball will cause what?", + "gold_answer": "strikes", + "os_answer": "Pain, swelling, and difficulty walking", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "John was traveling to a new city and took time to check out a business. He noticed that its carpet was stained with sauces and ketchup. What type of business might that be?", + "gold_answer": "bedroom", + "os_answer": "Restaurant", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If you have a condo in a Wisconsin city known for beer, where are you?", + "gold_answer": "city", + "os_answer": "Milwaukee", + "os_eval": "Incorrect", + "mcq_answer": "E. milwaukee", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "How does someone go about buying beer?", + "gold_answer": "have no money", + "os_answer": "1. **Find a store that sells beer.** This could be a grocery store, convenience store, or liquor store.\n2. **Choose the beer you want to buy.** There are many different types of beer available, so take some time to browse and find one that you think you'll enjoy.\n3. **Bring the beer to the checkout counter.** The cashier will scan the barcode on the beer and tell you the total cost.\n4. **Pay for the beer.** You can pay with cash, credit card, or debit card.\n5. **Take the beer home and enjoy it.**", + "os_eval": "Incorrect", + "mcq_answer": "E. spend money", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If there is gum on your shoe where did it likely come from?", + "gold_answer": "sidewalk", + "os_answer": "Someone stepped on it.", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is main benefit to exercising?", + "gold_answer": "get in shape", + "os_answer": "Improved physical and mental health", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a tactic used to interfere with learning about science?", + "gold_answer": "intimidation", + "os_answer": "Misinformation", + "os_eval": "Incorrect", + "mcq_answer": "D. intimidation", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do people usually feel when falling in love?", + "gold_answer": "happiness", + "os_answer": "* Joy\n* Excitement\n* Happiness\n* Vulnerability\n* Passion\n* Hope\n* Optimism\n* Attraction\n* Euphoria\n* Fulfillment", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why are dogs often known as man's best friend?", + "gold_answer": "very loyal", + "os_answer": "Dogs are often known as man's best friend because they have many qualities that make them ideal companions for humans:\n\n* **Loyalty:** Dogs are incredibly loyal creatures, and they will often bond deeply with their owners. They are always happy to see their humans, and they will often go to great lengths to protect them.\n* **Affection:** Dogs are very affectionate animals, and they love to cuddle and be petted. They enjoy spending time with their humans, and they make great companions for those who are looking for a loving and affectionate pet.\n* **Intelligence:** Dogs are very intelligent animals, and they are able to learn a variety of commands and tricks. They are also able to understand human emotions, and they can often provide comfort and support when their humans are feeling down.\n* **Playfulness:** Dogs are playful animals, and they love to play fetch, go for walks, and chase squirrels. They are always up for a good time, and they can help their humans to stay active and healthy.\n* **Protection:** Dogs are natural protectors, and they will often bark at strangers or other animals that they perceive as a threat. They can be a great deterrent to crime, and they can help to keep their humans safe.", + "os_eval": "Correct", + "mcq_answer": "C. very loyal", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you buy a two wheel transportation machine?", + "gold_answer": "bicycle shop", + "os_answer": "Bicycle store", + "os_eval": "Correct", + "mcq_answer": "D. bicycle shop", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do you buy condoms?", + "gold_answer": "supermarket", + "os_answer": "Pharmacy", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a likely place to store unused soap?", + "gold_answer": "cabinet", + "os_answer": "Soap Dish", + "os_eval": "Incorrect", + "mcq_answer": "A. cabinet", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Loss of someone you love can cause what kind of feeling in your heart?", + "gold_answer": "painful", + "os_answer": "Sadness", + "os_eval": "Correct", + "mcq_answer": "A. painful", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where in your home would you keep a ballpoint pen when not in use?", + "gold_answer": "desk drawer", + "os_answer": "* Desk or office area\n* Kitchen drawer\n* Junk drawer\n* Nightstand drawer\n* Bathroom counter or vanity drawer", + "os_eval": "Correct", + "mcq_answer": "C. desk drawer", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can a student learn to play a triangle?", + "gold_answer": "math class", + "os_answer": "Music class", + "os_eval": "Incorrect", + "mcq_answer": "E. music class", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "When you stroke a dogs fur what have you done?", + "gold_answer": "petted", + "os_answer": "Stimulated hair follicles", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The wood was still rough to the touch, what did the woodworker have to do?", + "gold_answer": "sanded", + "os_answer": "Sand it", + "os_eval": "Correct", + "mcq_answer": "B. sanded", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The chief saw his entire tribe wiped out, he was a leader with a single what?", + "gold_answer": "follower", + "os_answer": "Follower", + "os_eval": "Correct", + "mcq_answer": "A. peon", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "If while driving to work another car makes a careless maneuver, what emotion might you feel?", + "gold_answer": "boredom", + "os_answer": "Anger or frustration", + "os_eval": "Incorrect", + "mcq_answer": "E. road rage", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find the sharpest parts of a triangle?", + "gold_answer": "three vertices", + "os_answer": "At the vertices", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "How might a automobile get off a freeway?", + "gold_answer": "exit ramp", + "os_answer": "Take an exit ramp", + "os_eval": "Correct", + "mcq_answer": "A. exit ramp", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Sally thought that competing wasn't worth the risk. If she pushed more what might happen?", + "gold_answer": "pressure", + "os_answer": "If Sally pushed more, she might experience one or more of the following:\n\n* Increased stress and anxiety due to the pressure to succeed.\n* Physical injury or burnout due to overexertion.\n* Relationship issues if her competitive nature negatively impacts her interactions with others.\n* Decreased job satisfaction or career advancement if her focus on competition hinders her collaboration and teamwork abilities.\n* Emotional distress or mental health issues if her self-worth becomes tied to her performance.", + "os_eval": "Correct", + "mcq_answer": "A. pressure", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "John is sitting in a toilet stall in a bathroom, outside he can hear cars going around in circles. What is the function of the place he is most likely at?", + "gold_answer": "race track", + "os_answer": "Race track", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What event might one buy tickets for seats?", + "gold_answer": "show", + "os_answer": "A concert, sporting event, or play", + "os_eval": "Correct", + "mcq_answer": "D", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "How does a planet usually move around the sun?", + "gold_answer": "writing", + "os_answer": "In an elliptical orbit", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "When a group of people are talking at work they might be doing what?", + "gold_answer": "sharing of ideas", + "os_answer": "Socializing, networking, discussing work-related matters, solving problems, brainstorming ideas, or sharing information.", + "os_eval": "Correct", + "mcq_answer": "C. sharing of ideas", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where could you find a shark before it was caught?", + "gold_answer": "tomales bay", + "os_answer": "In the ocean", + "os_eval": "Incorrect", + "mcq_answer": "B. tomales bay", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is one likely to find poker chips?", + "gold_answer": "bar", + "os_answer": "Casino", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can one obtain a bass fiddle?", + "gold_answer": "jazz band", + "os_answer": "Music store", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Why does having a disability sometimes making academic tasks hard for a person?", + "gold_answer": "mentally challenged", + "os_answer": "* Physical limitations may make it difficult to access materials, write, or interact with technology.\n* Cognitive impairments may affect memory, attention, and problem-solving abilities.\n* Sensory impairments may hinder access to visual or auditory information.\n* Communication difficulties may make it hard to ask for help or participate in class discussions.\n* Social challenges may create barriers to forming study groups or getting support from peers.\n* Emotional or mental health issues may impact motivation and focus.", + "os_eval": "Incorrect", + "mcq_answer": "A. mentally challenged", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is the purpose of playing games for children?", + "gold_answer": "learning", + "os_answer": "Games provide numerous benefits for children, including:\n\n**Cognitive Development:**\n* Enhance problem-solving skills\n* Improve memory and attention span\n* Develop strategic thinking and planning abilities\n* Encourage creativity and imagination\n\n**Social and Emotional Development:**\n* Foster cooperation and teamwork\n* Teach children to follow rules and take turns\n* Promote communication and social interaction\n* Help children develop empathy and self-regulation\n\n**Physical Development:**\n* Encourage physical activity and gross motor skills\n* Improve coordination and balance\n* Enhance hand-eye coordination and fine motor skills\n\n**Emotional Regulation:**\n* Provide a safe and controlled environment for children to express and manage their emotions\n* Help children develop coping mechanisms for stress and frustration\n\n**Entertainment and Relaxation:**\n* Provide a fun and enjoyable way to pass time\n* Help children unwind and de-stress\n* Offer a break from academic or other structured activities", + "os_eval": "Incorrect", + "mcq_answer": "B. learning", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If someone laughs after surprising them they have a good sense of what?", + "gold_answer": "humor", + "os_answer": "Humor", + "os_eval": "Correct", + "mcq_answer": "D. humor", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "People played a variety of games in the soccer field. It was the closest thing they had to what?", + "gold_answer": "park", + "os_answer": "Sports", + "os_eval": "Incorrect", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When someone has little knowledge and is judging someone they are considered what?", + "gold_answer": "ignorance", + "os_answer": "Ignorant", + "os_eval": "Correct", + "mcq_answer": "D. ignorance", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a salesman responsible to do at work?", + "gold_answer": "sell products", + "os_answer": "* Greet and assist customers\n* Determine customers' needs\n* Present products or services\n* Answer questions and provide information\n* Process transactions and close sales\n* Follow up with customers after the sale\n* Maintain a positive and professional demeanor\n* Build relationships with customers\n* Stay up-to-date on product knowledge\n* Meet sales goals", + "os_eval": "Correct", + "mcq_answer": "D. sell products", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "How does going jogging generally affect one's self esteem?", + "gold_answer": "feel better", + "os_answer": "Generally, going jogging can positively affect one's self-esteem. Here are several reasons:\n\n**1. Accomplishment and Goal Setting:** Jogging requires effort and consistency, which can lead to a sense of accomplishment when goals are achieved. Completing a jog or reaching certain milestones can boost self-confidence and a feeling of competence.\n\n**2. Improved Physical Appearance:** Jogging is a form of exercise that can help improve physical appearance by reducing body fat, toning muscles, and enhancing posture. These positive physical changes can lead to an enhanced self-image and increased self-esteem.\n\n**3. Endorphin Release:** Jogging triggers the release of endorphins, which have mood-boosting effects. Endorphins can reduce stress, anxiety, and depression, all of which can negatively impact self-esteem.\n\n**4. Sense of Control:** Jogging allows individuals to take control of their physical health and well-being. By setting goals and working towards them, people can gain a sense of control over their lives, which can translate into increased self-esteem.\n\n**5. Social Connections:** Jogging in groups or joining running clubs can provide opportunities for social interaction and support. Connecting with others who share similar goals can create a sense of belonging and improve self-worth.\n\n**6. Stress Relief:** Jogging is an effective way to manage stress, which can have negative effects on self-esteem. By releasing pent-up energy and clearing the mind, jogging can reduce stress levels and improve overall well-being.\n\n**7. Improved Sleep Quality:** Jogging can help improve sleep quality, which is essential for maintaining a positive self-image and overall mental health. When people get a good night's sleep, they tend to feel more confident and energized, which can boost self-esteem.\n\nIt's important to note that while jogging can generally have positive effects on self-esteem, individual experiences may vary. Consistency, gradual progression, and a supportive environment can help maximize the benefits for self-esteem.", + "os_eval": "Correct", + "mcq_answer": "A. feel better", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find people standing in a line outside?", + "gold_answer": "bus depot", + "os_answer": "* Bus stop\n* Ticket booth\n* Store entrance\n* Amusement park ride\n* Food truck", + "os_eval": "Correct", + "mcq_answer": "A. bus depot", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you are committing perjury you have done what while under oath?", + "gold_answer": "lie", + "os_answer": "Lied", + "os_eval": "Correct", + "mcq_answer": "D. lie", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you find the meaning of \"ficus\"?", + "gold_answer": "dictionary", + "os_answer": "Dictionary", + "os_eval": "Correct", + "mcq_answer": "A. dictionary", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The buildings were intended to not have residential kitchens in them, what were they designed for?", + "gold_answer": "university", + "os_answer": "Office space", + "os_eval": "Incorrect", + "mcq_answer": "D. university", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Animals come in all types, some fly thanks to their lightweight hollow what?", + "gold_answer": "bones", + "os_answer": "Bones", + "os_eval": "Correct", + "mcq_answer": "B. bones", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a lake likely to be glacial?", + "gold_answer": "mountains", + "os_answer": "At the foot of a mountain or in a valley", + "os_eval": "Correct", + "mcq_answer": "D. mountains", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why do some people get passports and go to different locations?", + "gold_answer": "desire to travel", + "os_answer": "* To travel for leisure or pleasure\n* To visit friends and family\n* To conduct business or attend conferences\n* To study or work abroad\n* To seek medical treatment\n* To relocate or emigrate\n* To participate in humanitarian or volunteer activities\n* To attend religious pilgrimages\n* To explore different cultures and learn new languages\n* To escape conflict or persecution", + "os_eval": "Correct", + "mcq_answer": "C. desire to travel", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where do apples form on an apple tree?", + "gold_answer": "bloom", + "os_answer": "On branches", + "os_eval": "Incorrect", + "mcq_answer": "D. bloom", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where areas are there likely to be many nightclubs?", + "gold_answer": "major city", + "os_answer": "- Downtown areas\n- Entertainment districts\n- Tourist areas\n- College towns", + "os_eval": "Correct", + "mcq_answer": "D. major city", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What does someone stop doing when being dead?", + "gold_answer": "breathing", + "os_answer": "Breathing", + "os_eval": "Correct", + "mcq_answer": "C. breathing", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The place where my linen closet is really needs repainting a light color as it only has one overhead light.", + "gold_answer": "hallway", + "os_answer": "Yes, repainting the linen closet a light color would help reflect more light and make the space feel brighter.", + "os_eval": "Incorrect", + "mcq_answer": "D. hallway", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Punk rock music is an important part of what action sport?", + "gold_answer": "skate", + "os_answer": "Skateboarding", + "os_eval": "Correct", + "mcq_answer": "A. skate", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a bird likely to make it's home?", + "gold_answer": "forest", + "os_answer": "In a tree or a nest", + "os_eval": "Incorrect", + "mcq_answer": "B. nest", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "How would you express information if you do not have a pen or pencil?", + "gold_answer": "talk", + "os_answer": "* Speak verbally\n* Use gestures and body language\n* Use objects as visual aids\n* Write in the sand or dirt\n* Use a computer or other electronic device\n* Use a whiteboard or chalkboard\n* Draw pictures or diagrams\n* Use sign language\n* Use Morse code", + "os_eval": "Correct", + "mcq_answer": "D. talk", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would your hear a bass clarinet along side other wood wind instruments?", + "gold_answer": "orchestra", + "os_answer": "In a woodwind quintet", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is the opposite of a little of something?", + "gold_answer": "much", + "os_answer": "A lot of something", + "os_eval": "Correct", + "mcq_answer": "A. much", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The piece of paper was worth a lot of money, it was an old Apple Inc what?", + "gold_answer": "stock certificate", + "os_answer": "Stock certificate", + "os_eval": "Correct", + "mcq_answer": "C. stock certificate", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If a car-less person want to listen to talk radio in private, where might they listen to it?", + "gold_answer": "bedroom", + "os_answer": "At a public library", + "os_eval": "Incorrect", + "mcq_answer": "B. bedroom", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Billy was an astronaut. When he looked at the world from space, how did it look?", + "gold_answer": "round", + "os_answer": "Round", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where is a good place to have a fireplace in a house?", + "gold_answer": "living room", + "os_answer": "Living room", + "os_eval": "Correct", + "mcq_answer": "D. living room", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is the feeling of one having fun?", + "gold_answer": "pleasure", + "os_answer": "Joy, excitement, happiness, exhilaration, amusement", + "os_eval": "Correct", + "mcq_answer": "B. pleasure", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Christians believe you will go to heaven if you're what?", + "gold_answer": "born again", + "os_answer": "Good", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When did mammoth's live?", + "gold_answer": "boscage", + "os_answer": "During the Ice Age, approximately 10,000 to 4,500 years ago", + "os_eval": "Incorrect", + "mcq_answer": "D", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What might result in an unsuccessful suicide attempt?", + "gold_answer": "interruption", + "os_answer": "- Interruption by others or self-interruption\n- Ineffective method\n- Change of heart\n- Accidental survival\n- Medical intervention\n- Resuscitation efforts", + "os_eval": "Correct", + "mcq_answer": "B. interruption", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What can happen if you are buying products that someone else does not want you to buy?", + "gold_answer": "disagreements", + "os_answer": "- You could be wasting your money.\n- You could be getting into debt.\n- You could be damaging your relationship with the person who does not want you to buy the products.\n- You could be breaking the law.", + "os_eval": "Incorrect", + "mcq_answer": "B. disagreements", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The child was getting many gifts for his birthday, his father reminded him to do what after opening each one?", + "gold_answer": "say thank", + "os_answer": "Say thank you", + "os_eval": "Correct", + "mcq_answer": "D. say thank", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "From where does a snowflake form?", + "gold_answer": "cloud", + "os_answer": "Clouds", + "os_eval": "Correct", + "mcq_answer": "A. cloud", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Applying for a job can make someone feel what sort of emotion, even if they get it?", + "gold_answer": "working hard", + "os_answer": "Nervous", + "os_eval": "Incorrect", + "mcq_answer": "E. stress", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "A farmer sees a weasel in the woods, where is the farmer?", + "gold_answer": "great outdoors", + "os_answer": "The farmer is on a farm.", + "os_eval": "Incorrect", + "mcq_answer": "D. great outdoors", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Traveling from new place to new place is likely to be what?", + "gold_answer": "exhilarating", + "os_answer": "Challenging", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Turkey only has a small northern part of their country located in part of the what?", + "gold_answer": "balkan peninsula", + "os_answer": "Europe", + "os_eval": "Incorrect", + "mcq_answer": "E. asia minor", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where might someone store a reusable shopping bag?", + "gold_answer": "supermarket", + "os_answer": "* Car trunk\n* Kitchen pantry\n* Reusable bag holder near the front door\n* Reusable bag holder in the back of the car\n* Under the kitchen sink", + "os_eval": "Incorrect", + "mcq_answer": "E. closet", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "How could you have fun by yourself with no one around you?", + "gold_answer": "watching television", + "os_answer": "* **Read a book or listen to an audiobook.** This is a great way to escape into another world and forget about your troubles.\n* **Watch a movie or TV show.** This is a great way to relax and be entertained.\n* **Play a video game.** This is a great way to challenge yourself and have some fun.\n* **Go for a walk or run.** This is a great way to get some exercise and fresh air.\n* **Meditate or do yoga.** This is a great way to relax and de-stress.\n* **Write in a journal.** This is a great way to reflect on your thoughts and feelings.\n* **Draw or paint.** This is a great way to express yourself creatively.\n* **Learn a new skill.** This is a great way to challenge yourself and expand your knowledge.\n* **Volunteer your time.** This is a great way to give back to your community and make a difference in the world.\n* **Spend time in nature.** This is a great way to relax and connect with the natural world.", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What type of fruit is easily broken in to sections?", + "gold_answer": "citrus", + "os_answer": "Orange", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Marathoners feel fatigued after running twenty six miles, but some that have pushed them self too hard might be prone to what?", + "gold_answer": "passing out", + "os_answer": "Rhabdomyolysis", + "os_eval": "Incorrect", + "mcq_answer": "E. exhaustion", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "I am cold, what should I do to stay warm?", + "gold_answer": "light fire", + "os_answer": "* Wear warm clothes, preferably layers of clothing.\n* Seek shelter from the cold, such as a warm room or building.\n* Engage in physical activity to generate body heat.\n* Drink warm beverages or eat warm food.\n* Take a warm bath or shower.\n* Use a heating pad or hot water bottle.\n* Avoid alcohol, as it can dilate blood vessels and make you feel colder.\n* Cover your head and neck, as these areas lose heat quickly.\n* Stay dry, as wet clothes can make you colder.", + "os_eval": "Incorrect", + "mcq_answer": "B. light fire", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Copulating with the wrong partner may be ill advised, many diseases can be transferred that can cause different types of what?", + "gold_answer": "intense pleasure", + "os_answer": "Illnesses", + "os_eval": "Incorrect", + "mcq_answer": "E. skin irritation", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What do audiences clap for?", + "gold_answer": "show", + "os_answer": "* To show appreciation for a performance or presentation\n* To express approval or agreement\n* To create a sense of excitement or anticipation\n* To acknowledge the end of a performance or presentation\n* To show support for a speaker or performer", + "os_eval": "Correct", + "mcq_answer": "B. theatre", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you get a balalaika if you do not have one?", + "gold_answer": "music store", + "os_answer": "- A music store\n- A pawn shop\n- Online retailers\n- A musical instrument rental shop\n- A flea market\n- A friend or family member who plays the balalaika", + "os_eval": "Correct", + "mcq_answer": "B. music store", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Hoping for a beautiful day, what did the clouds do that disappointed everyone?", + "gold_answer": "overcast", + "os_answer": "They rained", + "os_eval": "Incorrect", + "mcq_answer": "B. overcast", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The landscaper was carefully arching stones together, he was creating an elaborate what over the creek?", + "gold_answer": "park", + "os_answer": "Bridge", + "os_eval": "Incorrect", + "mcq_answer": "E. bridge", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find a ticket booth and see a concert?", + "gold_answer": "venue", + "os_answer": "Concert venue", + "os_eval": "Correct", + "mcq_answer": "D. venue", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Who is not famous for a superhighway with no speed limit?", + "gold_answer": "europe", + "os_answer": "Albert Einstein", + "os_eval": "Incorrect", + "mcq_answer": "D. city", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "No matter what date you put on it, we all know the universe to be what?", + "gold_answer": "very old", + "os_answer": "Infinite", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is a person considered a bully known for?", + "gold_answer": "made fun of", + "os_answer": "Intimidating or humiliating others", + "os_eval": "Correct", + "mcq_answer": "C", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "When cooking sheep meat a lot of people might want to be well?", + "gold_answer": "done", + "os_answer": "Done", + "os_eval": "Correct", + "mcq_answer": "C. done", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you sit in a chair while working toward an advanced degree?", + "gold_answer": "university", + "os_answer": "At a desk", + "os_eval": "Incorrect", + "mcq_answer": "D. university", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "A good interview after applying for a job may cause you to feel what?", + "gold_answer": "offer", + "os_answer": "Optimistic", + "os_eval": "Incorrect", + "mcq_answer": "E. hope", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Computers have allowed everybody to answer questions they have quickly, but still we seem to be getting duller despite access to this what?", + "gold_answer": "advance knowledge", + "os_answer": "Information", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "James decided that competing was the right choice. Not competing has a defined outcome, but if he competes then what could happen?", + "gold_answer": "might win", + "os_answer": "If James competes, he has the potential to win or lose.", + "os_eval": "Correct", + "mcq_answer": "A. might win", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What could you use to get to some airplanes?", + "gold_answer": "taxi", + "os_answer": "Runway", + "os_eval": "Incorrect", + "mcq_answer": "A. taxi", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What are our bodies doing after having food?", + "gold_answer": "digesting", + "os_answer": "* Breaking down food into nutrients\n* Absorbing nutrients into the bloodstream\n* Removing waste products\n* Storing energy for later use", + "os_eval": "Correct", + "mcq_answer": "B. digesting", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Why would one try to avoid work?", + "gold_answer": "malaise", + "os_answer": "* To prioritize personal tasks or leisure activities\n* To escape unpleasant or challenging work tasks\n* To manage stress or burnout\n* To engage in other activities that are perceived as more rewarding or enjoyable\n* To avoid social interactions or conflicts at work\n* Due to physical or mental health issues\n* To protest working conditions or policies\n* To pursue other opportunities or goals outside of work\n* To prioritize family or personal responsibilities\n* To conserve energy or avoid exhaustion", + "os_eval": "Incorrect", + "mcq_answer": "D. malaise", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What do you do in order to fly in airplane?", + "gold_answer": "buy tickets", + "os_answer": "1. Purchase a ticket for a flight.\n2. Arrive at the airport on time for your flight.\n3. Check in at the airline counter and check your baggage.\n4. Go through security screening.\n5. Board the airplane and find your seat.\n6. Fasten your seatbelt and follow the instructions of the flight attendants.\n7. Enjoy your flight.", + "os_eval": "Correct", + "mcq_answer": "E. run through checklists", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "What is another name for the color of the fur of a dog with light colored fur?", + "gold_answer": "fair", + "os_answer": "Fawn", + "os_eval": "Incorrect", + "mcq_answer": "A. fair", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "The lion sensed his competitor was timid, so what attitude did the lion take?", + "gold_answer": "aggressive", + "os_answer": "Aggressive", + "os_eval": "Correct", + "mcq_answer": "D. aggressive", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "John felt a snake slither over him as he rested. He was afraid to raise his covers for fear of startling it. Where might he be?", + "gold_answer": "bedroom", + "os_answer": "In bed", + "os_eval": "Correct", + "mcq_answer": "D. bedroom", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you find a place to eat in an urban area close to local nightlife?", + "gold_answer": "downtown", + "os_answer": "Gastropub", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "You have to a lot of thinking while studying a new subject, but it is how you gain what?", + "gold_answer": "fatigue", + "os_answer": "Knowledge", + "os_eval": "Incorrect", + "mcq_answer": "E", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "How will you communicate if you are far away from who you want to communicate with?", + "gold_answer": "think", + "os_answer": "* **Telephone:** Use a landline or mobile phone to make a voice call.\n* **Email:** Send an electronic message that can be read and responded to at the recipient's convenience.\n* **Text message:** Send a short message via a mobile phone network.\n* **Instant messaging:** Use an app or software that allows for real-time communication via text, voice, or video.\n* **Social media:** Send a message or post on a social media platform where the recipient can see it.\n* **Video call:** Use a video conferencing app or software to have a face-to-face conversation.\n* **Letter:** Write a physical letter and send it through the postal service.\n* **Carrier pigeon:** In rare cases, carrier pigeons can be used to send messages over long distances.\n* **Satellite phone:** Use a satellite phone to make calls in remote areas where there is no cellular coverage.", + "os_eval": "Incorrect", + "mcq_answer": "E. send email", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "At a shop what can you buy to put your spare unused things?", + "gold_answer": "basement", + "os_answer": "Storage container", + "os_eval": "Incorrect", + "mcq_answer": "E. container", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "David watched some nesting birds using his binoculars while on vacation. Where might David be?.", + "gold_answer": "forest", + "os_answer": "At a park, nature reserve, or other natural area with bird habitats", + "os_eval": "Correct", + "mcq_answer": "C. forest", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Where would you find many varieties of plants including a rosebush?", + "gold_answer": "kew gardens", + "os_answer": "Nursery", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What are cats often known for?", + "gold_answer": "whiskers", + "os_answer": "Curiosity, independence, cleanliness", + "os_eval": "Incorrect", + "mcq_answer": "C. purr", + "mcq_eval": false, + "dataset": "CommonsenseQA" + }, + { + "question": "Where can you find a dogs house?", + "gold_answer": "found outside", + "os_answer": "In a backyard, under a porch, or in a doghouse", + "os_eval": "Correct", + "mcq_answer": "A. found outside", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "If you really wanted a grape, where would you go to get it?", + "gold_answer": "fruit stand", + "os_answer": "Grocery store", + "os_eval": "Incorrect", + "mcq_answer": "B. fruit stand", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "Setting up framing, truss and beam are some of the first steps in what?", + "gold_answer": "new construction", + "os_answer": "Construction", + "os_eval": "Correct", + "mcq_answer": "A. new construction", + "mcq_eval": true, + "dataset": "CommonsenseQA" + }, + { + "question": "What is another name for a disk for storing information?", + "gold_answer": "computer hard drive", + "os_answer": "Floppy disk", + "os_eval": "Incorrect", + "mcq_answer": "C. computer hard drive", + "mcq_eval": true, + "dataset": "CommonsenseQA" + } +] \ No newline at end of file