diff --git "a/Large/GPT4o/Winogrande.json" "b/Large/GPT4o/Winogrande.json" new file mode 100644--- /dev/null +++ "b/Large/GPT4o/Winogrande.json" @@ -0,0 +1,11405 @@ +[ + { + "question": "Sarah was a much better surgeon than Maria so _ always got the easier cases.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah was a much better surgeon than Maria so _ always got the harder cases.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They were worried the wine would ruin the bed and the blanket, but the _ was't ruined.", + "gold_answer": "bed", + "os_answer": "bedspread", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Terry tried to bake the eggplant in the toaster oven but the _ was too big.", + "gold_answer": "eggplant", + "os_answer": "eggplant", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At night, Jeffrey always stays up later than Hunter to watch TV because _ wakes up late.", + "gold_answer": "Jeffrey", + "os_answer": "Jeffrey", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cat of Sarah has some mouth problems, so she takes it to see Maria. _ is a responsible cat owner.", + "gold_answer": "Sarah", + "os_answer": "Sarah", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The home that my parents had when I was in school was a lot nicer than my house now because the _ was sophisticated.", + "gold_answer": "home", + "os_answer": "decor", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The home that my parents had when I was in school was a lot nicer than my house now because the _ is trashy.", + "gold_answer": "house", + "os_answer": "neighborhood", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie has a rich husband and lots of money, Jennifer is poor _ needs to make her clothes.", + "gold_answer": "Jennifer", + "os_answer": "and", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe immediately went to bakery before the bank because the _ had a limited supply of what he wanted.", + "gold_answer": "bakery", + "os_answer": "bakery", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe immediately went to bakery before the bank because the _ had a substantial supply of what he wanted.", + "gold_answer": "bank", + "os_answer": "bakery", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I had to read an entire story for class tomorrow. Luckily, the _ was canceled.", + "gold_answer": "class", + "os_answer": "class", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I had to read an entire story for class tomorrow. Luckily, the _ was short.", + "gold_answer": "story", + "os_answer": "story", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He had enough time between classes to go to a cafe or to the library. He went to the _ because his paper could wait.", + "gold_answer": "cafe", + "os_answer": "cafe", + "os_eval": "Correct", + "mcq_answer": "A. cafe", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He had enough time between classes to go to a cafe or to the library. He went to the _ because his paper was due soon.", + "gold_answer": "library", + "os_answer": "library", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey like to read graphic novels but Natalie liked classic literature to read. _ bought the new Frank Miller comic at the book store.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael just bought brand new wheels for his truck unlike Leslie because _ wheels were new and perfect.", + "gold_answer": "Leslie", + "os_answer": "her", + "os_eval": "Incorrect", + "mcq_answer": "B. Leslie", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael just bought brand new wheels for his truck unlike Leslie because _ wheels were old and used.", + "gold_answer": "Michael", + "os_answer": "her", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Leslie was nervous around parrots but Neil was not, since _ was bitten by a bird early in life.", + "gold_answer": "Leslie", + "os_answer": "Leslie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christmas was a special holiday to Eric but not Adam since _ was a Jew.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "To make frosting I needed pudding that was at a store 15 minutes away but pre-made frosting was at a store 5 minutes away. The _ was closer.", + "gold_answer": "frosting", + "os_answer": "store", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin was chosen instead of Brett to be the makeup artist for the play because _ was less experienced.", + "gold_answer": "Brett", + "os_answer": "Brett", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia violated the rights of Amy, because _ had too much passivity with other people.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They had to eat a lot to gain the strength they had lost and be able to work, the _ was too much.", + "gold_answer": "work", + "os_answer": "effort", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They had to eat a lot to gain the strength they had lost and be able to work, the _ was too little.", + "gold_answer": "strength", + "os_answer": "ration", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The roof of Rachel's home is old and falling apart, while Betty's is new. The home value of _ is lower.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "All the clutter in the house excited Leslie but not Derrick because cleaning energized _ very much.", + "gold_answer": "Leslie", + "os_answer": "her", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The portions of food today were bigger than the sizes yesterday because the _ fed more people.", + "gold_answer": "portions", + "os_answer": "chef", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Since Craig threw aluminum cans in the trash and Benjamin recycled, _ was environmentally irresponsible.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine was going to Jessica's house to do some cleaning in the kitchen, because _ was a energetic person.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The students were at their desks taking tests with pencils, they used the _ to hold the papers.", + "gold_answer": "desks", + "os_answer": "clipboards", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary thought poodles were a cool dog but Rachel thought Great Danes were cooler. _ bought a small dog bed for their pet.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary thought poodles were a cool dog but Rachel thought Great Danes were cooler. _ bought a gigantic dog bed for their pet.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Leslie had a lot of issues that Kyle was tired of dealing with, so _ felt abandoned when they finally moved out.", + "gold_answer": "Leslie", + "os_answer": "Leslie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jessica enjoyed a simple, basic life with Betty, but _ was bored having a quiet existence.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I wanted to build a bathroom on the third floor of the house but I couldn't because the _ would be too full.", + "gold_answer": "floor", + "os_answer": "plumbing", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel researched laws and helped to open a preschool for Eric. Because _ is very good with kids.", + "gold_answer": "Eric", + "os_answer": "Joel", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya told Emily she couldn't come to work because her cat had an infection, but _ was lying.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela thinks her husband might be cheating with Lindsey, and _ confesses at the dinner party.", + "gold_answer": "Lindsey", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Donald's understanding of math isn't as good as Joseph's, so _ is more likely a professor.", + "gold_answer": "Joseph", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian was jealous of Brett's new car because _ couldn't afford to buy a new car.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man used his eyes to read the letters but the _ were too small.", + "gold_answer": "letters", + "os_answer": "letters", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jill was on a budget so she only bought a new dress for the ceremony and wore an old hat. She figured the _ would be less noticeable.", + "gold_answer": "hat", + "os_answer": "hat", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jill was on a budget so she only bought a new dress for the ceremony and wore an old hat. She figured the _ would be more noticeable.", + "gold_answer": "dress", + "os_answer": "dress", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "On Monday, Patricia made Felicia eggs for an early breakfast, but _ does not like fried eggs.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Since Craig wears clear contacts and William wears colored ones, it is safe to assume that _ loves the color of their eyes.", + "gold_answer": "Craig", + "os_answer": "William", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Since Craig wears clear contacts and William wears colored ones, it is safe to assume that _ dislikes the color of their eyes.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easy for Angela to become a vegetarian although Kayla couldn't do it. _ really missed the taste of chicken.", + "gold_answer": "Kayla", + "os_answer": "Kayla", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter was a better baker than Logan so _ made the kitchen a mess when they tried to make an apple pie.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya spent more on the children's birthday party than Amy. _ thought a magician was a good use of funds.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Judy bought new brushes to paint the etched glasses crack but it didn't fit. The _ was too wide.", + "gold_answer": "brush", + "os_answer": "brush", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Judy bought new brushes to paint the etched glasses crack but it didn't fit. The _ was too narrow.", + "gold_answer": "crack", + "os_answer": "brush", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I look forward to the Sunday newspaper so I can look at the comics. This is the only reason I still get the _ in this day and age.", + "gold_answer": "newspaper", + "os_answer": "newspaper", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer was more of a morning person than Natalie although _ always went to bed early and got a good night's rest.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jennifer was more of a morning person than Natalie because _ always went to bed early and got a good night's rest.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Alcohol is a love of Matthew's, but Ryan can't stand the stuff because _ is a sober alcoholic.", + "gold_answer": "Ryan", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe brought the horse out to the country quite a distance and gave him food but the _ was too much.", + "gold_answer": "distance", + "os_answer": "distance", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Randy gave their heart to Brian, and _ soon told them that they should have kept their heart to themselves.", + "gold_answer": "Brian", + "os_answer": "Brian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nick wanted to play a game on the floor, but Dennis was hesitant because of his knees. _ was disappointed.", + "gold_answer": "Nick", + "os_answer": "Nick", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Although she was being prosecuted, Monica was welcomed into the sanctuary of the church by Samantha because _ was a sinful criminal.", + "gold_answer": "Monica", + "os_answer": "Samantha", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The battle was less fierce than the great war, because the _ lasted one year.", + "gold_answer": "war", + "os_answer": "battle", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura used too much super glue on Erins hands, so _ needed to get to the doctor to separate their hands.", + "gold_answer": "Erin", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James panicked when his phone fell on the table thinking it will break but the _ is soft.", + "gold_answer": "table", + "os_answer": "tabletop", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James panicked when his phone fell on the table thinking it will break but the _ is strong.", + "gold_answer": "phone", + "os_answer": "table", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John cannot touch the cup as it was just brought out of the refrigerator. He wanted some air to blow around it. The _ is very warm.", + "gold_answer": "air", + "os_answer": "air", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The fireman used several rags to polish the nozzles on the fire hose; when he was done the _ were dirty.", + "gold_answer": "rags", + "os_answer": "rags", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary wanted to get another piercing in her ear, but the _ was much too tiny.", + "gold_answer": "ear", + "os_answer": "lobe", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary wanted to get another piercing in her ear, but the _ was much too huge.", + "gold_answer": "piercing", + "os_answer": "needle", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura just loved the taste of green beans but Felicia hated the taste of them. _ didn't have a second serving.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The bartender cut Carrie off but continued to serve Emily because _ was too drunk.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Blaze always wore a t-shirt instead of a shirt because he thought that the _ was stuffy and old fashioned.", + "gold_answer": "shirt", + "os_answer": "shirt", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The paint would melt in the sun, so we used a varnish instead, since the _ was susceptible to heat.", + "gold_answer": "paint", + "os_answer": "paint", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I tried to make mini lamps by using glow sticks in mason jars, but had to get larger jars because the _ were too big.", + "gold_answer": "glow sticks", + "os_answer": "glowsticks", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel always liked to turn the heater up higher than Joseph did for the reason that _ was never cold.", + "gold_answer": "Joseph", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel always liked to turn the heater up higher than Joseph did for the reason that _ was always cold.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The teen found the new hat was no substitute for his cool shirt. The _ was just cool to wear to school.", + "gold_answer": "shirt", + "os_answer": "hat", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary was helping Patricia's daughter put on makeup but _ watches a lot of makeup tutorials.", + "gold_answer": "Patricia", + "os_answer": "Mary", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary was helping Patricia's daughter put on makeup because _ watches a lot of makeup tutorials.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He wanted to kill time at the house instead of the playground, because everyone at the _ was fun.", + "gold_answer": "house", + "os_answer": "house", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron didn't know Dennis had a peanut allergy, so when _ made peanut chicken an ambulance was called.", + "gold_answer": "Aaron", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron didn't know Dennis had a peanut allergy, so when _ ate peanut chicken an ambulance was called.", + "gold_answer": "Dennis", + "os_answer": "Dennis", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "God liked to control the day and the night, but the _ was too bright.", + "gold_answer": "day", + "os_answer": "sun", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Brett asked Joel for advice and guidance about waxing his mustache, and afterwards _ felt burdened.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The filter in the living room needed to be changed more often than the one in the bedroom because the _ was dirtier.", + "gold_answer": "living room", + "os_answer": "air", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The filter in the living room needed to be changed more often than the one in the bedroom because the _ was cleaner.", + "gold_answer": "bedroom", + "os_answer": "bedroom", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy went over to the waiting room at the hospital to calm Samantha because _ was placid.", + "gold_answer": "Amy", + "os_answer": "it", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Megan forgot to buy deodorant at the store so they borrowed Jessica's deodorant and _ never found out.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan forgot to buy deodorant at the store so they borrowed Jessica's deodorant and _ hoped they never found out.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy thought she was the mirror image of Natalie , but _ could not be convinced to see the similarity.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy thought she was the mirror image of Natalie , but _ could not persuade her to see the similarity.", + "gold_answer": "Amy", + "os_answer": "I", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I helped my sister find her gold necklace. She couldn't wear her woven necklace to the ball because the _ was so casual.", + "gold_answer": "woven necklace", + "os_answer": "woven", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily never had as much money to spend as Carrie, because _ had a good job.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wooden doors at my friends work are worse than the wooden desks at my work, because the _ material is cheaper.", + "gold_answer": "doors", + "os_answer": "door", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wooden doors at my friends work are worse than the wooden desks at my work, because the _ material is stronger.", + "gold_answer": "desks", + "os_answer": "desk", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The arrow stuck to the bark but not the stone because the _ was flimsy.", + "gold_answer": "bark", + "os_answer": "shaft", + "os_eval": "Incorrect. The student's answer indicates that the arrow's shaft was flimsy, which doesn't align with the true answer focusing on the bark's nature as the reason for the arrow sticking. Therefore, the student's answer provides a conflicting explanation.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The arrow stuck to the bark but not the stone because the _ was hard.", + "gold_answer": "stone", + "os_answer": "stone", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The leg of the pig body stuck out of the grave where it was buried because the _ is large.", + "gold_answer": "body", + "os_answer": "pig", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sheet recovered can easily be hiding between the space in the door. The _ is thin.", + "gold_answer": "sheet", + "os_answer": "gap", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sheet recovered can easily be hiding between the space in the door. The _ is wide.", + "gold_answer": "space", + "os_answer": "gap", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mike doesn't like the table in his living room as much as the couch. The _ resonates with the other decorations.", + "gold_answer": "couch", + "os_answer": "couch", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven believes they can buy happiness but Craig thinks otherwise as _ is very realistic.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "B. Craig", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven believes they can buy happiness but Craig thinks otherwise as _ is very materialistic.", + "gold_answer": "Steven", + "os_answer": "Steven", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They brought the cornhole supplies to the camp site so they could play while adults cooked dinner. The boys really enjoyed the _ after the game.", + "gold_answer": "dinner", + "os_answer": "snacks", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The game of chess was easy to play for Angela but not Rebecca because _ had a analytical mind.", + "gold_answer": "Angela", + "os_answer": "Angela", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The game of chess was easy to play for Angela but not Rebecca because _ did not have an analytical mind.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "To pay for dinner, he used the credit card rather than cash. The _ was not available.", + "gold_answer": "cash", + "os_answer": "cash", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The plan devised by Christine to get Kayla to like them failed, as _ did not really try it.", + "gold_answer": "Christine", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Since the diabetic woman had to limit her sugar intake, she ignored the pie and had a cookie instead because the _ was full of sugar.", + "gold_answer": "pie", + "os_answer": "pie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor offered to treat the patient's illness quickly with surgery or slowly with diet, and the patient refused the _ because he felt it was dangerous.", + "gold_answer": "surgery", + "os_answer": "surgery", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Throughout the practice Rachel pushed the limits of Megan to get ready for the game because _ was the coach.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Throughout the practice Rachel pushed the limits of Megan to get ready for the game because _ was the athlete.", + "gold_answer": "Megan", + "os_answer": "Megan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah was quickly promoted to manager over Kayla, because _ excelled at angering other people.", + "gold_answer": "Kayla", + "os_answer": "Kayla", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett was browsing the internet while he found the information unlike Randy, _ prefers using books.", + "gold_answer": "Randy", + "os_answer": "who", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis knows that Jeffrey is an animal lover and _ knows he wants to go to the zoo to see them.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty drank chocolate shakes while Elena drank carrot juice, and _ had a very healthy diet.", + "gold_answer": "Elena", + "os_answer": "Elena", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty drank chocolate shakes while Elena drank carrot juice, and _ had a very unhealthy diet.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie posted their sofa for sale on Craigslist, and had received an offer they had to decline because the _ is valuable.", + "gold_answer": "sofa", + "os_answer": "sofa", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I picked up some leaves to put in the books and dry, but they didn't fit because the _ were too small.", + "gold_answer": "books", + "os_answer": "books", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I picked up some leaves to put in the books and dry, but they didn't fit because the _ were too massive.", + "gold_answer": "leaves", + "os_answer": "leaves", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The president had their speech at the auditorium rather than the park because the _ was bigger.", + "gold_answer": "auditorium", + "os_answer": "auditorium", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The president had their speech at the auditorium rather than the park because the _ was smaller.", + "gold_answer": "park", + "os_answer": "park", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Steven found that their T-shirt had shrunk in the laundry, Robert's first reaction was to laugh, and _ then became angry.", + "gold_answer": "Steven", + "os_answer": "Steven", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "When Steven found that their T-shirt had shrunk in the laundry, Robert's first reaction was to laugh, and _ became apologetic.", + "gold_answer": "Robert", + "os_answer": "then", + "os_eval": "Incorrect. The student answered \"then,\" indicating a sequence of actions, whereas the true answer \"Robert\" identifies the subject who performed the action described in the question. This discrepancy in type of information (sequential connector vs. subject name) makes the student\u2019s answer incorrect.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She counted her calories for her diet and found she needed more so she ate a brownie instead of an apple since the _ has fewer.", + "gold_answer": "apple", + "os_answer": "apple", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia liked wearing glasses more than braces because she could take the _ off after two years.", + "gold_answer": "braces", + "os_answer": "braces", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia liked wearing glasses more than braces because she could take the _ off every day.", + "gold_answer": "glasses", + "os_answer": "glasses", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Randy's hair is dry when compared to Ian's due to _ using a strong conditioner.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam was a crook and not a law-abiding citizen like Joseph, so it was surprising that _ was the one with a restraining order against him.", + "gold_answer": "Joseph", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam was law-abiding and not a crook like Joseph, so it was surprising that _ was the one with a restraining order against him.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wages at the factory were lower than the wages at the plant since it was more safe to work at the _ .", + "gold_answer": "factory", + "os_answer": "plant", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The health of Joel was stronger than that of William due to _ being a cigar smoker.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easy for Amy but not Rachel to create a meal because _ had taken woodshop in school.", + "gold_answer": "Rachel", + "os_answer": "Amy", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Ann's babies were crying, and she could give them a bottle or a rattle. She tried the _ first in case they were bored.", + "gold_answer": "rattle", + "os_answer": "rattle", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rebecca thought Disney movies were the best thing to watch but Samantha like horror movies better. _ rented Saw from Redbox.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "B. Samantha", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The house of Aaron took some damage from the storm but not Michael's house, because _ lived farther away.", + "gold_answer": "Michael", + "os_answer": "Michael", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer dragged Felicia along to a self help workshop about how to succeed, because _ wanted some company.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary can read the clock in the room at night without the light even though the _ is dark.", + "gold_answer": "room", + "os_answer": "room", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan reads a lot, while Donald almost never picks up a book because _ is a plumber.", + "gold_answer": "Donald", + "os_answer": "Donald", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan reads a lot, while Donald almost never picks up a book because _ is a student.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle wanted to crush Ryan 's dreams of becoming a movie actor. _ was a threat to him.", + "gold_answer": "Ryan", + "os_answer": "Ryan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wind during the last hurricane tried to knock over their new house, but the _ was too strong.", + "gold_answer": "house", + "os_answer": "foundation", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty made the choice to reduce Samantha's salary after _ started cutting back on efficiency.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "During the rescue mission, Maria pulled Rebecca away from the minefield since _ was a civilian.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The jewelry sold for less than the baseball card did since the _ was very common.", + "gold_answer": "jewelry", + "os_answer": "jewelry", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura brought extensions to Monica at the salon, so that _ could get their dreads treated professionally.", + "gold_answer": "Laura", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Laura brought extensions to Monica at the salon, so that _ could treat their dreads professionally.", + "gold_answer": "Monica", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The installation process was simpler for the cable over the internet because the man had never installed the _ previously.", + "gold_answer": "internet", + "os_answer": "cable", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The installation process was simpler for the cable over the internet because the man had already installed the _ previously.", + "gold_answer": "cable", + "os_answer": "router", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica wanted Mary to help them decorate their new house because _ asked them not to do it alone.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "William went on the ride more than Matthew did because _ thought it was scary.", + "gold_answer": "Matthew", + "os_answer": "Matthew", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan took Monica to a wood shack in the mountains, because _ was a kidnapper trying to hide.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the beauty salon, Angela preferred to work on her eyebrows instead of her eyelashes because the _ were already worked on.", + "gold_answer": "eyelashes", + "os_answer": "eyelashes", + "os_eval": "Correct", + "mcq_answer": "B. eyelashes", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samuel tried unsuccessfully to get Brett to skip school because _ was a truant that didn't follow the rules.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kayla prepared a foot soak bath for Cynthia for their birthday so _ is pouring in water.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man looked at the sundial since a watch or clocktower was not at his disposal, having lost the _ .", + "gold_answer": "watch", + "os_answer": "time", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter chose to eat a banana for breakfast every morning but Michael did not because _ is unconcerned about their health.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The IRS sent Tim a letter informing him of the audit, which could occure at the house or the office. Tim chose a comfortable setting of the _ .", + "gold_answer": "house", + "os_answer": "house", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia decided to buy Felicia dinner because they had been through a lot and _ just inherited some money.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia decided to buy Felicia dinner because they had been through a lot and _ just lost some money.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah thought that Elena was overpacking for Hawaii, because _ had a very full suitcase.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William liked to be outside more than Kyle so _ spent time arguing against getting a pool.", + "gold_answer": "Kyle", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B. Kyle", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William liked to be outside more than Kyle so _ spent time arguing for getting a pool.", + "gold_answer": "William", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John never mentioned his canoe, but had a long conversation with Ron about the raft, because John rarely used the _ .", + "gold_answer": "canoe", + "os_answer": "canoe", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica gives Jessica a book about posture, because _ has been trying to get better at ballet dancing.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My gun was inspected with a cloth to make sure it worked fine. The _ was hard.", + "gold_answer": "gun", + "os_answer": "barrel", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My gun was inspected with a cloth to make sure it worked fine. The _ was soft.", + "gold_answer": "cloth", + "os_answer": "cloth", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the estate sale, John saw the hammer was more affordable than the screwdriver, because the _ was used.", + "gold_answer": "hammer", + "os_answer": "screwdriver", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the estate sale, John saw the hammer was more affordable than the screwdriver, because the _ was brand new.", + "gold_answer": "screwdriver", + "os_answer": "screwdriver", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The temperature in winter is much different than summer, the _ is always lower.", + "gold_answer": "winter", + "os_answer": "temperature", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sliding glass door was broken when Eric pushed Ian through it because _ is a pushover.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman used a gentle technique when painting the urn but applied more pressure when painting the vase, because the _ was less fragile.", + "gold_answer": "Vase", + "os_answer": "vase", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman used a gentle technique when painting the urn but applied more pressure when painting the vase, because the _ was more fragile.", + "gold_answer": "Urn", + "os_answer": "urn", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tina made a schedule to keep track of her work and school obligations. She preferred to focus on the _ because she wanted to learn.", + "gold_answer": "school", + "os_answer": "studies", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica wants to protect herself from infectious diseases so she goes to doctor Samantha, because _ is careful.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kerry was running later when he took his car to work than when he took a taxi because he ran into more traffic in the _ .", + "gold_answer": "car", + "os_answer": "morning", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The history of the village is more intriguing than the history of the city because the _ is very new.", + "gold_answer": "city", + "os_answer": "city", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel told Patricia to pick up some baby powder at the store because _ had sweaty feet.", + "gold_answer": "Rachel", + "os_answer": "Patricia", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Rachel told Patricia to pick up some baby powder at the store but _ had sweaty feet too.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil looked all over the neighborhood for their missing dog until Samuel called and _ got their dog back.", + "gold_answer": "Neil", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I did not buy the color pink rose flowers for my wedding because the _ is too bright.", + "gold_answer": "color", + "os_answer": "color", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I started playing drums young. Sometimes I played in the garage and sometimes my room, but my parents preferred knowing I was in the _ .", + "gold_answer": "garage", + "os_answer": "garage", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At work, Mary uses a broiler a lot, but Rebecca uses a chainsaw. That's because _ is a tree cutter.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sand and water in the fish tank were very dirty, so the _ needed to be filtered.", + "gold_answer": "water", + "os_answer": "liquid", + "os_eval": "Incorrect. The student's answer of \"liquid\" could refer to any liquid and is not specific enough to match the \"water\" stated in the true answer. The context specifically mentions \u201cwater,\u201d making the broader term \"liquid\" inaccurate.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sand and water in the fish tank were very dirty, so the _ needed to be scrubbed.", + "gold_answer": "sand", + "os_answer": "tank", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Warts appeared on Jerry's limbs after he went through the jungle because the _ were infectious.", + "gold_answer": "warts", + "os_answer": "warts", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Pete preferred to use the sheet to the blanket, because the _ was much hotter.", + "gold_answer": "blanket", + "os_answer": "blanket", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She preferred a globe of the world made of PVC instead of plastic, because the _ made it look expensive.", + "gold_answer": "PVC", + "os_answer": "material", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "People think _ is embarassed, because Samantha made snide comments about the shirt Rebecca was wearing.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam's mindset was a lot stronger than William's because _ was able to control it.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The puncture healed quicker than the cut because the _ was a more superficial wound.", + "gold_answer": "puncture", + "os_answer": "cut", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "At the beach, Emily collected some seashells for her mother Maria. _ polished the seashells before giving them away.", + "gold_answer": "Emily", + "os_answer": "Emily", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Using a needle to sew together both the leather and silk was difficult. The _ was hard get through.", + "gold_answer": "leather", + "os_answer": "leather", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The maid took away a cozy blanket from Lawrence but not Nick because _ was very hot.", + "gold_answer": "Lawrence", + "os_answer": "it", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The maid took away a cozy blanket from Lawrence but not Nick because _ was very cold.", + "gold_answer": "Nick", + "os_answer": "Lawrence", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The photo came out of the Polaroid camera and fell onto the tray, so now the _ is lighter.", + "gold_answer": "camera", + "os_answer": "image", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Brett asked Nelson where they were because _ had no idea after he fell asleep.", + "gold_answer": "Brett", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett asked Nelson where they were because _ had had been driving after he fell asleep.", + "gold_answer": "Nelson", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Leslie coughed more when they were eating their food than Adam although there was more seasoning in the food of _ .", + "gold_answer": "Adam", + "os_answer": "Adam's", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Craig gifted Eric a new picnic table, because _ borrowed some money a while ago.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Craig gifted Eric a new picnic table, because _ lent him some money a while ago.", + "gold_answer": "Eric", + "os_answer": "Eric", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria was eager to make the big sale to Sarah , as _ needed the money that day.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria was eager to make the big sale to Sarah , as _ had the money that day.", + "gold_answer": "Sarah", + "os_answer": "Sarah", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Robert took voice lessons from Randy, because _ was known to be on American Idol.", + "gold_answer": "Randy", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Whilst on the beach Cynthia loved to wear a bikini but Laura did not because _ had a flat stomach.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Whilst on the beach Cynthia loved to wear a bikini but Laura did not because _ had a fat stomach.", + "gold_answer": "Laura", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B. Laura", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Paint was applied to the chairs but not the tables, since the _ were new.", + "gold_answer": "tables", + "os_answer": "tables", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Paint was applied to the chairs but not the tables, since the _ were old.", + "gold_answer": "chairs", + "os_answer": "tables", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "In high school Matthew was most popular among the teachers as were Steven was among the students, _ was liked by adolescents.", + "gold_answer": "Steven", + "os_answer": "Steven", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The shoe james bought got pinched by a nail while jogging because the _ is soft.", + "gold_answer": "shoe", + "os_answer": "sole", + "os_eval": "Incorrect. The student's answer specifies \"sole\" which is a part of the shoe, but it does not match the general term \"shoe\" as needed in the blank space per the true answer.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence liked watching foreign movies with subtitles unlike Jason because _ criticized the original language of the film.", + "gold_answer": "Jason", + "os_answer": "Jason", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence liked watching foreign movies with subtitles unlike Jason because _ appreciated the original language of the film.", + "gold_answer": "Lawrence", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The fishing line snagged and broke on a rock because the _ was too heavy.", + "gold_answer": "rock", + "os_answer": "weight", + "os_eval": "Incorrect. The true answer focuses on the rock being heavy as the reason for breaking the fishing line, whereas the student's answer emphasizes the weight (presumably of the line or what's attached to it) as the reason, introducing a conflicting concept.", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Johnny likes fruits more than vegetables in his new keto diet because the _ are saccharine.", + "gold_answer": "fruits", + "os_answer": "fruits", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria was still grieving the death of a friend more than Elena, because _ had a more distant relationship with the friend.", + "gold_answer": "Elena", + "os_answer": "Elena", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria was still grieving the death of a friend more than Elena, because _ had a very close relationship with the friend.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The bill had extra charges for past due and hookup. I owe the _ for being a new customer.", + "gold_answer": "hookup", + "os_answer": "hookup", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia had a much harder life than Amy, so when _ said life was good, it was an unusual sentiment.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The courage of Ian was a lot stronger than Michael because _ had been through a lot in life.", + "gold_answer": "Ian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The chef fried less mushrooms than tomatoes because the _ were ordered frequently at the restaurant.", + "gold_answer": "tomatoes", + "os_answer": "tomatoes", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence dealt the cards to Joseph at the blackjack table, because _ was a professional player.", + "gold_answer": "Joseph", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "You can grow cilantro in a garden or buy it at the store, but the _ variety will taste bland because it will be older.", + "gold_answer": "store", + "os_answer": "store", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "You can grow cilantro in a garden or buy it at the store, but the _ variety will taste better because it will be fresh.", + "gold_answer": "garden", + "os_answer": "garden", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha strictly followed their diet while Sarah ate what they felt like, and _ ate chicken and broccoli all week.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It seemed more likely that Brett would wear a fedora rather than Justin because _ was known to dress stylishly.", + "gold_answer": "Brett", + "os_answer": "Brett", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It seemed more likely that Brett would wear a fedora rather than Justin because _ did not often dress stylishly.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William did not mind if it took them a while to prepare a meal but Adam did because _ was very meticulous.", + "gold_answer": "William", + "os_answer": "he", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The wall of the house looks nicer than the one in the garage despite that the _ was painted more recently.", + "gold_answer": "garage", + "os_answer": "garage", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kevin ate large amounts of food but not Adam. _ didn't have to get checked to see if they had a tapeworm.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The computer of Victoria ran faster than that of Carrie because _ downloaded less files.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The computer of Victoria ran slower than that of Carrie because _ downloaded less files.", + "gold_answer": "Carrie", + "os_answer": "Victoria", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "My face was more familiar than it was at the bar than the gym because I went to the _ very rarely.", + "gold_answer": "gym", + "os_answer": "gym", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My face was more familiar than it was at the bar than the gym because I went to the _ several times a week.", + "gold_answer": "bar", + "os_answer": "bar", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Randy showed Samuel the abused horse that he rescued from the shelter. _ was proud of his friend.", + "gold_answer": "Samuel", + "os_answer": "Samuel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena enjoyed yoga classes while Amy preferred other forms of exercise; this was because _ was flexible.", + "gold_answer": "Elena", + "os_answer": "Elena", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena enjoyed yoga classes while Amy preferred other forms of exercise; this was because _ was inflexible.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cake that Lawrence tried to bake for Ryan didn't rise, and _ felt forgiving abut it.", + "gold_answer": "Ryan", + "os_answer": "Ryan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie took a longer time to take a bath than Jennifer because _ liked relaxing in the tub.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily said that Victoria's hijab was silly and old fashioned. _ heard some very offensive things.", + "gold_answer": "Victoria", + "os_answer": "I", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily said that Victoria's hijab was silly and old fashioned. _ said some very offensive things.", + "gold_answer": "Emily", + "os_answer": "She", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary was more reliable and hardworking than Rachel, but to be fair, _ had a better foundation as a child.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "It is likely that Donald but not Jason would get the job promotion because _ never stayed late and never did extra work.", + "gold_answer": "Jason", + "os_answer": "Jason", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "A background check was performed on Natalie by Lindsey due to _ being a nanny.", + "gold_answer": "Natalie", + "os_answer": "her", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We reached a settlement with the company but were roadblocked by the court. The _ was just more inflexible in its dealings.", + "gold_answer": "court", + "os_answer": "court", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man paid cash for the phone but purchased the tablet with credit because the _ was pricy.", + "gold_answer": "Tablet", + "os_answer": "tablet", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man paid cash for the phone but purchased the tablet with credit because the _ was inexpensive.", + "gold_answer": "Phone", + "os_answer": "phone", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "There are lots of pills in the home of Neil, but none in the house of Logan, so _ must be healthy.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie asked Betty where the children were on the playground because _ could not see them.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "the region was too crowded for our comfortable stay for all the people sent there , the _ were too small..", + "gold_answer": "region", + "os_answer": "quarters", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha had to get car insurance and Jessica did not because _ just got a new car.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stain was lighter on Jason's shirt than Donald's because _ spilled red wine and not white wine.", + "gold_answer": "Donald", + "os_answer": "Jason", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stain was darker on Jason's shirt than Donald's because _ spilled red wine and not white wine.", + "gold_answer": "Jason", + "os_answer": "Jason", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily decided to eat a lot more yucca than Carrie did. _ was still hungry.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily decided to eat a lot more yucca than Carrie did. _ was no longer hungry.", + "gold_answer": "Emily", + "os_answer": "Emily", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian needed to adjust the mirror and Craig did not because _ was shorter than the owner of the car.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian needed to adjust the mirror and Craig did not because _ was the same height as the owner of the car.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The commodities trader decided to buy wool and sell cotton because the _ was priced low.", + "gold_answer": "wool", + "os_answer": "wool", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The commodities trader decided to buy wool and sell cotton because the _ was priced high.", + "gold_answer": "cotton", + "os_answer": "cotton", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I was told my eyes are failing so I need to get glasses or contacts. I don't think I'll get the contacts since the _ seem less comfortable.", + "gold_answer": "contacts", + "os_answer": "glasses", + "os_eval": "Incorrect", + "mcq_answer": "B. contacts", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It is an article of faith that the paper is more important than the exam , even though the _ weighs less heavily on the grade.", + "gold_answer": "paper", + "os_answer": "exam", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The teenager got a job at the supermarket instead of at the diner because he had to work during school at the _ .", + "gold_answer": "diner", + "os_answer": "weekend", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The tip of James pencil was breaking while writing on the paper sheet. The _ is weak.", + "gold_answer": "pencil", + "os_answer": "lead", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William lived in a rougher part of town than Eric, so _ trained their dog as a guard dog.", + "gold_answer": "William", + "os_answer": "he", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman moved the urn in front of the vase on the shelf because the _ was attractive.", + "gold_answer": "urn", + "os_answer": "urn", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer returned the pan to Sarah because _ had borrowed it from her for the potluck party.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer returned the pan to Sarah because _ had loaned it to her for the potluck party.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor told Kevin to exercise more often but not Neil. _ had always been lazy and unmotivated.", + "gold_answer": "Kevin", + "os_answer": "Neil", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor told Kevin to exercise more often but not Neil. _ had always been active and self-motivated.", + "gold_answer": "Neil", + "os_answer": "Neil", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I always wonder how people prefer reading in a library instead of at the house because the lack of people at the _ would make it easier to concentrate.", + "gold_answer": "house", + "os_answer": "house", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I always wonder how people prefer reading in a library instead of at the house because the amount of people at the _ would make it hard to concentrate.", + "gold_answer": "library", + "os_answer": "library", + "os_eval": "Correct.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The blood sample on the slide was more helpful than the one in the vial, because the _ had been kept pristine.", + "gold_answer": "slide", + "os_answer": "slide", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan had to use a calculator on the test but Michael didn't because _ was very bad at math.", + "gold_answer": "Ryan", + "os_answer": "Ryan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The air in the shop was better than in the garage, because the _ was highly purified.", + "gold_answer": "shop", + "os_answer": "ventilation", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He went to put his pocket watch into his pocket, but realized the chain had broke. Without it, the _ doesn't function correctly.", + "gold_answer": "pocket watch", + "os_answer": "watch", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jason was easily scared, so he watched sci-fi movies instead of horror movies because the _ were not scary.", + "gold_answer": "sci-fi movies", + "os_answer": "aliens", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine accepted the over night challenge from Laura, because _ had a better chance of winning.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman kept the bikini but returned the top, because the _ was the right size.", + "gold_answer": "bikini", + "os_answer": "bottom", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman kept the bikini but returned the top, because the _ was the wrong size.", + "gold_answer": "top", + "os_answer": "bottom", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria taught Elena how to count in Malay for their trip, because _ was a visitor of the island.", + "gold_answer": "Elena", + "os_answer": "Elena", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela beat Mary in the weightlifting competition, but it wasn't fair. _ had been taking steroids.", + "gold_answer": "Angela", + "os_answer": "Mary", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty assisted Kayla with the daily analysis task they were assigned and then _ ask for help herself.", + "gold_answer": "Betty", + "os_answer": "didn't", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The store sold Michael a fake phone but not Eric so _ could still make a call.", + "gold_answer": "Eric", + "os_answer": "Eric", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The juice from the mango fruit could not fill up the cup because the _ is small.", + "gold_answer": "mango", + "os_answer": "mango", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jeri was deciding what to bring to a potluck and picked cookies over a pie because the _ could be shared with fewer people.", + "gold_answer": "pie", + "os_answer": "pie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian asked Nick to feed their rabbit,because _ was planning on going on vacation to Disney for a week.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James listened carefully to the conversation from the other room but all he could hear was the clock tickling. The _ is pretty loud.", + "gold_answer": "clock", + "os_answer": "clock", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dog that Laura found was dirtier than Amy's dog, since _ dog lived in the street.", + "gold_answer": "Laura", + "os_answer": "her", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The ambulance went to the hospital without Nelson inside but with Ryan because _ drove there in a car.", + "gold_answer": "Nelson", + "os_answer": "Nelson", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig was a very selfish individual but Kenneth was very generous. _ had a lot of good friends.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Correct", + "mcq_answer": "B. Kenneth", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It took a less time for Katrina to read the book than Cynthia since _ was a better reader.", + "gold_answer": "Katrina", + "os_answer": "Katrina", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Bobby had to use his pen to finish the exam rather than the pencil because the _ was full of ink.", + "gold_answer": "pen", + "os_answer": "pen", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easy for Matthew but not Logan to practice yoga because _ wanted to improve their mind and body.", + "gold_answer": "Matthew", + "os_answer": "Matthew", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia was called back for a second interview but not Victoria, as _ had passed the background check.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia was called back for a second interview but not Victoria, as _ had failed the background check.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Harold liked to play with dolls more than cars because the _ talked back to him.", + "gold_answer": "dolls", + "os_answer": "dolls", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "There was more dirt on the car than the bike because the _ was kept inside.", + "gold_answer": "bike", + "os_answer": "bike", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "There was more dirt on the car than the bike because the _ was kept outside.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael was a very calm person with yoga but Jeffrey was hyper so, _ decided to take a yoga class.", + "gold_answer": "Jeffrey", + "os_answer": "Jeffrey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Going to a restaurant is something that Patricia does very often but Carrie rarely goes to one because _ is a very bad cook.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Going to a restaurant is something that Patricia does very often but Carrie rarely goes to one because _ is a very good cook.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Eric went to Leslie's house to play with the new dog, but there was no answer. _ was at the park.", + "gold_answer": "Leslie", + "os_answer": "She", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica spends a lot more money on frivolous things than Rachel because _ has more disposable income.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin showed Maria to use the fork and knife in a proper manner as _ attended etiquette school.", + "gold_answer": "Erin", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian won a fish from Kenneth at the carnival so _ bagged it up and sent it home.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The hotline was staffed by Christine when Tanya called in because _ was a volunteer.", + "gold_answer": "Christine", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven helped Derrick do research on the paper because _ did not have access to the internet.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven helped Derrick do research on the paper because _ had access to the internet.", + "gold_answer": "Steven", + "os_answer": "Steven", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel got advice on buying stocks from his cousin Bob while Eric used a broker. _ had a virtually worthless portfolio of companies.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rebecca asked Kayla to turn the lights out but _ did not want to go to sleep.", + "gold_answer": "Kayla", + "os_answer": "Kayla", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis is changing the sand in a pool filter for Joseph, because _ is a bit lazy.", + "gold_answer": "Joseph", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter gave Justin two weeks to respond after sending him a demand letter. .After that _ will sue him in the court.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The mediation and medication both helped me be patient. I lost my temper when the _ got rescheduled.", + "gold_answer": "mediation", + "os_answer": "mediation", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason considers he and Benjamin to be friends so _ puts a lot of effort into their relationship.", + "gold_answer": "Jason", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason considers he and Benjamin to be friends even though _ puts little effort into their relationship.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It took a minute longer to melt the chocolate in the microwave than the caramel, because the _ was very soft.", + "gold_answer": "caramel", + "os_answer": "caramel", + "os_eval": "Correct.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It took a minute longer to melt the chocolate in the microwave than the caramel, because the _ was very firm.", + "gold_answer": "chocolate", + "os_answer": "chocolate", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They discussed the company's budget at the business meeting but the _ was boring and the meeting was ran long.", + "gold_answer": "budget", + "os_answer": "discussion", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "They discussed the company's budget at the business meeting but the _ was boring and the topic of the budget ran long.", + "gold_answer": "meeting", + "os_answer": "discussion", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sponges performed worse at cleaning the tub in the bathroom when compared with the cloths. It's because the _ are cheaper.", + "gold_answer": "sponges", + "os_answer": "cloths", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Randy only ever added a little bit of hot sauce to his food, especially compared to Adam, as _ was much more sensitive to spice.", + "gold_answer": "Randy", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Matt wanted to change either the plain bathroom or the colorful bedroom, but the _ was already colorful.", + "gold_answer": "bedroom", + "os_answer": "bathroom", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Matt wanted to change either the plain bathroom or the colorful bedroom, but the _ was already plain.", + "gold_answer": "bathroom", + "os_answer": "bathroom", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The snow came down so much that Michael had to go plow Kevins driveway because _ agreed to take care of his neighbors.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The snow came down so much that Michael had to go plow Kevins driveway because _ needed the help of his neighbors.", + "gold_answer": "Kevin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The girl used the comb to try and brush her hair but the _ was too soft.", + "gold_answer": "comb", + "os_answer": "bristles", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Police arrested Maria but let Cynthia go as _ had some paint on their hand from the spray paint used for graffiti.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Police arrested Maria but let Cynthia go as _ had no paint on their hand from the spray paint used for graffiti.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter bought a vehicle to commute in but not Dennis because _ had a driving distance to work.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey went to the doctor to treat their ailments but not Robert so _ became sicker.", + "gold_answer": "Robert", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria asked Cynthia if she could borrow some fuel for her car, as _ had a shortage of it.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In the accident the vehicle of Nelson received more damage than that of Justin, since _ vehicle was smaller.", + "gold_answer": "Nelson", + "os_answer": "Nelson's", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In the accident the vehicle of Nelson received more damage than that of Justin, since _ vehicle was bigger.", + "gold_answer": "Justin", + "os_answer": "Justin's", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela did a bunch of crunches and sit-ups but Cynthia didn't, consequentially _ had six- pack abs.", + "gold_answer": "Angela", + "os_answer": "Angela", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica is looking to buy some new furniture and Carrie just bought some, so _ is starting to anticipate their purchase arrival.", + "gold_answer": "Carrie", + "os_answer": "Monica", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Aaron showed Donald how to use google play on an android because _ owned an apple phone.", + "gold_answer": "Donald", + "os_answer": "Aaron", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina turned out to be much more spoiled than Felicia because _ did not have wealthy or generous parents.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina turned out to be much more spoiled than Felicia because _ had wealthy and generous parents.", + "gold_answer": "Katrina", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah rolls her eyes as Monica extolls the virtues of vinegar as a cleaning solution for everything since _ is bored.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nelson always had the best friendships except with Neil since _ was always so polite.", + "gold_answer": "Nelson", + "os_answer": "Neil", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Derrick really liked working in Human Resources and William wanted to work at the same company, and _ subsequently offered a position.", + "gold_answer": "Derrick", + "os_answer": "was", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Derrick really liked working in Human Resources and William wanted to work at the same company, and _ subsequently accepted a position.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The room at the hotel cost more to stay in than the room at the inn because the _ was nastier.", + "gold_answer": "inn", + "os_answer": "inn", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The room at the hotel cost more to stay in than the room at the inn because the _ was nicer.", + "gold_answer": "hotel", + "os_answer": "decor", + "os_eval": "Incorrect. The student's answer provides a reason (decor) for the difference in cost, whereas the true answer specifies that it is the hotel itself that is nicer. There's no information to directly link the decor to the overall quality of the hotel in the true answer.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman practiced for her interview and not for the sport since the _ was expedient.", + "gold_answer": "interview", + "os_answer": "interview", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The boot was removed from the car tire and put on the truck tire, since the _ was now illegally parked.", + "gold_answer": "truck", + "os_answer": "truck", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The boot was removed from the car tire and put on the truck tire, since the _ was now legally parked.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I have both glasses and contacts, but the cleaning solution was empty so I wore the _ today.", + "gold_answer": "glasses", + "os_answer": "glasses", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He found it harder to write the letter than the e-mail because the _ had so few words.", + "gold_answer": "e-mail", + "os_answer": "e-mail", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jane loved travelling internationally. The current country she was in preferred wine over tea because the _ was less available.", + "gold_answer": "tea", + "os_answer": "tea", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer wanted to get romance in a relationship while Elena did not because _ liked to watch romantic comedies.", + "gold_answer": "Jennifer", + "os_answer": "Elena", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam loved dogs but Jason was afraid of them, so only _ petted the poodle.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena brought the horse to the stables owned by Cynthia, so _ could buy the animal.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B. Cynthia", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena brought the horse to the stables owned by Cynthia, so _ could sell the animal.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Brett wanted to get a massage but Kenneth did not. This is because _ was feeling relaxed.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Correct", + "mcq_answer": "B. Kenneth", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kevin was worried about Eric's infections so _ decided to go to an emergency clinic.", + "gold_answer": "Eric", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The bird squawked at Mary's rushed approached and quieted when Jennifer came in since _ was threatening.", + "gold_answer": "Mary", + "os_answer": "nothing", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan was always behind Donald in high school because _ had a diagnosed learning disability.", + "gold_answer": "Ryan", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "People do not want to eat James burnt cake but they love his burger because the _ is tasteless.", + "gold_answer": "cake", + "os_answer": "cake", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had problems with dry skin but not Hunter since _ used a soothing skin lotion.", + "gold_answer": "Hunter", + "os_answer": "Hunter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Craig had problems with dry skin but not Hunter because _ used an irritating skin lotion.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie loves putting sugar in coffee as opposed to Laura because _ thinks the coffee tastes better.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett was actively engaged in weight loss whereas Benjamin was trying to gain weight, so _ maximized their caloric intake.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "B. Benjamin", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ben had to drain both water and oil down the sink, but the _ was too viscous.", + "gold_answer": "oil", + "os_answer": "oil", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ben had to drain both water and oil down the sink, but the _ was too fluid.", + "gold_answer": "water", + "os_answer": "oil", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "John painted the pole red close to the color of the wall and painted the frame white and now the _ is contrasting.", + "gold_answer": "frame", + "os_answer": "frame", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John painted the pole red close to the color of the wall and painted the frame white and now the _ is similar.", + "gold_answer": "pole", + "os_answer": "pole", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mark preferred his drinks in paper cups over styrofoam cups because the _ are strong.", + "gold_answer": "paper cups", + "os_answer": "paper", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica had trouble paying off their loan unlike Sarah because _ was an infrequent gambler.", + "gold_answer": "Sarah", + "os_answer": "Monica", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick was sad that Robert did not show up, _ forgot they had an agreement to meet each other.", + "gold_answer": "Robert", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She suspected that her old makeup had expired after she put it on her skin because her _ was harder.", + "gold_answer": "makeup", + "os_answer": "complexion", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kevin drew the blood from Ian's arm, because _ was giving it to do some tests.", + "gold_answer": "Ian", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sookie roasted a turkey and served it with potatoes instead of carrots, because everyone in her family would have hated the _ .", + "gold_answer": "carrots", + "os_answer": "carrots", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They were wanting to move the bed thru the door. The _ was way to small.", + "gold_answer": "door", + "os_answer": "doorway", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty learned to play the cello well but Erin did not because _ was very impatient.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan ended the one-side relationship they were having with Robert, which made _ feel relieved.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin was eating more than Betty was eating for dinner because _ had a big lunch.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin was eating more than Betty was eating for dinner because _ had skipped lunch.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I chose to drive the car over the truck because the _ had a small amount of gas.", + "gold_answer": "truck", + "os_answer": "truck", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I chose to drive the car over the truck because the _ had a large amount of gas.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The diary of Carrie is boring, and the one Jennifer writes is interestin. _ has lived a simple life.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian's hair is being worked on by Craig, so it's more likely _ is the customer.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan didn't care for the comedians show but Patricia thought it was brilliant. _ hung out for the comedian's second set.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He liked filling the bucket with the hose better than the faucet, because the _ provided extra water pressure.", + "gold_answer": "hose", + "os_answer": "hose", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine was watching makeup tutorials while Amy was not because _ wanted to forget how to put blush on correctly.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Diana went to the laundromat and she used the washer but not the dryer because she only had enough money for the _ .", + "gold_answer": "washer", + "os_answer": "washer", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ben wanted to propose to his girlfriend by hiding the ring in either cake or water. He decided to hide it in the _ because she drank the water fast.", + "gold_answer": "cake", + "os_answer": "water", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The woman avoided the hole but easily stepped over the pit, because the _ was very deep.", + "gold_answer": "hole", + "os_answer": "hole", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman avoided the hole but easily stepped over the pit, because the _ was very shallow.", + "gold_answer": "pit", + "os_answer": "pit", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After I soaked the roller in the paint container, the _ had less paint on it.", + "gold_answer": "container", + "os_answer": "roller", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The lease in the city was more than the lease in the country because the value of the property in the _ was higher.", + "gold_answer": "city", + "os_answer": "city", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The refrigerator was acting up again, so we called a technician to repair the part. The _ was fine when he showed up.", + "gold_answer": "refrigerator", + "os_answer": "technician", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin has a teenager whereas Patricia has toddler-age children because _ became a mother later.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin has a teenager whereas Patricia has toddler-age children because _ became a mother first.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kayla was very civil when dealing with Emily so that _ would be accepted by her.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin ordered a martini when Tanya only ordered a tonic water with lemon, because _ was pregnant.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The employee tried to put the extra clothes in the closets but the _ were too small.", + "gold_answer": "closets", + "os_answer": "closets", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald has a problem with hearing in his ears unlike Benjamin because _ worked in a quiet area.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil was a very popular kid in school unlike Jeffrey, because _ was very extroverted.", + "gold_answer": "Neil", + "os_answer": "Neil", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I loved my old gifts but not the new dishes, because the _ were so beautiful.", + "gold_answer": "gifts", + "os_answer": "old", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty used glue to fix Megan's toy because _ was too young to use superglue.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason but not Craig asked the company if they were currently hiring because _ has a job.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The game on television was very important for Ian but not Dennis because _ was into music instead.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The virus stuck to the clothes better than it stuck to the walls, because the _ had less deterrents on them.", + "gold_answer": "clothes", + "os_answer": "clothes", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The virus stuck to the clothes better than it stuck to the walls, because the _ had more deterrents on them.", + "gold_answer": "walls", + "os_answer": "clothes", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At their high school's homecoming dance, Natalie stayed on the floor for the slow dance while Maria got food during it, because _ had broken up with her significant other.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "B. Maria", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At their high school's homecoming dance, Natalie stayed on the floor for the slow dance while Maria got food during it, because _ currently had a significant other.", + "gold_answer": "Natalie", + "os_answer": "Maria", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam always spent all of the free time watching Tv unlike Hunter who volunteered, due to _ being lazy.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "So _ ignored their ear because Jessica has a ear infection and Felicia was fine.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Samantha had to use the potty while Felicia used the restroom because _ is a grownup.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Correct", + "mcq_answer": "B. Felicia", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After walking barefooted, James washed his foot in the bowl of water and the _ got dirty.", + "gold_answer": "water", + "os_answer": "water", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Benjamin put the family into debt, Adam filed for divorce; then the judge gave _ a sympathetic look.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Benjamin put the family into debt, Adam filed for divorce; then the judge gave _ a withering look.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin read a book to Monica because _ was old enough to be able to read.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The box slid down James hand when he was wearing a glove, hence he removed it and lift it again. The _ is dry.", + "gold_answer": "hand", + "os_answer": "hand", + "os_eval": "Correct", + "mcq_answer": "B. hand", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The box slid down James hand when he was wearing a glove, hence he removed it and lift it again. The _ is slippery.", + "gold_answer": "glove", + "os_answer": "box", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The building's ancient foundation was re-enforced with a steel alloy during the remodel because the _ was strengthening.", + "gold_answer": "steel", + "os_answer": "structure", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When we go hiking I bring my backpack because it has built in water bottles and places for snacks. Today I forgot to fill the _ and was dehydrated.", + "gold_answer": "water bottles", + "os_answer": "bottles", + "os_eval": "Correct.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When we go hiking I bring my backpack because it has built in water bottles and places for snacks. Today I forgot to bring the _ and was starving.", + "gold_answer": "snacks", + "os_answer": "snacks", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She wanted to learn how to pair wine so she bought book instead of using a magazine because the _ was too broad.", + "gold_answer": "magazine", + "os_answer": "magazine", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya read the contract carefully before signing it but Patricia didn't. _ didn't get ripped off by the shady merchant.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The garbage can smells much worse than the recycling, so the _ is probably a lot more sterile.", + "gold_answer": "recycling", + "os_answer": "recycling", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My pain was not nearly as bad as Joe's burn because the _ Joe had was uncontrollable.", + "gold_answer": "burn", + "os_answer": "pain", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The hotel had a terrible gym but a nice restaurant; the _ was something management attended to.", + "gold_answer": "restaurant", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Refraining from drinking was easy for Kyle but not Eric, as _ never enjoyed the taste of alcohol.", + "gold_answer": "Kyle", + "os_answer": "Eric", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia ate all of the dessert while Sarah did not have any since _ was not trying to lose any weight.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary went to the office to receive a new card with her photo on it and discarded a sticker because the _ was temporary.", + "gold_answer": "sticker", + "os_answer": "sticker", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The new cream didn't remove the warts like the last lotion, because the _ was not powerful enough.", + "gold_answer": "cream", + "os_answer": "formula", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth is accused of destroying drywall in Jeffrey's house, _ is leasing out the house.", + "gold_answer": "Jeffrey", + "os_answer": "Jeffrey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth is accused of destroying drywall in Jeffrey's house, _ is renting the house.", + "gold_answer": "Kenneth", + "os_answer": "who", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Adam was cold and Michael was hot so _ removed a heavy jacket to withstand the freezing weather.", + "gold_answer": "Michael", + "os_answer": "Adam", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "After a short time we stopped pouring the tea glass in the pot because the _ was full.", + "gold_answer": "pot", + "os_answer": "pot", + "os_eval": "Correct", + "mcq_answer": "A. glass", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "After a short time we stopped pouring the tea glass in the pot because the _ was empty.", + "gold_answer": "glass", + "os_answer": "pot", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "When the dog behaves I like to give him a sausage otherwise I give him a ball. I gave him the _ since he was bad.", + "gold_answer": "ball", + "os_answer": "ball", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John decided to grow a new breed of plant in his garden but the _ is big.", + "gold_answer": "plant", + "os_answer": "risk", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin was sick of the pests like Amy always cutting out their internet, so _ decided to lay low.", + "gold_answer": "Amy", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "William wanted to go biking but Aaron wanted to stay home, so _ went out by themselves.", + "gold_answer": "William", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela loved to wear sun glasses but Jessica didn't. _ bought a fancy new pair of shoes.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica was caught napping in class more often than Katrina because _ stayed up all night.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The highlands were a lot colder than the beaches because the _ were lower down in elevation.", + "gold_answer": "beaches", + "os_answer": "beaches", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine had really good grammar but Cynthia didn't have good grammar because _ studied math in college.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica was given a sapphire ring by Christine for her birthday because _ really likes sapphires.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The waist of Joel measured more inches than that of Kevin because _ ate much less.", + "gold_answer": "Kevin", + "os_answer": "Kevin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The lips on Cynthia were much bigger than Monica because _ got hit with a softball in the mouth.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The lips on Cynthia were much smaller than Monica because _ got hit with a softball in the mouth.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary goes around telling everyone that Christine is too clingy because _ likes to be touched..", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The parakeet flew to Hunter but flew past Samuel because _ had some bird seed in their hand.", + "gold_answer": "Hunter", + "os_answer": "Hunter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John opened the window for air to come him when he was sweating in his bedroom. The _ is cold.", + "gold_answer": "air", + "os_answer": "air", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Even though Ian had less of a sweet tooth than Robert, _ liked chocolate more.", + "gold_answer": "Ian", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "James walked into a ditch while trying to catch the ball thrown at him. The _ is farther.", + "gold_answer": "ball", + "os_answer": "ditch", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Caroline works in the catering and food wholesale industries, but enjoys food preparation more, so she prefers her work in the _ industry.", + "gold_answer": "catering", + "os_answer": "catering", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Caroline works in the catering and food wholesale industries, but enjoys food distribution more, so she prefers her work in the _ industry.", + "gold_answer": "food wholesale", + "os_answer": "distribution", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria never received flowers from the customers unlike Monica, by virtue of _ being polite.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hugh scrubbed the mold in his apartment with a cleaner but had to call a pro because the _ was too weak.", + "gold_answer": "cleaner", + "os_answer": "cleaner", + "os_eval": "Correct", + "mcq_answer": "B. cleaner", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christopher tried to empty all the water from the tank in the yard because Michael had asked him to, but _ wasn't able to get it all out.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The watch could not fit on the arm properly because it had been cut by a blade. The _ was short.", + "gold_answer": "Watch", + "os_answer": "band", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "A very active Randy injured their elbow playing basketball against Lawrence, so _ said sorry.", + "gold_answer": "Lawrence", + "os_answer": "Lawrence", + "os_eval": "Correct", + "mcq_answer": "B. Lawrence", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John sold the three chairs and used the money to buy twelve shoes. The _ were cheaper.", + "gold_answer": "shoes", + "os_answer": "shoes", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John sold the three chairs and used the money to buy twelve shoes. The _ were more expensive.", + "gold_answer": "chairs", + "os_answer": "shoes", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The barista loved to make all types of coffee including iced and hot. The _ coffee was popular in the cooler weathers.", + "gold_answer": "hot", + "os_answer": "hot", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The barista loved to make all types of coffee including iced and hot. The _ coffee was popular in the hotter weathers.", + "gold_answer": "iced", + "os_answer": "iced", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The apartment that Samantha lived in was a lot smaller than Megan, because _ had a little salary.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The girl put her money in the bag instead of her pocket although the bully would look in the _ .", + "gold_answer": "bag", + "os_answer": "pocket", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The girl put her money in her bag instead of her pocket because the bully looked in the _ .", + "gold_answer": "pocket", + "os_answer": "pocket", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "So _ ignores Google to search for information because Betty trusts in it and Cynthia doesn't.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Irena didn't like other people living in something before her so she felt more comfortable buying the house instead of the mansion as the _ was old.", + "gold_answer": "mansion", + "os_answer": "mansion", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kevin was not able to run fast compared to William because _ had no broken bones in his body.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I did not see the sign on the billboard on the highway because the _ was too huge.", + "gold_answer": "billboard", + "os_answer": "billboard", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I did not see the sign on the billboard on the highway because the _ was too tiny.", + "gold_answer": "sign", + "os_answer": "text", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After Logan pitched a ball that got clobbered for a home run by Justin in a baseball game, _ felt exultant.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela thought that Elena talked too slowly, and _ had a hard time being understood when they spoke.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel complained to Ian about the condition of the house. _ preferred a messy space.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At Jan's home, she dusted the dresser more frequently than the fan, because the _ was easier to reach.", + "gold_answer": "dresser", + "os_answer": "dresser", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At Jan's home, she dusted the dresser more frequently than the fan, because the _ was more difficult to reach.", + "gold_answer": "fan", + "os_answer": "fan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor suggested alternating between ice and a heating pad when I strained a muscle, but he warned me to not let the _ get too warm.", + "gold_answer": "pad", + "os_answer": "pad", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor suggested alternating between ice and a heating pad when I strained a muscle, but he warned me to not let the _ get too cold.", + "gold_answer": "ice", + "os_answer": "ice", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When other people were smoking, Kayla was more disgusted than Erin because _ had always avoided smoke.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin has a spouse and Kyle is single after being divorced, so _ is celebrating their independence this year.", + "gold_answer": "Kyle", + "os_answer": "Kyle", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christopher taught Hunter to play go fish so that _ had someone to play with.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie was helping Patricia diet and exercise at the gym to lose weight because _ used to be overweight.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I had to rake more leaves at the house than at the office because there were more trees at the _ .", + "gold_answer": "house", + "os_answer": "house", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The quality of music produced largely depends on the instrument used. The _ is vital.", + "gold_answer": "Instrument", + "os_answer": "instrument", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael made pickled eggs for Kenneth, but _ really loved his own and wanted to share them.", + "gold_answer": "Kenneth", + "os_answer": "Michael", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Henry wanted to stop yelling and start using a more effective type of communication because the _ was nice.", + "gold_answer": "communication", + "os_answer": "outcome", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tommy was able to carry the tripod himself, but his friend had to help him carry the camera because the _ was heavier.", + "gold_answer": "camera", + "os_answer": "camera", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tommy was able to carry the tripod himself, but his friend had to help him carry the camera because the _ was lighter.", + "gold_answer": "tripod", + "os_answer": "tripod", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dog ran into the bedroom during the rainstorm while we stayed in the kitchen because the rain was louder in the _ .", + "gold_answer": "kitchen", + "os_answer": "bedroom", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dog ran into the bedroom during the rainstorm while we stayed in the kitchen because the rain was softer in the _ .", + "gold_answer": "bedroom", + "os_answer": "kitchen", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Maria gave Samantha the blue floral pants, because _ didn't fit into them very well.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey was considered more masculine than Amy because every year _ went into the woods to French kiss deer.", + "gold_answer": "Amy", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A.", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "He was late for the party but on time for the sleepover because the _ had just finished.", + "gold_answer": "party", + "os_answer": "party", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia had to pee after one large coffee but Betty did not as _ had a very big bladder.", + "gold_answer": "Betty", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia had to pee after one large coffee but Betty did not as _ had a very small bladder.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The remote control worked better than the toy car because the batteries in the _ were fresher.", + "gold_answer": "remote control", + "os_answer": "remote", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily bought a piece of jewelry from Natalie, later _ thought she sold too low but kept a cool attitude.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Robert was simply not as stoic as Joel , as _ tended to handle things gracefully.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron drank plenty of water before the hike, but Christopher forgot to, so _ ended up staying hydrated.", + "gold_answer": "Aaron", + "os_answer": "Aaron", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron drank plenty of water before the hike, but Christopher forgot to, so _ ended up getting dehydrated.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The TV that Samantha bought costs more than that of Carrie, because _ was poor.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The TV that Samantha bought costs more than that of Carrie, because _ was rich.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie had an easier time crawling through the narrow tunnel than Patricia because _ was larger.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia gave a rabbit as a companion to Carrie because _ thought they were lonely.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia gave a rabbit as a companion to Carrie because _ explained they were lonely.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Smoke still rose from the house but had subsided at the barn. The fire was doused at the _ .", + "gold_answer": "barn", + "os_answer": "barn", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Although William liked animals less overall than Justin, _ couldn't stand to be around hamsters.", + "gold_answer": "Justin", + "os_answer": "William", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina drove Emily to the prison, so that _ could say goodbye to them before they went to jail.", + "gold_answer": "Katrina", + "os_answer": "Emily", + "os_eval": "Incorrect", + "mcq_answer": "B. Emily", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Ian was tired of trying new diets while Steven had luck with one, so _ decided to do their own thing.", + "gold_answer": "Ian", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian was tired of trying new diets while Steven had luck with one, so _ stuck to their routine.", + "gold_answer": "Steven", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Katrina wanted to build a new picture frame for Samantha's portrait because _ was an inexperienced woodworker.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Nick struggled with unresolved trauma that Ian couldn't understand, since _ had frequently experienced childhood abuse.", + "gold_answer": "Ian", + "os_answer": "Nick", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Nick struggled with unresolved trauma that Ian couldn't understand, since _ had never experienced childhood abuse.", + "gold_answer": "Nick", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Victoria decided to adopt a Yorkie, but Elena wouldn't even consider it, because _ loved small dogs.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie kept written records of their expenses but not Laura because _ had a faulty memory.", + "gold_answer": "Carrie", + "os_answer": "Laura", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Carrie kept written records of their expenses but not Laura because _ had a sharp memory.", + "gold_answer": "Laura", + "os_answer": "Laura", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My employer offers a bonus of either a phone or a television, but unfortunately the _ is just way too large to be useful.", + "gold_answer": "phone", + "os_answer": "television", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "My employer offers a bonus of either a phone or a television, but unfortunately the _ is just way too small to be useful.", + "gold_answer": "television", + "os_answer": "phone", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The stain in the bucket could not be cleaned with the brush because the _ is soft.", + "gold_answer": "brush", + "os_answer": "bristles", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stain in the bucket could not be cleaned with the brush because the _ is tough.", + "gold_answer": "stain", + "os_answer": "grime", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha was not interested in hearing about Tanya awesome marriage, because _ was happy all the time.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha wanted to reduce smoking by relying on a new nicotine patch and therapy video, but the _ was boring.", + "gold_answer": "video", + "os_answer": "video", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha wanted to reduce smoking by relying on a new nicotine patch and therapy video, but the _ was addictive.", + "gold_answer": "patch", + "os_answer": "patch", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had a slower running phone than Logan because _ had more apps running on theirs.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had a faster running phone than Logan because _ had more apps running on theirs.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The roof would have to be repaired using tarps or shingles before the storm comes. The _ are a temporary fix, though.", + "gold_answer": "tarps", + "os_answer": "tarps", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty had more burns on their hands than Amy because _ worked as a welder.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary wanted to surprise Cynthia with a puppy for Christmas, so _ asked about allergies to dogs.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Keeping the doors closed and the windows opened kept the apartment cool , because the _ let out the heat.", + "gold_answer": "windows", + "os_answer": "windows", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Keeping the doors closed and the windows opened kept the apartment cool , because the _ kept out the heat.", + "gold_answer": "doors", + "os_answer": "doors", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The student tried to write down the notes on the papers but the _ were too long.", + "gold_answer": "notes", + "os_answer": "notes", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samuel had a shorter expected lifespan than Kenneth, so _ procrastinated in following all their dreams.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The personal trainer gave Laura but not Victoria the more difficult exercise because _ was in shape.", + "gold_answer": "Laura", + "os_answer": "Laura", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The personal trainer gave Laura but not Victoria the more difficult exercise because _ was out of shape.", + "gold_answer": "Victoria", + "os_answer": "Victoria", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "When the car was brought up into the shop, the brake was replaced when the wheel wasn't, since the _ was fixed.", + "gold_answer": "wheel", + "os_answer": "caliper", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "At the dance, Adam asked the girl to dance before Donald, so _ is angry with himself.", + "gold_answer": "Donald", + "os_answer": "Donald", + "os_eval": "Correct", + "mcq_answer": "B. Donald", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "If I want to build a swing should I build it out of wood or use a tire? It seems like the _ would get dirty and gross inside.", + "gold_answer": "tire", + "os_answer": "tire", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "If I want to build a swing should I build it out of wood or use a tire? It seems like the _ would get rotten eventually.", + "gold_answer": "wood", + "os_answer": "wood", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The beef tasted better than the pork did although the _ had been slightly undercooked.", + "gold_answer": "beef", + "os_answer": "pork", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The chef added butter to the pan on the stove and it began to melt right away because the _ was hot.", + "gold_answer": "pan", + "os_answer": "pan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The chef added butter to the pan on the stove and it began to melt right away because the _ was soft.", + "gold_answer": "butter", + "os_answer": "butter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie had a pig while Jennifer had a cow so _ thought mines smaller so its better.", + "gold_answer": "Natalie", + "os_answer": "she", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sink in the bathroom looked good but the toilet was leaking so James kept the _ .", + "gold_answer": "sink", + "os_answer": "plumber", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rebecca slept in the hammock in the backyard while Tanya gardened because _ was tired.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The bagel shop was closer to Michael than Joel because _ lived in a different area of town.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel but not Christine was tracked down by police because _ made it to the hideout.", + "gold_answer": "Christine", + "os_answer": "Rachel", + "os_eval": "Incorrect. The student's answer conflicts with the true answer provided.", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Rachel but not Christine was tracked down by police because _ did not make it to the hideout.", + "gold_answer": "Rachel", + "os_answer": "Christine", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin had less piercings than Jeffrey did so it was harder for _ to get a job.", + "gold_answer": "Jeffrey", + "os_answer": "Jeffrey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel wanted children, but Megan had no interest, so _ looked for someone else to have babies with.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel wanted children, but Megan had no interest, so _ looked for someone else to have freedom with.", + "gold_answer": "Megan", + "os_answer": "Rachel", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe drank his milk and tried to dunk his cookie in the glass but the _ was too small.", + "gold_answer": "glass", + "os_answer": "glass", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe drank his milk and tried to dunk his cookie in the glass but the _ was too big.", + "gold_answer": "cookie", + "os_answer": "cookie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Anxiety is a feeling Rebecca gets when she has face Erin who is a probation officer, _ does not a fear of authority.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam cried when Donald had a stubbed toe since _ had a look of pain on his face.", + "gold_answer": "Donald", + "os_answer": "Donald", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The bank permitted Michael to open a checking account, but not Matthew, because _ was employed.", + "gold_answer": "Michael", + "os_answer": "Michael", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The bank permitted Michael to open a checking account, but not Matthew, because _ was unemployed.", + "gold_answer": "Matthew", + "os_answer": "Matthew", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The children were not vaccinated, which was fine with Betty but annoyed Mary. _ knew they didn't make kids autistic.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The children were not vaccinated, which was fine with Betty but annoyed Mary. _ believed they made kids autistic.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Firing a shotgun came more naturally for Megan than Tanya because _ grew up around them.", + "gold_answer": "Megan", + "os_answer": "Megan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "So _ ignored drinking milk from the bottle because Rachel was thirsty and Erin already drank some water.", + "gold_answer": "Erin", + "os_answer": "Rachel", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "So _ drank milk from the bottle because Rachel was thirsty and Erin already drank some water.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donna needed dentures or implants for her bad teeth. She chose the _ because they are cheaper.", + "gold_answer": "dentures", + "os_answer": "dentures", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donna needed dentures or implants for her bad teeth. She chose the _ because they are permanent.", + "gold_answer": "implants", + "os_answer": "implants", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We were going fishing out on the dock later in the day after we couldn't all fit in the boat, because the _ was confined.", + "gold_answer": "boat", + "os_answer": "space", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie tended to wear their hair in a ponytail, while Maria wasn't able to, because _ had long hair.", + "gold_answer": "Natalie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The pine trees were still green in December, but the oak trees were not, because the _ keep their leaves in fall.", + "gold_answer": "pine trees", + "os_answer": "pines", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The pine trees were still green in December, but the oak trees were not, because the _ lose their leaves in fall.", + "gold_answer": "oak trees", + "os_answer": "oak", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Fiction books were interesting and easy to read for Logan but not Brett because _ enjoyed real tales.", + "gold_answer": "Brett", + "os_answer": "Brett", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel had many extra possesions while Neil didn't, so _ had to rent a storage shed.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel had many extra possesions while Neil didn't, so _ didn't have to rent a storage shed.", + "gold_answer": "Neil", + "os_answer": "Neil", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey thought Craig probably had gum and asked for a piece, because _ had fresh breath.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey thought Craig probably had gum and asked for a piece, because _ had bad breath.", + "gold_answer": "Jeffrey", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin was able to use their device for longer than Steven because _ remembered to bring their charger.", + "gold_answer": "Benjamin", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura was thrilled to get their lip pierced but Rachel was pretty scared. _ had theirs done and cried.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wound responded quickly to the rubbing alcohol, but slowly to the ointment because the _ is more efficient.", + "gold_answer": "rubbing alcohol", + "os_answer": "alcohol", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He tried to use the rag to clean the bacteria off the table but the _ was too large.", + "gold_answer": "table", + "os_answer": "rag", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She decided to report the accident and the burglary, but the _ required much more investigation.", + "gold_answer": "burglary", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She decided to report the accident and the burglary, but the _ required much less investigation.", + "gold_answer": "accident", + "os_answer": "burglary", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Brian informed Aaron that their coach had scheduled an extra event on Saturday morning since _ was present at yesterday's practice.", + "gold_answer": "Brian", + "os_answer": "neither", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "For work I can either get there by car or bicycle. I'm going to take the _ today because the weather is supposed to be rainy.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "No one would have noticed the spot on that skin because the _ is small.", + "gold_answer": "spot", + "os_answer": "blemish", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Because William developed a sore knee during his race against against Kyle, _ won the race.", + "gold_answer": "Kyle", + "os_answer": "Kyle", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I couldn't figure out what my costume would be for Halloween Peter Pan or Snow White. The _ costume I'd have to wear a dress.", + "gold_answer": "Snow White", + "os_answer": "Snow White", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I couldn't figure out what my costume would be for Halloween Peter Pan or Snow White. The _ costume I'd have to make myself a boy.", + "gold_answer": "Peter Pan", + "os_answer": "Peter Pan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James passport was kept inside the purse. He never knew the _ is that small.", + "gold_answer": "passport", + "os_answer": "purse", + "os_eval": "Incorrect", + "mcq_answer": "B.", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "James passport was kept inside the purse. He never knew the _ is that big.", + "gold_answer": "purse", + "os_answer": "purse", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Of the two owners, Jessica was far worse than Jennifer, because _ like to treat the dogs.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Of the two owners, Jessica was far worse than Jennifer, because _ like to beat the dogs.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The handle of the spoon was submerged in the cup of tea because the _ is short.", + "gold_answer": "spoon", + "os_answer": "spoon", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tom recently was approved for botox therapy. He had a choice between near the office or near his house and went with his weekday convenience of the _ .", + "gold_answer": "office", + "os_answer": "office", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The water in the car was cooler than the water in the truck because the engine in the _ had run more recently.", + "gold_answer": "truck", + "os_answer": "truck", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The water in the car was hotter than the water in the truck because the engine in the _ had run more recently.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The color of the paint was quite pleasing to Jessica however Natalie believed it to be too bright. _ painted their room with a subdued color paint.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B. Natalie", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Research came easy to Monica as compared to Erin because _ 's father was a landscaper.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Because of his rash, he opted not to wash with soap but with oil, as the _ would soothe it.", + "gold_answer": "oil", + "os_answer": "oil", + "os_eval": "Correct", + "mcq_answer": "B.", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James took out a seat from his office to create more space. The _ is too big.", + "gold_answer": "seat", + "os_answer": "seat", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "His addiction was getting bad so they handed him over to therapy and stopped taking medicine since the _ was cheaper.", + "gold_answer": "therapy", + "os_answer": "therapy", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easier for the diner to follow their budget than the food truck because the _ had more money to spend.", + "gold_answer": "diner", + "os_answer": "diner", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easier for the diner to follow their budget than the food truck because the _ had less money to spend.", + "gold_answer": "food truck", + "os_answer": "diner", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Donald stuck his nose up and scoffed at William's ragged outfit, because _ looked like the working class.", + "gold_answer": "William", + "os_answer": "it", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We didn't get the biscuits this morning before school, so I ordered an omelet instead of a hash brown as the _ would make me hungry.", + "gold_answer": "hash brown", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We didn't get the biscuits this morning before school, so I ordered an omelet instead of a hash brown as the _ would make me full.", + "gold_answer": "omelet", + "os_answer": "omelet", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett threw away all the soda and junk food to reduce Leslie's dependence on unhealthy foods because _ cares for his health.", + "gold_answer": "Brett", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Gem needed both therapy and medicines to cope with her broken leg. She preferred the _ because it was painless.", + "gold_answer": "medicine", + "os_answer": "medicines", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil told Lawrence that he was training to be a race car driver. _ was excited.", + "gold_answer": "Neil", + "os_answer": "Lawrence", + "os_eval": "Incorrect", + "mcq_answer": "B. Lawrence", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Neil told Lawrence that he was training to be a race car driver. _ was worried about him.", + "gold_answer": "Lawrence", + "os_answer": "Lawrence", + "os_eval": "Correct", + "mcq_answer": "B. Lawrence", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "the water poured freely into the hole until it disappeared , the _ was little.", + "gold_answer": "water", + "os_answer": "depth", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "the water poured freely into the hole until it disappeared , the _ was deep.", + "gold_answer": "hole", + "os_answer": "hole", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena was an excellent flight attendant when Sarah boarded the plane with a fear of flying because, _ was able to overcome their fears.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She wanted to sew a shirt from silk she bought and a jacket in denim from old jeans so the _ was recycled.", + "gold_answer": "denim", + "os_answer": "denim", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty reluctantly confided in Rebecca that she was suffering from memory loss. _ was distraught.", + "gold_answer": "Betty", + "os_answer": "Rebecca", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Carla start doing sit-ups and pushups for her weak spots. The _ are for her abs.", + "gold_answer": "sit-ups", + "os_answer": "sit-ups", + "os_eval": "Correct", + "mcq_answer": "A.", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carla start doing sit-ups and pushups for her weak spots. The _ are for her chest.", + "gold_answer": "pushups", + "os_answer": "pushups", + "os_eval": "Correct", + "mcq_answer": "B. pushups", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christopher was getting ready to wash Joel's hair,so _ got out shampoo by the sink and sat in the chair.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis invited Joseph on a trip to the hatchery tomorrow morning because _ was also interested in fish.", + "gold_answer": "Joseph", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man finally decided to become a guardian for the child at the orphanage because the _ was loving.", + "gold_answer": "guardian", + "os_answer": "child", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela's room was a lot lighter than Rebecca's room, because the light of _ went out.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca's", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan wrote on the paper with a pencil unlike Jennifer who wrote with a pen, because _ wanted to erase it later.", + "gold_answer": "Megan", + "os_answer": "Megan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan wrote on the paper with a pencil unlike Jennifer who wrote with a pen, because _ wanted to keep it for later.", + "gold_answer": "Jennifer", + "os_answer": "Jennifer", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Laura asked Rachel if she could borrow some clothes because _ loved her fashion sense.", + "gold_answer": "Laura", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When you buy food for your cat, choose dry instead of wet as the crunchy texture of the _ is better for their teeth.", + "gold_answer": "dry", + "os_answer": "kibble", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easier to get the soil loosened up with the pick than with the shovel, because the _ was solid.", + "gold_answer": "pick", + "os_answer": "ground", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin knew the perfect gift for the wedding shower, but Samantha had to do some research, because _ was slightly acquainted with the bride.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The gothic lolita style suited Victoria better than Sarah because _ looked the worst in frilly dresses.", + "gold_answer": "Sarah", + "os_answer": "Sarah", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha couldn't see any alternatives, but Emily could, because _ wasn't nearly as open minded.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joseph wanted to sell lemonade at a stand in the summer months instead of the spring months since people in the _ would be thirstier.", + "gold_answer": "summer", + "os_answer": "summer", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After a boring meeting, Monica closed her eyes and dozed while Carrie took a walk, as _ had gone to bed late the night before.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After a boring meeting, Monica closed her eyes and dozed while Carrie took a walk, as _ had gone to bed early the night before.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B. Carrie", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My mom didn't fit the shape into the painting, because the _ was too awkward.", + "gold_answer": "shape", + "os_answer": "angle", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My mom didn't fit the shape into the painting, because the _ was too complete.", + "gold_answer": "painting", + "os_answer": "picture", + "os_eval": "Incorrect", + "mcq_answer": "B. painting", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My mom always had training at the house, but not today because the _ was unavailable.", + "gold_answer": "house", + "os_answer": "instructor", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Erin frequently suffered from hair loss while Samantha had healthy hair, as _ was never stressed out.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "B. Samantha", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason was at practice all the time to try and get better than Christopher. _ needed more practice.", + "gold_answer": "Jason", + "os_answer": "Christopher", + "os_eval": "Incorrect", + "mcq_answer": "B. Christopher", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The team won a trophy instead of a plaque as a result of hard times as the _ was cheap to make.", + "gold_answer": "trophy", + "os_answer": "trophy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The creatures attacked Derrick while ignoring Ryan, because _ remembered to put on the repellent.", + "gold_answer": "Ryan", + "os_answer": "Ryan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan liked to read a book good more than Samantha because _ liked the peace and quiet.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan liked to read a book good more than Samantha because _ hated the peace and quiet.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Late at night, Rebecca was more tired than Jessica so _ was unable to go right to sleep.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Late at night, Rebecca was more tired than Jessica so _ was able to go right to sleep.", + "gold_answer": "Rebecca", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman pierced the customer's tongue with a needle before piercing his nose because the _ was numb.", + "gold_answer": "tongue", + "os_answer": "tongue", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The woman pierced the customer's tongue with a needle before piercing his nose because the _ was still sensitive.", + "gold_answer": "nose", + "os_answer": "tongue", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Starting the engine of the car took less time unlike the truck since the _ 's engine was working at the time.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil used a chainsaw to cut down the tree instead of a regular saw like William, because _ believed in modern equipment.", + "gold_answer": "Neil", + "os_answer": "Neil", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The shirts were straighter than the pants because the _ were hanging on the hanger.", + "gold_answer": "shirt", + "os_answer": "shirts", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The shirts were straighter than the pants although the _ were hanging on the hanger.", + "gold_answer": "pants", + "os_answer": "pants", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man thought lifting the rock, not the log, would give him a hernia because the _ was lighter.", + "gold_answer": "log", + "os_answer": "log", + "os_eval": "Correct", + "mcq_answer": "B. log", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria was able to keep their weight off long term, unlike Felicia, because _ followed a healthy diet.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Maria was able to keep their weight off long term, unlike Felicia, because _ followed a crash diet.", + "gold_answer": "Maria", + "os_answer": "Felicia", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The dog was more suspicious of the locker than of the package because the drugs were in the _ .", + "gold_answer": "locker", + "os_answer": "locker", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin usually paid for the gas when Craig always said he was broke. _ was generous.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin loved people and wanted to help them while Katrina loved to help animals. _ volunteered at the local shelter.", + "gold_answer": "Katrina", + "os_answer": "Katrina", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis did not enjoy their afternoon but Hunter did because _ left work after the sunset.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Dennis did not enjoy their afternoon but Hunter did because _ left work after the sunrise.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We were making orange jack o lanterns and bought candles to put in the oranges, the candles did not fit. The _ were too big.", + "gold_answer": "candles", + "os_answer": "candles", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We were making orange jack o lanterns and bought candles to put in the oranges, the candles did not fit. The _ were too small.", + "gold_answer": "oranges", + "os_answer": "oranges", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie committed a bunch of good deeds in Samantha's name, because _ wanted all the credit.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Natalie committed a bunch of good deeds in Samantha's name, because _ didn't want the credit.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "She wanted to shop for more clothes and ultimately decided on the velvet dress instead of the denim jacket because the _ was more casual.", + "gold_answer": "jacket", + "os_answer": "jacket", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil put the finishing touches on the android as he sold it off to Brian because _ was an engineer.", + "gold_answer": "Neil", + "os_answer": "Brian", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Laura didn't buy anything at all for Betty's birthday, because _ forgot to mention it.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel plans to go to Latin America next year where Dennis is currently living, _ has never been to Latin America.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Beautiful to Angela means something physical, while it's mental to Emily, so _ is deeper.", + "gold_answer": "Emily", + "os_answer": "Emily", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Beautiful to Angela means something physical, while it's mental to Emily, so _ is shallower.", + "gold_answer": "Angela", + "os_answer": "Angela", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason really wanted to get the job, but he felt like he flunked the interview. The manager called and said he could try the _ again next week.", + "gold_answer": "interview", + "os_answer": "interview", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I was wearing wool socks when I went to try on my new boots but I couldn't get them on because the _ were too small.", + "gold_answer": "boots", + "os_answer": "boots", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I was wearing wool socks when I went to try on my new boots but I couldn't get them on because the _ were too large.", + "gold_answer": "socks", + "os_answer": "socks", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The library always had more books than computers, most likely because the _ are smaller.", + "gold_answer": "books", + "os_answer": "books", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The library always had more books than computers, most likely because the _ are bigger.", + "gold_answer": "computers", + "os_answer": "books", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The hair stylist gave Laura hair extensions and not Katrina because _ had very short hair.", + "gold_answer": "Laura", + "os_answer": "Laura", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Monica did not need a recipe in order to mix a cake but Angela did because _ was an instinctive baker.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had cereal for breakfast while Dennis had a shake, so _ finished drinking their breakfast.", + "gold_answer": "Dennis", + "os_answer": "Dennis", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had cereal for breakfast while Dennis had a shake, so _ finished eating their breakfast.", + "gold_answer": "Craig", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan ended up calling the police over an incident involving Jason because _ was scratched by them.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carl needed a new top after ripping his epaulette shirt. He wanted a flannel shirt because the _ is old.", + "gold_answer": "epaulette shirt", + "os_answer": "old", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Garrett was always feeling fatigued because of the energy his job demands. The _ of the job is too much.", + "gold_answer": "demand", + "os_answer": "strain", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ben had to respect his toys and his books to ensure they last long. However, it was difficult to respect the _ because they were fun.", + "gold_answer": "toys", + "os_answer": "toys", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He made a few dishes to serve. One was a salad and the other was a steak. The _ was healthy.", + "gold_answer": "salad", + "os_answer": "salad", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Although Angela was overall a nicer person than Natalie, _ often did practice humility very regularlly.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia has a pond in their backyard, but Carrie cannot afford one, which means _ lives in the richer neighborhood.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil's cat was terrified of thunderstorms but Kyle's wasn't bothered by them. _ found their cat hiding under the bed after the loud crackle of thunder.", + "gold_answer": "Neil", + "os_answer": "Neil", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jay could comfort sad people better instead of happy people because the _ people weren't realistic.", + "gold_answer": "happy", + "os_answer": "happy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Eric often thought of his annoying habits, like hitting his pen on his desk, and asked Ryan if it bothered him; _ said he was sorry he had done it.", + "gold_answer": "Eric", + "os_answer": "Eric", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya wanted poppies for her wedding flowers but Carrie said that was an odd choice. _ pointed out it was a wedding and tradition mattered.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin shaved his beard, but Nick had just grown one, so _ gave them all his old oils.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "A. Benjamin", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I got more use in the gym than at the playground because the _ had more things to do.", + "gold_answer": "gym", + "os_answer": "gym", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica can speak English and German but Samantha can only speak English because _ is trilingual.", + "gold_answer": "Samantha", + "os_answer": "Monica", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "All of the bands were not able to march on the fields at the same time because the _ were massive.", + "gold_answer": "bands", + "os_answer": "crowds", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Marty needed some sport and dress shoes, but could only buy one pair. He went with the _ since he would be going to a wedding.", + "gold_answer": "dress", + "os_answer": "dress", + "os_eval": "Correct", + "mcq_answer": "A.", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I like to drink mineral water over tap water when I travel outside of the USA because the _ water in other countries is safe.", + "gold_answer": "mineral", + "os_answer": "bottled", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Pine trees were a big part of Erin s Christmas tree farm while Megan was jewish but helped _ celebrate anyhow.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Eating spicy foods better suited Robert and not Adam because _ never got acid reflux from salsa.", + "gold_answer": "Robert", + "os_answer": "Robert", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel hated their new in-laws, but tried to keep it secret from Monica. Eventually _ told them.", + "gold_answer": "Rachel", + "os_answer": "Monica", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha was pretty good at math while Natalie was better at English. _ enrolled in a storytelling class this semester.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth had worse skin than Craig so _ had to use more of the moisturizer.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth had better skin than Craig so _ had to use more of the moisturizer.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cat Natalie owned would snuggle up on Jessica's lap because _ was nice to it all the time.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian always tried to find ways to be productive at work unlike Kenneth, because _ was a hard worker.", + "gold_answer": "Brian", + "os_answer": "Brian", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya loved pepperoni on their pizza and Katrina loved sausage, so when it had just sausage _ was not very happy.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya loved pepperoni on their pizza and Katrina loved sausage, so when it had just pepperoni _ was not very happy.", + "gold_answer": "Katrina", + "os_answer": "Katrina", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jen planned a retreat to a mountain or the park. She chose the _ because it was warmer.", + "gold_answer": "park", + "os_answer": "park", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin bought a new RV but Lawrence liked his old one, so _ decided to buy it.", + "gold_answer": "Lawrence", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin bought a new RV but Lawrence liked his old one, so _ decided to sell it.", + "gold_answer": "Justin", + "os_answer": "Lawrence", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Tanya was unrecognizable after Sarah was done beating them, so _ ended up going to jail.", + "gold_answer": "Sarah", + "os_answer": "Sarah", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Frank wanted to put the burger on the barbecue, but the _ wasn't formed yet.", + "gold_answer": "burger", + "os_answer": "charcoal", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "All the glaciers that fell from the top of the mountains were found at the bottom. The _ were large.", + "gold_answer": "Glaciers", + "os_answer": "glaciers", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The student liked writing their signature with a pen instead of a pencil, because the _ showed up lighter.", + "gold_answer": "pencil", + "os_answer": "pencil", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The student liked writing their signature with a pen instead of a pencil, because the _ showed up darker.", + "gold_answer": "pen", + "os_answer": "ink", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick showed Jason how to cut the tiles for their kitchen, and _ was shown appreciation for their help.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "So _ avoids eating carrots for their eye health because Emily needs good eyesight while Monica doesn't.", + "gold_answer": "Monica", + "os_answer": "Emily", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The medical waste was moved from the bag to the bucket, so the _ soon became sterilized.", + "gold_answer": "bag", + "os_answer": "bucket", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Sarah but not Erin would get a retirement pension because _ had a 30 year work career.", + "gold_answer": "Sarah", + "os_answer": "Sarah", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick had been working on his script for years and refused to get any other job, much to Logan's dismay. _ was worried and upset.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Connie likes to cook at home and decided to forgo a roast in favor of tofu because the _ is useless for a vegetarian meal.", + "gold_answer": "roast", + "os_answer": "meat", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He has a much harder time with this fever compared to the flu, because the _ took one week to get over.", + "gold_answer": "fever", + "os_answer": "flu", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I couldn't decide if I should pressure cook or smoke the pig feet. After looking outside, I decided the weather was poor enough to _ them.", + "gold_answer": "pressure cook", + "os_answer": "smoke", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I couldn't decide if I should pressure cook or smoke the pig feet. After looking outside, I decided the weather was good enough to _ them.", + "gold_answer": "smoke", + "os_answer": "smoke", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The computer ran faster than the tablet because the files on the _ were larger.", + "gold_answer": "tablet", + "os_answer": "tablet", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Gem had a husky breed named Ben. Ben liked both bones and toys. However, he liked the _ the best because it was inedible.", + "gold_answer": "toys", + "os_answer": "toys", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian agreed to buy soap for Kenneth while at the store, and _ paid them back the following day for the errand.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The company wanted to increase labor productivity with its new machinery and camera, but the _ had faulty screws.", + "gold_answer": "machinery", + "os_answer": "machinery", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter prepared the documents and data tables for Matthew's scientific research because _ is his assistant.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samuel was blown away to find out from Lawrence that goldfish are a type of carp, so _ decided to fact check his friend.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The professor's eyes could not see clearly because of the sunglasses he had. The _ were poor.", + "gold_answer": "Sunglasses", + "os_answer": "sunglasses", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "For her birthday gifts, Sarah was upset with the pearls, but felt the opposite about the rings she received. The _ were fancier.", + "gold_answer": "rings", + "os_answer": "rings", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jody wanted new mascara and eyeliner, either black or brown, but the _ was too light.", + "gold_answer": "brown", + "os_answer": "brown", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jody wanted new mascara and eyeliner, either black or brown, but the _ was too heavy.", + "gold_answer": "black", + "os_answer": "mascara", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron wanted to go the gym but the others wanted to go to the park because the _ did require membership.", + "gold_answer": "gym", + "os_answer": "gym", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor couldn't treat the arm infection, but was able to handle the ear ache. The _ was more petty.", + "gold_answer": "ear ache", + "os_answer": "arm", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael had a cat as a pet but Nelson didn't have any pets because _ had little allergies in their system.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Maria mimicked everything that Christine did at work because _ was like a fan to her.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle paid Craig to board the family dog at the kennel for a week, because _ was going on vacation.", + "gold_answer": "Kyle", + "os_answer": "Kyle", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria told Monica they looked too sick to go to work and asked if they had a fever. _ went to the Doctor.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stove was left on after Matthew used it, so Nelson turned it off. _ was careful.", + "gold_answer": "Nelson", + "os_answer": "Nelson", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica found the heavy load at work overwhelming but not Katrina because _ did a poor job at planning their work.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The brutal boxing match was suitable for Christopher but not Samuel because _ did damage to his opponent.", + "gold_answer": "Christopher", + "os_answer": "Christopher", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The brutal boxing match was suitable for Christopher but not Samuel because _ did not damage his opponent.", + "gold_answer": "Samuel", + "os_answer": "Christopher", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Going on a diet was easier for Benjamin but not Donald because _ did not know about any different programs.", + "gold_answer": "Donald", + "os_answer": "Donald", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer got about with a seeing-eye dog but Mary did not because _ was blind.", + "gold_answer": "Jennifer", + "os_answer": "Mary", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer got about with a seeing-eye dog but Mary did not because _ was sighted.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dog loved Kevin but hated Derrick, so _ started bringing the dog treats to change its mind.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dog hated Kevin but loved Derrick, so _ started bringing the dog treats to change its mind.", + "gold_answer": "Kevin", + "os_answer": "Kevin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The kitty ran away from Kayla and not Felicia because the kitty had known _ for many years.", + "gold_answer": "Felicia", + "os_answer": "Kayla", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "During the summer, I like visiting the zoo more than the aquarium because the _ is inside.", + "gold_answer": "aquarium", + "os_answer": "aquarium", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The market was going out of business so they sold their products but not the lots as the _ were useful.", + "gold_answer": "lots", + "os_answer": "lots", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The market was going out of business so they sold their products but not the lots as the _ were useless.", + "gold_answer": "products", + "os_answer": "plots", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Patricia has a trouble with training her horse and wants Tanya's help, because _ wants her horse to behave.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samuel had to recently recover from a stroke unlike William because _ was living an unhealthy lifestyle.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Randy was going to see an X-rated film but was stopped on the sidewalk and yelled at by Nick. The anger showed on _ 's face.", + "gold_answer": "Nick", + "os_answer": "Nick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Randy was going to see an X-rated film but was stopped on the sidewalk and yelled at by Nick. The shame showed on _ 's face.", + "gold_answer": "Randy", + "os_answer": "Randy", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela noticed the lumps on Amy 's arms that she had failed to notice, _ is just oblivious that way.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel ran out of toilet paper, so he asked Dennis in the stall next to him for some. _ was relieved when he agreed.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kayla was the subject of a secret crush from Rebecca. _ was aware they were a secret admirer.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya was the most powerful person in the world, and Sarah admired them, because _ was something to aspire to.", + "gold_answer": "Tanya", + "os_answer": "power", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian was supposed to be babysitting for Dennis but didn\u2019t show up because _ was forgotten.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Donald was able to catch the Frisbee thrown by Eric, then _ was thrown the Frisbee back.", + "gold_answer": "Eric", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald was able to catch the Frisbee thrown by Eric, then _ threw the Frisbee back.", + "gold_answer": "Donald", + "os_answer": "he", + "os_eval": "Correct. The student's answer \"he\" correctly refers back to Donald, who is mentioned in the question. Both answers are factually correct and refer to the same individual performing the action.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I was driving my car and tried to get through the intersection, but the light turned red. The _ is too fast.", + "gold_answer": "light", + "os_answer": "light", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe brought his books to school in a suitcase instead of a backpack because the _ was bigger.", + "gold_answer": "suitcase", + "os_answer": "suitcase", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe brought his books to school in a suitcase instead of a backpack because the _ was smaller.", + "gold_answer": "backpack", + "os_answer": "backpack", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "During the earthquake, the boy hid under the desk instead of the table because the _ was sturdy.", + "gold_answer": "desk", + "os_answer": "desk", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "While playing soccer, Robert got kicked in the head and Joel laughed at him causing the coach to look at _ with pity.", + "gold_answer": "Robert", + "os_answer": "Joel", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald had to wax a lot more frequently than Ian because _ had blonde colored hair.", + "gold_answer": "Ian", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Joseph asked Robert to clean the floor with a mop nearby because _ needs to work.", + "gold_answer": "Robert", + "os_answer": "Joseph", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Christine took all the money while Mary told her to save the money for herself. _ only knows to take.", + "gold_answer": "Christine", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig grew frustrated trying to coach Nick in soccer, as _ lacked the aptitude needed for the task.", + "gold_answer": "Nick", + "os_answer": "Nick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig grew frustrated trying to coach Nick in soccer, as _ lacked the patience needed for the task.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Getting a divorce as soon as possible suited Victoria but not Lindsey because _ was no longer in love.", + "gold_answer": "Victoria", + "os_answer": "Victoria", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The musician liked playing at the auditorium more than at the park because he sounded quieter at the _ .", + "gold_answer": "park", + "os_answer": "park", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The musician liked playing at the auditorium more than at the park because he sounded louder at the _ .", + "gold_answer": "auditorium", + "os_answer": "auditorium", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Wanting to impress his boss, the man put the brandy away and served scotch instead because the _ was expensive.", + "gold_answer": "Scotch", + "os_answer": "scotch", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Wanting to impress his boss, the man put the brandy away and served scotch instead because the _ was cheap.", + "gold_answer": "Brandy", + "os_answer": "brandy", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Pho needs cilantro and beef to be tasty. However, the _ can be too bitter.", + "gold_answer": "cilantro", + "os_answer": "cilantro", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Pho needs cilantro and beef to be tasty. However, the _ can be too savory.", + "gold_answer": "beef", + "os_answer": "beef", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty's blanket was much thicker than Jessica's blanket, so _ felt cold all night in bed.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christopher declined when asked by Ian to play a game of chess because _ liked to play intellectual games.", + "gold_answer": "Ian", + "os_answer": "neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie had a phobia about crossing over high bridges but Tanya didn't. _ had to re-route their trip to avoid bridges.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth explained to Ryan that he was dressed like this because he was going to a disco party. _ was excited.", + "gold_answer": "Kenneth", + "os_answer": "Ryan", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth did not like Hunter because he was not a good manager. But he still respected _ because he was his superior.", + "gold_answer": "Hunter", + "os_answer": "him", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rebecca had a way of minimizing risks whereas Mary usually did not. This made _ want to assist.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Paolo tries to remember what he read in the textbook, but all he can think of is the email from his friend because he read the _ ages ago.", + "gold_answer": "textbook", + "os_answer": "textbook", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "If you are trying to get rid of blood spots from clothes use cold water instead of hot water the _ releases the stain.", + "gold_answer": "cold water", + "os_answer": "cold", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "If our relationship just started, should I get her a card or gift for Christmas? She might think I'm cheap if I give the _ .", + "gold_answer": "card", + "os_answer": "card", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "More people attended the funeral of Joel than of Derrick because _ was a mean person.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cleavage had to be hidden for this event's clothing because the _ was inappropriate.", + "gold_answer": "cleavage", + "os_answer": "dress", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Adam decided to shave Denniss beard before the reuinion, because _ thought it was too long.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam decided to shave Denniss beard before the reuinion, but _ thought it was too short.", + "gold_answer": "Dennis", + "os_answer": "Dennis", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rebecca had a sneezing reflex unlike Monica, so when they took the cinnamon challenge _ won.", + "gold_answer": "Monica", + "os_answer": "Rebecca", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John tried to clean the juice that spilled on the carpet with a towel but it has sunk deep. The _ is still dry.", + "gold_answer": "towel", + "os_answer": "towel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The landscaping looked better at the house than at the cottage because the _ owners used a hardworking company.", + "gold_answer": "house", + "os_answer": "house", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily had always loved kids and Jessica felt the opposite, so _ was surprised to become a pediatrician.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The intelligence agency ordered new computers for the workers and kept the same peripherals because the _ were at risk.", + "gold_answer": "computers", + "os_answer": "agents", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria planned to spring clean this weekend and told Katrina they should help too. _ purposely left home very early.", + "gold_answer": "Katrina", + "os_answer": "Katrina", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria planned to spring clean this weekend and told Katrina they should help too. _ expected her help.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nelson wanted to be an actor so Neil got them an audition because _ had poor connections in the movie industry.", + "gold_answer": "Nelson", + "os_answer": "Neil", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "During the charity drive, they decided to donate the couch but not the bed because the _ was broken.", + "gold_answer": "bed", + "os_answer": "bedframe", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man decided to use a nail instead of a screw because the _ would be looser in the wood.", + "gold_answer": "screw", + "os_answer": "screw", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jen made charcoal to use as a mask and as toothpaste, but using the _ made her skin very black.", + "gold_answer": "mask", + "os_answer": "charcoal", + "os_eval": "Incorrect", + "mcq_answer": "A. mask", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jen made charcoal to use as a mask and as toothpaste, but using the _ made her teeth very white.", + "gold_answer": "toothpaste", + "os_answer": "toothpaste", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven was disappointed as Logan asked him if he had any herb. _ was a stoner.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven was disappointed as Logan asked him if he had any herb. _ was let down.", + "gold_answer": "Steven", + "os_answer": "He", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Robert usually didn't like fish as much as Kyle however _ had a disliking for sardines on pizza.", + "gold_answer": "Kyle", + "os_answer": "Kyle", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Monica painted the porch for Kayla so the neighbor berated _ for being so lazy.", + "gold_answer": "Kayla", + "os_answer": "Kayla", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis made their weight loss goal before Eric, because _ only ate a healthy diet.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya looked for an escape route while Elena did not because _ liked to live in the moment.", + "gold_answer": "Elena", + "os_answer": "Elena", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya looked for an escape route while Elena did not because _ liked to be aware of all the surroundings.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael was on a diet, but cheated by eating junk food with Christopher. _ felt bad for ruining his plan.", + "gold_answer": "Christopher", + "os_answer": "He", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Elena waited patiently for Angela, as _ arrived early to meet at their prearranged spot.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Incorrect. The student should have used the name \"Elena\" instead of \"she\" to directly match the true answer provided.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In her newly purchased house, Patricia was upset to discover a woodworm infestation and called the realtor Victoria. _ called the sellers to ask them pay for an exterminator.", + "gold_answer": "Victoria", + "os_answer": "She", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In her newly purchased house, Patricia was upset to discover a woodworm infestation and called the realtor Victoria. _ wanted the sellers to pay for an exterminator.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We set up the treasure hunt, but the treasure chest was found easily on the path because the _ was big.", + "gold_answer": "chest", + "os_answer": "clue", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We set up the treasure hunt, but the treasure chest was found easily on the path because the _ was short.", + "gold_answer": "path", + "os_answer": "hunt", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald took medication for their anxiety, but Craig went to therapy because _ was open with their feelings.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald took medication for their anxiety, and Craig went to therapy because _ was private with their feelings.", + "gold_answer": "Donald", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Hunter found they no longer returned Joseph's love in their marriage, therefore _ received divorce papers.", + "gold_answer": "Joseph", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In order to grow his plants naturally, he bought fertilizer and water. The _ was lacking with nutrients.", + "gold_answer": "water", + "os_answer": "fertilizer", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In order to grow his plants naturally, he bought fertilizer and water. The _ was filled with nutrients.", + "gold_answer": "fertilizer", + "os_answer": "fertilizer", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kayla threw the phone to Rebecca, then _ asked for it to be thrown back.", + "gold_answer": "Kayla", + "os_answer": "Rebecca", + "os_eval": "Incorrect", + "mcq_answer": "B. Rebecca", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Michael had less money than Samuel did because _ liked to shop and spend money too much.", + "gold_answer": "Michael", + "os_answer": "Michael", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael had more money than Samuel did because _ like to shop and spend money too much.", + "gold_answer": "Samuel", + "os_answer": "Samuel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After a nasty breakup, Kayla needed a restraining order from Samantha because _ was scary to them.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I didn't do well on my exam even though I did all the problems in the textbook correctly. I guess the questions in the _ were just too hard.", + "gold_answer": "exam", + "os_answer": "exam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At dinner time, Tanya ate Erin's serving of peas even though _ really likes green vegetables.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sally knew the exam would be hard so she developed a study schedule. The _ was 4 weeks long.", + "gold_answer": "schedule", + "os_answer": "schedule", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sally knew the exam would be hard so she developed a study schedule. The _ was 4 weeks away.", + "gold_answer": "exam", + "os_answer": "exam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey brushed their teeth quite regularly but Brian did not. _ rarely had to go to a dentist.", + "gold_answer": "Jeffrey", + "os_answer": "Jeffrey", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey brushed their teeth quite regularly but Brian did not. _ had to go to a dentist often.", + "gold_answer": "Brian", + "os_answer": "Brian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The kid looked terrible in the ancient Egyptian dress because the _ was too small.", + "gold_answer": "kid", + "os_answer": "costume", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Monica was worried that Mary might be caught in a scam when they started their new job, but _ decided to trust their friend's judgement.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian taught Michael how to feed a rabbit greens because _ had rabbits as a kid.", + "gold_answer": "Brian", + "os_answer": "Brian", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "i had to walk closer to the board to see the phone numbers, only the monogram of the company is visible from a distance. The _ is bold.", + "gold_answer": "monogram", + "os_answer": "monogram", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He was having an asthma attack but forgot his inhaler so someone recommended coffee as the _ was unavailable.", + "gold_answer": "inhaler", + "os_answer": "alternative", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy tried to spread the cake icing all over the cake but the _ was not enough.", + "gold_answer": "icing", + "os_answer": "amount", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia teaches Kindergarten students, Christine teaches High School students therefore _ doesn't read aloud a lot.", + "gold_answer": "Christine", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia teaches Kindergarten students, Christine teaches High School students therefore _ reads aloud a lot.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey has dark lips unlike Elena due to _ remembering to put on chapsticks at night.", + "gold_answer": "Elena", + "os_answer": "not", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey has dark lips unlike Elena due to _ forgetting to put on chapsticks at night.", + "gold_answer": "Lindsey", + "os_answer": "her", + "os_eval": "GRADE: Incorrect\n\nThe student's answer \"her\" is a pronoun that does not clearly specify whether it is Lindsey or Elena who forgets to put on chapstick. The true answer \"Lindsey\" specifically identifies the subject, which should clearly be indicated in the response. Therefore, the student's answer is considered incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joseph has an allergy to mangoes, but Nelson does not, so _ has to be very careful.", + "gold_answer": "Joseph", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin went with Donald to the game because _ wanted to be the designated driver.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mike wanted to make the picture with the Photoshop software instead of the Paintshop software because the _ was more reliable.", + "gold_answer": "Photoshop software", + "os_answer": "output", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason missed his work shift in order to finish his research paper, because the _ was less important.", + "gold_answer": "work shift", + "os_answer": "shift", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The paper bags got torn when James was using it to move the groceries. The _ are weak.", + "gold_answer": "bags", + "os_answer": "bags", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven was worried about the height requirements for the rollercoaster more than Dennis was since _ was short.", + "gold_answer": "Steven", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven was worried about the height requirements for the rollercoaster more than Dennis was since _ was tall.", + "gold_answer": "Dennis", + "os_answer": "Dennis", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The quill was used by the writer much more than the pen for the job since the _ is heavy.", + "gold_answer": "pen", + "os_answer": "pen", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel has experience driving large vehicles and Lawrence doesn't. _ drives their RV with accuracy.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She used vinegar to wipe down the cabinets hourly and a wood cleaner monthly. The _ was overused.", + "gold_answer": "vinegar", + "os_answer": "vinegar", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Despite the fact that Joseph was sick and Craig was healthy, _ still stayed home from work that day.", + "gold_answer": "Craig", + "os_answer": "Joseph", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The teacher asked for the homework. Elena played games the night before and Tanya did not, so _ got an F.", + "gold_answer": "Elena", + "os_answer": "Elena", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The teacher asked for the homework. Elena played games the night before and Tanya did not, so _ got an A.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "B. Tanya", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William had a fear about nothing unlike Benjamin, because _ had a horrible childhood growing up.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The smell in the kitchen of the home is unbearable, while the laundry room smells fine. The _ must have been cleaned longer ago.", + "gold_answer": "kitchen", + "os_answer": "kitchen", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The clothing in the north was warmer than the clothing in the south because there was more snow in the _ .", + "gold_answer": "north", + "os_answer": "north", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The clothing in the north was warmer than the clothing in the south because there was more sun in the _ .", + "gold_answer": "south", + "os_answer": "south", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan grew the houseplant from seed, but Matthew bought a plastic plant instead, because _ tended to neglect plants.", + "gold_answer": "Matthew", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The thief tried to escape over the fence, but the _ was too short for him to climb over.", + "gold_answer": "thief", + "os_answer": "ladder", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The rib-eye steak needed some artisan pepper to season it because the _ was flavorful.", + "gold_answer": "pepper", + "os_answer": "steak", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The rib-eye steak needed some artisan pepper to season it because the _ was bland.", + "gold_answer": "steak", + "os_answer": "meat", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil introduced William, who is very shy, to his friends, but _ was being very embarrassing.", + "gold_answer": "Neil", + "os_answer": "Neil", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil introduced William, who is very shy, to his friends, but _ was being very quiet.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The gas was not smelling out of the tank but out of the hose because the _ is leaky.", + "gold_answer": "hose", + "os_answer": "hose", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The gas was not smelling out of the tank but out of the hose because the _ is sealed.", + "gold_answer": "tank", + "os_answer": "tank", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura had a much better body than Katrina, because _ spent all of their time at the ice cream shop.", + "gold_answer": "Katrina", + "os_answer": "Katrina", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My home is closer to the store than John's house, because the _ of me is next door.", + "gold_answer": "home", + "os_answer": "house", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Samantha believed in life after death while Christine did not, so _ never tried to talk to spirits.", + "gold_answer": "Christine", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James always had to wash his shoe after jogging on the street but it is not always the same when jogging on the lawn. The _ is clean.", + "gold_answer": "lawn", + "os_answer": "lawn", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "While at the store, Logan grabbed a head of lettuce for Eric to use for dinner, but _ already had some at home.", + "gold_answer": "Eric", + "os_answer": "Eric", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "While at the store, Logan grabbed a head of lettuce for Eric to use for dinner because _ knew there was none at home.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In the hotel laundry room, Felicia burned Mary's shirt while ironing it, so the manager wrote _ up.", + "gold_answer": "Felicia", + "os_answer": "her", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In the hotel laundry room, Felicia burned Mary's shirt while ironing it, so the manager gave _ a refund.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey asked Hunter when was the date set for the wedding because _ was getting married.", + "gold_answer": "Hunter", + "os_answer": "Hunter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey asked Hunter when was the date set for the wedding because _ was his best man.", + "gold_answer": "Jeffrey", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had never learned handwriting in school but Michael had learned beautiful script so, _ always typed all their correspondence.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia did laundry by hand, but Lindsey used the electric washer, because _ wore clothes made of delicate fabrics.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dancer would leave the stage and enter the hall after her dance was finished, as the _ was where she belonged during the dance.", + "gold_answer": "stage", + "os_answer": "stage", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick needed Kenneth to go to the store and get a baby bib, but _ said the one they had was still ok.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "His hands were a lot rougher than his thighs, because he used the _ for nothing.", + "gold_answer": "thighs", + "os_answer": "thighs", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine told Samantha at court their reasons for their expired license, since _ had the responsibility to attend.", + "gold_answer": "Christine", + "os_answer": "they", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine told Samantha at court their reasons for their expired license, since _ had the responsibility to judge.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig was all about self-publishing his first album, but a PRO rep Lawrence advised against it. _ advocated for a very hands-on approach to publishing.", + "gold_answer": "Craig", + "os_answer": "Lawrence", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig was all about self-publishing his first album, but a PRO rep Lawrence advised against it. _ advocated for a very hands-off approach to publishing.", + "gold_answer": "Lawrence", + "os_answer": "He", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The cleaning crew always used rags instead of washcloths, although the _ tended to wear out quickly.", + "gold_answer": "rags", + "os_answer": "rags", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I hated the project this year compared to the essay last year, because the _ required more work.", + "gold_answer": "project", + "os_answer": "project", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "While waiting for the movie to begin, Natalie bought popcorn and drinks for Lindsey, since _ had little money.", + "gold_answer": "Lindsey", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christopher was able to travel abroad, while William only travelled domestically, as _ had never applied for a passport.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The rubber resisted the rock but snapped on the concrete, as the _ was abrasive.", + "gold_answer": "concrete", + "os_answer": "concrete", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The rubber resisted the rock but snapped on the concrete, as the _ was smooth.", + "gold_answer": "rock", + "os_answer": "concrete", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Al got solar panels and a small generator installed at his house for electricity as the _ would be his main power supply.", + "gold_answer": "panels", + "os_answer": "solar", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The newborns in the nursery were very frail because they were fed the _ calorie food during the high and low calorie experiment..", + "gold_answer": "low", + "os_answer": "low", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The newborns in the nursery were very hardy because they were fed the _ calorie food during the high and low calorie experiment.", + "gold_answer": "high", + "os_answer": "high", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jane's hair was bound by a band until the band was cut because the _ is bulky.", + "gold_answer": "hair", + "os_answer": "band", + "os_eval": "Incorrect", + "mcq_answer": "B. hair", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The patient put in a special request for Brett instead of Kyle because _ was always stern.", + "gold_answer": "Kyle", + "os_answer": "Kyle", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel decided on adopting a young puppy but Megan didn't because _ didn't want to train a pupply.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin became very ill with pneumonia, so Matthew made him some soup; then _ finally went home.", + "gold_answer": "Matthew", + "os_answer": "Matthew", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Applying to dance in music videos was great for Erin but not Lindsey because _ was a beginner dancer.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The landlord said she had violated her lease by allowing a dog into the apartment. She said that the dog did not violate the _ at all.", + "gold_answer": "lease", + "os_answer": "lease", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin asked Samuel to buy them a puppy, because _ could not have a pet.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The jeans fit worse than the shirt because I had tried the _ on at the store.", + "gold_answer": "shirt", + "os_answer": "shirt", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nelson teased Christopher about needing to find a homecoming date because _ could not find one.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nelson teased Christopher about needing to find a homecoming date because _ already had one.", + "gold_answer": "Nelson", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The athletes on the team of Christine were more tired than those on the team of Monica because the ones with _ did less laps.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The athletes on the team of Christine were less tired than those on the team of Monica because the ones with _ did less laps.", + "gold_answer": "Christine", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John could not buy anything from the store than night and he went to the kiosk to buy some things because the _ is opened.", + "gold_answer": "kiosk", + "os_answer": "kiosk", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In order to increase her estrogen, Jenny started eating carrots instead of donuts because the _ were not junky.", + "gold_answer": "carrots", + "os_answer": "carrots", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It smelled a lot better near the pool than it did near the compost because there was no garbage in the _ .", + "gold_answer": "pool", + "os_answer": "pool", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James was able to hide the book inside his jacket because the _ is small.", + "gold_answer": "book", + "os_answer": "book", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James was able to hide the book inside his jacket because the _ is big.", + "gold_answer": "jacket", + "os_answer": "jacket", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian laughs at Ryan because of the small Christmas tree they picked out. _ wants a table top tree.", + "gold_answer": "Ryan", + "os_answer": "Ryan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian laughs at Ryan because of the small Christmas tree they picked out. _ wants a six foot tree.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Betty gave the full pitcher to Rachel so _ could fill her glass with water.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett looks as if they are aging at half the rate of Craig because _ has lived a rough lifestyle.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel's date was shorter than she, so she wore her shoes rather than her boots, because the _ had high heels.", + "gold_answer": "boots", + "os_answer": "boots", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel's date was shorter than she, so she wore her shoes rather than her boots, because the _ had low heels.", + "gold_answer": "shoes", + "os_answer": "shoes", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The store had 80 platters but only 2 bowls left in stock because the _ were in high demand.", + "gold_answer": "bowls", + "os_answer": "bowls", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The store had 80 platters but only 2 bowls left in stock because the _ were in low demand.", + "gold_answer": "platters", + "os_answer": "platters", + "os_eval": "Correct", + "mcq_answer": "A.", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah had to call in an expert unlike Erin because _ had no knowledge on the subject.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A. Sarah", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah had to call in an expert unlike Erin because _ had vast knowledge on the subject.", + "gold_answer": "Erin", + "os_answer": "Sarah", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica really enjoys a vodka drink, but Felicia prefers whiskey because _ likes dark liquors.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica really enjoys a vodka drink, but Felicia prefers whiskey because _ likes clear liquors.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The knee injury of Samantha has healed much quicker than Katrina's. _ 's injury was minor.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia felt very thirsty but Sarah did not feel thirsty. _ bought a bag of chips.", + "gold_answer": "Sarah", + "os_answer": "Sarah", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha failed on the test but Mary got very good marks because _ had been very lazy.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle wanted to write to Aaron every day, because _ enjoyed sending letters to friends.", + "gold_answer": "Kyle", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle wanted to write to Aaron every day, because _ enjoyed receiving letters from friends.", + "gold_answer": "Aaron", + "os_answer": "Aaron", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The toddler kicked the soft furniture and hard toy, but only the _ caused pain.", + "gold_answer": "toy", + "os_answer": "toy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The toddler kicked the hard furniture and soft toy, but only the _ caused pain.", + "gold_answer": "furniture", + "os_answer": "furniture", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica saw Laura constantly flirt with men in the office. _ thought it was normal in a place of business and she was admired by their coworkers.", + "gold_answer": "Laura", + "os_answer": "They", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Much to the dismay of Christopher, Jeffrey learned of their evil plan, and _ was stopped before it succeeded.", + "gold_answer": "Christopher", + "os_answer": "it", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The student wanted to be respectful to the teacher so he got her a book instead of an apple because the _ was old.", + "gold_answer": "apple", + "os_answer": "tradition", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha's main artistic medium was paint, while Patricia preferred to work with clay, since _ was trained as a sculptor.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil asked Brian to hand him the measuring tape, but _ already measured the wall to center the picture.", + "gold_answer": "Brian", + "os_answer": "Brian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The creams didn't work as well on my skin as the lotions did because the _ were new.", + "gold_answer": "lotions", + "os_answer": "creams", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kiwis are a favorite of Ryan, while Derrick can't eat them. _ has sensitive teeth.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Although Amy worked harder and longer than Rebecca, _ was a more wealthy person overall.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James wanted to write a list of what he can do for Christmas and he ended up using all the pages in the notepad. The _ is long.", + "gold_answer": "list", + "os_answer": "list", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James wanted to write a list of what he can do for Christmas and he ended up using all the pages in the notepad. The _ is short.", + "gold_answer": "page", + "os_answer": "list", + "os_eval": "Incorrect", + "mcq_answer": "C. notepad", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Samantha gifted her new bathrobe to Betty because it felt very comfortable for _ when she tried it on.", + "gold_answer": "Betty", + "os_answer": "her", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Samantha gifted her new bathrobe to Betty because it felt very itchy for _ when she tried it on.", + "gold_answer": "Samantha", + "os_answer": "her", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The chopstick were better to eat the noodles with than the fork as the _ was repaired.", + "gold_answer": "chopstick", + "os_answer": "fork", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "James was finding a space on the couch for the box to be placed but he could not find it because the _ is big.", + "gold_answer": "box", + "os_answer": "box", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael loved eating many different vegetables but not Brett because _ was on a vegetarian diet.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "It was painful for Justin to break up with Jason, but _ wasn't ready to move on.", + "gold_answer": "Jason", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Needing a boost Emily asked Rachel to put them on their shoulders in order to reach the roof, _ is tall in height.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Bill had complicated feelings about getting a car after his motorcycle died because the _ possessed a lot of new features.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Bill had complicated feelings about getting a car after his motorcycle died because the _ possessed a lot of sentimental value.", + "gold_answer": "motorcycle", + "os_answer": "motorcycle", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "As a marine, Emily looks down on civilians like Maria, so _ is a bit saddened.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle makes a lot more money than Nelson can make at his job, as _ is a cashier.", + "gold_answer": "Nelson", + "os_answer": "Nelson", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The food that Hunter ate was spoiled but not that of Brett because _ left his food outside.", + "gold_answer": "Hunter", + "os_answer": "Hunter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The food that Hunter ate was spoiled but not that of Brett because _ left his food in the fridge.", + "gold_answer": "Brett", + "os_answer": "Brett", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura held the steel for their project while Carrie used the blowtorch, because _ was more skilled.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy recognized the man in the waiting room before Monica did, because _ had met the man only once.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nick smelled much worse than Kenneth after the baseball game although _ was wearing deodorant.", + "gold_answer": "Nick", + "os_answer": "Nick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Mark wanted to lose some weight by starting a diet and workout routine. He focused mainly on the _ because he was lazy.", + "gold_answer": "diet", + "os_answer": "diet", + "os_eval": "Correct", + "mcq_answer": "B.", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The drink was rich in caffeine and low in sugar because the _ was suffice in keeping the drinker awake.", + "gold_answer": "caffeine", + "os_answer": "caffeine", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The drink was rich in caffeine and low in sugar because the _ was not enough to keep the drinker awake.", + "gold_answer": "sugar", + "os_answer": "caffeine", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The tree fell down sooner than the sapling because the roots of the _ were stronger.", + "gold_answer": "tree", + "os_answer": "sapling", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The tree fell down after the sapling because the roots of the _ were weaker.", + "gold_answer": "sapling", + "os_answer": "tree", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The man with the fever came over and talked to Carrie and not Lindsey because _ was a patient.", + "gold_answer": "Lindsey", + "os_answer": "Carrie", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Samantha told Lindsey to be careful with the porcelain doll; when she ignored her and dropped the doll, _ was very sorry.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The Windows software attempted to install the upgrades onto the computer, but the _ exceeded data capacity.", + "gold_answer": "software", + "os_answer": "installation", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The Windows software attempted to install the upgrades onto the computer, but the _ was outdated.", + "gold_answer": "computer", + "os_answer": "firmware", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "James could not lift the bottle of water up to the table top because the _ is tall.", + "gold_answer": "table", + "os_answer": "table", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria gave birth to Katrina, so after the process was over, _ was a brand new mother.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jan planted her herbs in small growing bags, but she worried that the _ would be too shallow for them to put down roots.", + "gold_answer": "bags", + "os_answer": "soil", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jan planted her herbs in small growing bags, but she worried that the _ would be too stifled to put down roots.", + "gold_answer": "herbs", + "os_answer": "plants", + "os_eval": "Correct.", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Writing came easily to Carrie but was difficult for Natalie because _ had taken engineering in college.", + "gold_answer": "Natalie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina asked Rachel to change the diapers for the babies this morning because _ is handling the stove.", + "gold_answer": "Katrina", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina asked Rachel to change the diapers for the babies this morning because _ isn't doing anything.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett took more medicines than Aaron did although _ was suffering from many more diseases.", + "gold_answer": "Aaron", + "os_answer": "Aaron", + "os_eval": "Correct", + "mcq_answer": "B. Aaron", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The life of Christine was pretty basic until they met Maria , _ is a is lover of excitement .", + "gold_answer": "Maria", + "os_answer": "who", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin lied to Logan because _ was so upset about the money that was missing.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha decided to mix the mortar while Rebecca applied it to the wall. _ was not good at the finishing touches.", + "gold_answer": "Samantha", + "os_answer": "Rebecca", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick greeted Craig at the event but he did not respond to him because _ is humble.", + "gold_answer": "Derrick", + "os_answer": "Craig", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Derrick greeted Craig at the event but he did not respond to him because _ is arrogant.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica chose Kayla as the winning contestant on the reality show because _ was a contestant on the show.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael swam in the pond for longer than Derrick because _ thought the algae was okay.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth worked hard at training martial arts but not Samuel. _ couldn't made their dream come true of fighting in the UFC octagon.", + "gold_answer": "Samuel", + "os_answer": "Neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Because Megan wanted to be a welder and Patricia wanted to be a engineer, _ went to university instead of trade school.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Because Megan wanted to be a welder and Patricia wanted to be a engineer, _ went to trade school instead of university.", + "gold_answer": "Megan", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man took longer to pay for the shoes than the shirt because he paid for the _ in coins.", + "gold_answer": "shoes", + "os_answer": "shoes", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man took longer to pay for the shoes than the shirt although he paid for the _ in coins.", + "gold_answer": "shirt", + "os_answer": "shirt", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James was able to hide to gift he brought wit him in his pocket because the _ is big.", + "gold_answer": "pocket", + "os_answer": "pocket", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James was able to hide to gift he brought wit him in his pocket because the _ is small.", + "gold_answer": "gift", + "os_answer": "gift", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sometimes I write in my journal with a pencil instead of a pen, but the _ can be run dry.", + "gold_answer": "pen", + "os_answer": "pencil", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John cannot run the entire length of the track, he had been used to the field. The _ is short.", + "gold_answer": "field", + "os_answer": "field", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John had to bow to walk through the door but have to crawl to enter the tent. The _ is taller.", + "gold_answer": "door", + "os_answer": "door", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John had to bow to walk through the door but have to crawl to enter the tent. The _ is shorter.", + "gold_answer": "tent", + "os_answer": "tent", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam's blushed a deep red when Jeffrey saw him fall off his horse, but _ tried to pretend it didn't hurt.", + "gold_answer": "Adam", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Leslie told Aaron he only wanted to eat food that was healthy, he was laughed at. The teacher comforted _ immediately.", + "gold_answer": "Leslie", + "os_answer": "Leslie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Leslie told Aaron he only wanted to eat food that was healthy, he was laughed at. The teacher scolded _ immediately.", + "gold_answer": "Aaron", + "os_answer": "Aaron", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor treated Natalie, but refused to see Tanya, because _ has an incredible insurance plan.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica asked Rebecca to go see a new horror movie even though _ knew she would likely to decline the invitation.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It doesn't take much to shift between ice and water. The _ is hard and strong when its cold.", + "gold_answer": "ice", + "os_answer": "ice", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It doesn't take much to shift between ice and water. The _ is fluid and flexible when its warm.", + "gold_answer": "water", + "os_answer": "boundary", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy's being taught how to pay it forward by Kayla, so _ is likely the younger person.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven asked Joseph to have their stomach examined after _ had a night full of really bad gas issues.", + "gold_answer": "Joseph", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The assertive commander told the privates to change their boots but not their shirts because the _ were disgusting.", + "gold_answer": "boots", + "os_answer": "boots", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The assertive commander told the privates to change their boots but not their shirts because the _ were fine.", + "gold_answer": "shirts", + "os_answer": "shirts", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The chef decided to omit the chicken from his signature dish for the party, because the _ needed to be vegetarian.", + "gold_answer": "dish", + "os_answer": "menu", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Timmy bought a transporter for his cat so he could take him on the plane but the _ was too small.", + "gold_answer": "transporter", + "os_answer": "transporter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia was given a leather belt from Betty to clean it, because _ knows how to do it.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia was given a leather belt from Betty to clean it, because _ doesn't know how to clean it.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Eric replaced his long hair with a new hat for the summer time, the _ was old.", + "gold_answer": "hair", + "os_answer": "hat", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter had low tire pressure and asked Eric to fill the tires; when he said no, _ filled the tires.", + "gold_answer": "Hunter", + "os_answer": "Hunter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie tried to convince Cynthia that the cat needed a microchip because _ was concerned about the cat getting lost.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor felt more sympathy for Aaron than Ryan because _ had a curable illness and great insurance.", + "gold_answer": "Ryan", + "os_answer": "Aaron", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Emily delivered the daily newspaper to Samantha promptly, so _ gave a nice Christmas bonus.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily delivered the daily newspaper to Samantha promptly, so _ expected a nice Christmas bonus.", + "gold_answer": "Emily", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jack wanted to start a game, but couldn't decide between baseball or basketball. The _ game would needed fewer of friends.", + "gold_answer": "basketball", + "os_answer": "second", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jack wanted to start a game, but couldn't decide between baseball or basketball. The _ game would call for more friends.", + "gold_answer": "baseball", + "os_answer": "basketball", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James wanted to wear the corsage but it wouldn't fit around his wrist because his _ was too small.", + "gold_answer": "corsage", + "os_answer": "wrist", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James wanted to wear the corsage but it wouldn't fit around his wrist because the _ was too big.", + "gold_answer": "wrist", + "os_answer": "band", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura was climbing down from the roof and Katrina was below so, _ was holding the ladder.", + "gold_answer": "Katrina", + "os_answer": "she", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Bill could only go out to the restaurants rather than the bars because going to the _ required a minimum age.", + "gold_answer": "bars", + "os_answer": "bars", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina demanded that Jessica get off of their property, because _ was in the neighborhood for visiting.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina demanded that Jessica get off of their property, because _ wasn't in the mood for visiting.", + "gold_answer": "Katrina", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the hospital, Kenneth tended to Randy 's wounds as _ was learning to contain an infection.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Justin admired the art hung on the wall by Nick, so _ asked if he would like to take something home.", + "gold_answer": "Nick", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man chose medication for his infection rather than the ointment, because the _ was ineffective.", + "gold_answer": "ointment", + "os_answer": "ointment", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary felt a great deal of guilt for stealing various items from Rachel so _ forgave her.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis warned Craig if they were late to work agian they would suffer termination, _ works for the boss at the local factory.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Patricia bought Christine a watch for their birthday because _ was tired of asking about the time.", + "gold_answer": "Christine", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The teenager chose a jeweled pin for her belly piercing, but the _ was too tiny.", + "gold_answer": "piercing", + "os_answer": "jewel", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The teenager chose a jeweled pin for her belly piercing, but the _ was too huge.", + "gold_answer": "pin", + "os_answer": "jewel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After visiting their tenth college, Kevin asked Donald to just make up his mind, because _ just didn't have time for more.", + "gold_answer": "Kevin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After visiting their tenth college, Kevin demanded that Donald to just make up _ 's mind, because he just didn't have time for more.", + "gold_answer": "Donald", + "os_answer": "his", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the store, John signed a warranty contract for the tablet, but did not purchase insurance for the phone, because the _ was unlikely to be damaged.", + "gold_answer": "phone", + "os_answer": "phone", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the store, John signed a warranty contract for the tablet, but did not purchase insurance for the phone, because the _ was likely to be damaged.", + "gold_answer": "tablet", + "os_answer": "tablet", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Bob had a love and hate relationship with gambling and the _ grew as he won more money.", + "gold_answer": "love", + "os_answer": "tension", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine was tired of Maria being a pain in the neck after _ laid down the prank trap.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Derrick told Christopher about quitting school to provide for their family, _ started panicking.", + "gold_answer": "Derrick", + "os_answer": "Christopher", + "os_eval": "Incorrect", + "mcq_answer": "B. Christopher", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The food Katrina made was very bland, so Victoria added some salt; _ felt bad and vowed not to season again.", + "gold_answer": "Victoria", + "os_answer": "Katrina", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She was the prettiest in the room, wearing a pretty dress and jewelry. The _ was sparkling.", + "gold_answer": "jewelry", + "os_answer": "jewelry", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason hired his coworker to paint the house instead of hiring a painting company, because the _ will do it for more money.", + "gold_answer": "painting company", + "os_answer": "company", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The crops in the facility grew better than in the greenhouse since the _ was bright inside.", + "gold_answer": "facility", + "os_answer": "lighting", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Beautiful roses were bought by Jason for Dennis because _ is a receiver in general.", + "gold_answer": "Dennis", + "os_answer": "Dennis", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The battery of the the phone died faster than the laptop battery, because the _ was always off.", + "gold_answer": "laptop", + "os_answer": "laptop", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The battery of the the phone died faster than the laptop battery, because the _ was always on.", + "gold_answer": "phone", + "os_answer": "screen", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia ran out of shirts and borrowed one from Patricia, but _ didn't ask permission ahead of time.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I wanted to use pomade on my hair instead of hairspray but it was old so the _ was unusable.", + "gold_answer": "pomade", + "os_answer": "pomade", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan picked up some olive oil for Felicia because _ hated to cook but loved to eat.", + "gold_answer": "Megan", + "os_answer": "Felicia", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Megan picked up some olive oil for Felicia because _ loved to cook but hated to eat.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian always got ready quickly in the morning and ended up waiting for Christopher, _ was always punctual.", + "gold_answer": "Ian", + "os_answer": "who", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kayla always wears sunscreen outdoors but Natalie doesn't because _ isn't concerned about getting neck wrinkles.", + "gold_answer": "Natalie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia wanted to be pampered by Emily, so _ went to the jewelry store and bought an expensive ring.", + "gold_answer": "Emily", + "os_answer": "Emily", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man couldn't stop thinking about the violin and the crossbow he lost when he was younger. He used to love to shoot _ .", + "gold_answer": "crossbow", + "os_answer": "arrows", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mastering the game of chess was easier for Brian than William because _ had an analytical mind.", + "gold_answer": "Brian", + "os_answer": "Brian", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The gerbil came over to Laura but not Monica because _ was holding a hockey stick.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The gerbil came over to Laura but not Monica because _ was holding a carrot stick.", + "gold_answer": "Laura", + "os_answer": "Laura", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle loved to camp in the wilderness but Justin preferred a nice hotel. _ booked a trip to New York City.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle loved to camp in the wilderness but Justin preferred a nice hotel. _ booked a trip to Yellowstone Park.", + "gold_answer": "Kyle", + "os_answer": "Kyle", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The _ car was a pleasure to drive but the red car was not as the blue car was very expensive.", + "gold_answer": "blue", + "os_answer": "blue", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The blue car was a pleasure to drive but the _ car was not as the red car was very cheap.", + "gold_answer": "red", + "os_answer": "red", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha wanted to use a valet to park the car but Carrie did not because _ was generous with money.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The trumpet part overpowered the reeds but could not be heard over the strings, as the _ were just too quiet .", + "gold_answer": "reeds", + "os_answer": "reeds", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James forgot to put the food in the freezer so he had to eat the fruits the next day because the _ is rotting.", + "gold_answer": "food", + "os_answer": "fruit", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The patient took calcium to fix his broken bone but the _ was too weak.", + "gold_answer": "bone", + "os_answer": "bone", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The patient took calcium to fix his broken bone but the _ was too strong.", + "gold_answer": "calcium", + "os_answer": "pain", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily has never struggled with blood clots like Victoria has, because _ lives a sedentary, gluttonous lifestyle.", + "gold_answer": "Victoria", + "os_answer": "Victoria", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "On the playground at school during recess, Monica called Emily a chicken because _ was capable of climbing the ladder.", + "gold_answer": "Monica", + "os_answer": "Emily", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "On the playground at school during recess, Monica called Emily a chicken because _ was scared of climbing the ladder.", + "gold_answer": "Emily", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hannah had to get a lawyer to help her understanding of the contract language because the _ the contract had was too complex.", + "gold_answer": "language", + "os_answer": "jargon", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary loved to make baked potatoes, but Monica couldn't stand the smell; _ asked her to only make them when she was alone.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary loved to make baked potatoes, but Monica couldn't stand the smell; _ only made them when she was alone.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The fisherman wanted to put the rock in the pond but the _ was too small.", + "gold_answer": "pond", + "os_answer": "pond", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Joe did a lot worse on the quiz last week than he did on the test today, because the _ was a surprise.", + "gold_answer": "quiz", + "os_answer": "quiz", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena was asked by Jessica to put patches in the holes in her pants; _ gave her some she bought at the store.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena was asked by Jessica to put patches in the holes in her pants; _ used some she already had at home.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Learning a new form of karate was difficult for Logan but not William because _ was not athletic.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian wanted a horse but not Nick because _ raised cattle in their spare time.", + "gold_answer": "Brian", + "os_answer": "Nick", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Elena liked lizards more than Rachel did, so _ was appalled to receive a pet gecko for her birthday.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan preferred to snowboard while Kyle wanted to do biathlon so _ went up the hill.", + "gold_answer": "Logan", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She watered the rose but not the cactus, because the soil of the _ was already wet.", + "gold_answer": "cactus", + "os_answer": "cactus", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She watered the rose but not the cactus, because the soil of the _ was already dry.", + "gold_answer": "rose", + "os_answer": "cactus", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nick did not like sauces made from tomato, only creamy sauces. Ryan knew this so he only made white sauce when _ came over.", + "gold_answer": "Nick", + "os_answer": "Nick", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The ingredients that I use are tastier than the available toppings because the _ are old.", + "gold_answer": "toppings", + "os_answer": "toppings", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel knew exactly how to treat the injured person's wound but not Emily because _ took a woodworking class in high school.", + "gold_answer": "Emily", + "os_answer": "Rachel", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The dress could use either velcro or a zipper to close, the _ would last longer.", + "gold_answer": "zipper", + "os_answer": "zipper", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The class was going on a bus on a field trip to a local museum. The _ had to close at 4.", + "gold_answer": "museum", + "os_answer": "museum", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kelly was embarrassed when his toga fell off at the party and people saw his underwear because the _ was too tight.", + "gold_answer": "underwear", + "os_answer": "belt", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kelly was embarrassed when his toga fell off at the party and people saw his underwear because the _ was too loose.", + "gold_answer": "toga", + "os_answer": "belt", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kayla was always thinner than Rachel because _ enjoyed eating brioche and butter every morning.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Robert has no regret for punching Justin in the nose even though _ was the victim of injustice.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Robert has no regret for punching Justin in the nose because _ was the victim of injustice.", + "gold_answer": "Robert", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dark circles under Erin's eyes were darker than Cynthia's due to _ being older.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cake got burnt under the heat applied to it. It appears the _ is too small.", + "gold_answer": "cake", + "os_answer": "oven", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Harper wanted to wear a cowboy hat and a bolero tie to her party, but the _ didn't fit her head.", + "gold_answer": "hat", + "os_answer": "hat", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura put fruit in their pie for Lindsey to eat, and _ ate half the pie after that one was done baking.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I started a program for youth that worked better than the old system, because the _ is new.", + "gold_answer": "program", + "os_answer": "approach", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William was very comfortable entering Kenneth 's personal domain any time, as _ was very self-assured.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya recently finished filling out a job application but not Megan because _ is currently unemployed.", + "gold_answer": "Tanya", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Tanya recently finished filling out a job application but not Megan because _ is currently working.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence had lost a lot of weight on their diet but Hunter wasn't nearly as succesful. _ was now heavy.", + "gold_answer": "Hunter", + "os_answer": "He", + "os_eval": "Incorrect", + "mcq_answer": "B. Hunter", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey did not know how to make a good impression for an interview with Tanya. _ was surprised when she did not get the job.", + "gold_answer": "Lindsey", + "os_answer": "She", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya wanted to audition for the show that Sarah was casting, so _ watched her routine very carefully.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When it came to taking care of elderly people, Adam was suited for the job more than Brian because _ lived with younger people longer.", + "gold_answer": "Brian", + "os_answer": "Adam", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Felicia experienced a tummy ache while Tanya did not because _ had not eaten any food.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin was self-conscious of her legs and Katrina didn't help by making fun of them, but _ went to the gym to try and help her.", + "gold_answer": "Katrina", + "os_answer": "Erin", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "While shopping at the mall, Kevin asked Benjamin to help find a red shirt to wear because _ was great at clothing budgeting.", + "gold_answer": "Benjamin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "As a parent, Catherine doesn't let her kids watch movies, but they can watch some TV shows. Catherine thinks the _ are too violent.", + "gold_answer": "movies", + "os_answer": "movies", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey loves dogs and doesn't have one of her own. So when Amy visits with her dog, _ gives it treats and spoils it.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "the scanning tool could not get through the cervix because the _ was too big.", + "gold_answer": "tool", + "os_answer": "fetus", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "the scanning tool could not get through the cervix because the _ was too small.", + "gold_answer": "cervix", + "os_answer": "os", + "os_eval": "Incorrect.", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Mary didn't know what the currency of Mexico was but Lindsey knew _ had never been to Mexico before.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Megan sentenced Jennifer to probation for stealing from the grocery store, _ obeys the laws that are written.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Mary thinks Sarah has beautiful skin, even though _ actually has the better complexion of the two.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia loved the smell of Rachel's shampoo, so she asked where to buy it. _ gave her a bottle the next day.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald had to drive Matthew to the doctor immediately because _ was feeling lightheaded and dizzy.", + "gold_answer": "Matthew", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The apartment Brett rented was owned by Jason, so _ sent the rent for the apartment each month.", + "gold_answer": "Brett", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The apartment Brett rented was owned by Jason, so _ received the rent for the apartment each month.", + "gold_answer": "Jason", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I don't want to use that iron on my new shirt, and, yes, it's because the _ is too expensive.", + "gold_answer": "shirt", + "os_answer": "shirt", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I don't want to use that iron on my new shirt, and, yes, it's because the _ is too cheap.", + "gold_answer": "iron", + "os_answer": "cord", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wound caused by the bullet needed more care than the one caused by the knife because the _ wound was superficial.", + "gold_answer": "knife", + "os_answer": "knife", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle was in a lot of pain after running the marathon in place of Brian, but _ appreciated the support of his cause.", + "gold_answer": "Brian", + "os_answer": "Brian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy asked Maria how to make homemade candles to give as gifts. _ knew she had a lot of experience making them.", + "gold_answer": "Amy", + "os_answer": "She", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Patricia liked to lie around in a hammock all day but Megan did not because _ was very sedentary.", + "gold_answer": "Patricia", + "os_answer": "it", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Hank was eating cereal and spilt milk on his hot pants and decided to get his pleated pants. He needed to change into new leggings because the _ are clean.", + "gold_answer": "pleated pants", + "os_answer": "leggings", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sara's cat got fleas so she bought a treatment and put it on the cat's neck. The cat was unhappy and tried to lick it off the _ .", + "gold_answer": "neck", + "os_answer": "treatment", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick always wanted to wash when they woke up but Benjamin rarely bothered. _ was a very dirty person.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick always wanted to wash when they woke up but Benjamin rarely bothered. _ was a very clean person.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie is a forest ranger, Jessica is a cook therefore _ probably can't tell you how to plant your pine tree.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin brought a a saw and hammer to prepare making a cupboard for Benjamin because _ is his employer.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia was on a diet and did not eat the cookies Rebecca baked for her. _ was jealous.", + "gold_answer": "Patricia", + "os_answer": "Rebecca", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kenneth's back is being tended to by Derrick at the office, so _ is the client in this situation.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin used a stencil on their presentation lettering but Derrick did not. _ had a very sloppy looking presentation.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin used a stencil on their presentation lettering but Derrick did not. _ had a very neat looking presentation.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The mirror didn't lie when it showed how overweight Patricia was and how emaciated Felicia was, so _ needed to go on diet.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stores used posters instead of flyers, because the overall cost of distribution for the _ was cheaper.", + "gold_answer": "posters", + "os_answer": "posters", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stores used posters instead of flyers, but the overall cost of distribution for the _ was cheaper.", + "gold_answer": "flyers", + "os_answer": "posters", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "With my ankle sprain, I am not able to put my foot in my shoe because the _ is too fat.", + "gold_answer": "sprain", + "os_answer": "swelling", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Logan could eat gluten while Adam could not, and _ always had a smaller variety of foods to choose from.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria wasn't aware that Erin was coming up behind them, because _ was generally sneaky.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael was a better employer than Joel so _ had to worry about retaining employees.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael was a better employer than Joel so _ did not have to worry about retaining employees.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James was suffering from nausea and decided to drink ginger tea but the _ was too meek.", + "gold_answer": "tea", + "os_answer": "flavor", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Two friends wanted a tan look but Joel was impatient while Robert wasn't. _ used bronzer to get a tan look.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Playing basketball came easier for Cynthia than Jennifer but _ had more control of their body movements.", + "gold_answer": "Jennifer", + "os_answer": "Jennifer", + "os_eval": "Correct", + "mcq_answer": "B. Jennifer", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Playing basketball came easier for Cynthia than Jennifer but _ had less control of their body movements.", + "gold_answer": "Cynthia", + "os_answer": "Jennifer", + "os_eval": "Incorrect", + "mcq_answer": "B. Jennifer", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The lady was blushing when she walked passed Amy but not Carrie because _ was intrigued by her.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis's home just burned down, but luckily Donald's was spared. So, now _ is grateful.", + "gold_answer": "Donald", + "os_answer": "Donald", + "os_eval": "Correct", + "mcq_answer": "B. Donald", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan focused more on proper posture than Lindsey because _ wanted to become a model.", + "gold_answer": "Megan", + "os_answer": "Megan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan focused less on proper posture than Lindsey because _ wanted to become a model.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria had no issues with Achilles Tendinitis unlike Betty because _ never wore sneakers with cushion.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina did not value the antique pictures as much as Lindsey because _ was a history buff.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan's boil cleared up right away while Christopher's boil got infected due to _ applying medicine later.", + "gold_answer": "Christopher", + "os_answer": "him", + "os_eval": "GRADE: Correct\n\nThe student's use of \"him\" correctly refers back to Christopher as mentioned in the sentence context, effectively replacing the word \"Christopher\" in the true answer without changing the meaning or introducing errors.", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason went zooming down Brett's street way too fast on his motorcycle, causing _ great excitement.", + "gold_answer": "Jason", + "os_answer": "great", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela wanted to find a partner, but Victoria wanted to stay single, because _ was lonely.", + "gold_answer": "Angela", + "os_answer": "Angela", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My teeth hurt more after eating the cake than the pie because the _ was not as sweet.", + "gold_answer": "pie", + "os_answer": "pie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My teeth hurt more after eating the cake than the pie because the _ was sweeter tasting.", + "gold_answer": "cake", + "os_answer": "cake", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "On Valentine's Day, Brian receives no flowers, but Kevin gets a lot. _ is probably dating someone.", + "gold_answer": "Kevin", + "os_answer": "Kevin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael had to learn how to speak Chinese for his job unlike Matthew, because _ worked in China.", + "gold_answer": "Michael", + "os_answer": "Michael", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael had to learn how to speak Chinese for his job unlike Matthew, because _ worked in England.", + "gold_answer": "Matthew", + "os_answer": "Matthew", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The boards were used to build the houses instead of the bricks as the _ were sparse.", + "gold_answer": "bricks", + "os_answer": "bricks", + "os_eval": "Correct", + "mcq_answer": "B. bricks", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty avoided getting attacked in the dark alley where Elena was mugged, because _ ignored their intuition.", + "gold_answer": "Elena", + "os_answer": "Elena", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The actors practiced the scenes in the parking lot more than the scenes in the morgue, because the _ scenes are full of silence.", + "gold_answer": "morgue", + "os_answer": "morgue", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria was interested in babies, but Katrina thought they were annoying, so _ preferred visiting the nursery.", + "gold_answer": "Victoria", + "os_answer": "Victoria", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The laws of the government are a lot worse than the rules of schools, because the _ are strict.", + "gold_answer": "laws", + "os_answer": "penalties", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The kids at camp liked the activities with water, but avoided the sand, because the _ was cleansed.", + "gold_answer": "water", + "os_answer": "lake", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When gambling in Las Vegas, Christine usually bets less playing poker than Elena because _ is more cautious.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie is extremely shy, but Lindsey is good at talking to strangers, which makes _ worse at telemarketing.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin thought Android was the superior phone system but Ian thought IOS was better. _ bought a new Note 9 from Verizon.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin thought Android was the superior phone system but Ian thought IOS was better. _ bought a new iPhone 9 from Verizon.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jill bought a slip to go with her new skirt but the _ was too short and it hung out the bottom.", + "gold_answer": "skirt", + "os_answer": "slip", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jill bought a slip to go with her new skirt but the _ was too long and it hung out the bottom.", + "gold_answer": "slip", + "os_answer": "slip", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan kept a store of ammo in their house but Brian did not as _ approved of hunting.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B. Brian", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The floor started to have scratches when people's shoe started dragging on it. The _ was rough.", + "gold_answer": "shoe", + "os_answer": "abrasion", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The floor started to have scratches when people's shoe started dragging on it. The _ was smooth.", + "gold_answer": "floor", + "os_answer": "floor", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig made sure to stretch before working out but Christopher never did, so _ frequently got injuries.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B. Christopher", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena is concerned that Megan might have a Twitter addiction, but _ is probably worrying about nothing.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald was chosen to be a model while Dennis was passed over, because _ was exceptionally tall.", + "gold_answer": "Donald", + "os_answer": "Donald", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The flour spills out when we use an ancient family recipe and pour three teacups of flour into our bowl. The _ is too small.", + "gold_answer": "bowl", + "os_answer": "bowl", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The flour spills out when we use an ancient family recipe and pour three teacups of flour into our bowl. The _ is too big.", + "gold_answer": "teacup", + "os_answer": "bowl", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The pharmacy offered a product that could cure any disease, made of a new chemical and container, but the _ was not FDA approved.", + "gold_answer": "chemical", + "os_answer": "product", + "os_eval": "Incorrect.", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The pharmacy offered a product that could cure any disease, made of a new chemical and container, but the _ could hold few drugs.", + "gold_answer": "container", + "os_answer": "container", + "os_eval": "Correct", + "mcq_answer": "B.", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cracker that was given to me was worse than the cookie, because the _ was stale.", + "gold_answer": "cracker", + "os_answer": "cracker", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aria tried to fix the fence in his garden by using new paint and wood, but the _ had termites.", + "gold_answer": "wood", + "os_answer": "wood", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia bought a plant for Natalie to put in her garden, so _ sent a thank you card.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "April gets stressed when she goes waterskiing more than swimming. The _ is filled with relaxation for her.", + "gold_answer": "swimming", + "os_answer": "swimming", + "os_eval": "Correct", + "mcq_answer": "B. swimming", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I handed the documents over to immigration with the passports, but they only accepted the passports, because the _ were complete.", + "gold_answer": "passports", + "os_answer": "passports", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia is a great nurse and Cynthia is a famous doctor, blood is normal to them, _ get assisted in operations.", + "gold_answer": "Cynthia", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan checked Samuel's garage to see if the car was there. It was missing so _ was gone.", + "gold_answer": "Samuel", + "os_answer": "it", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica was arrested for growing hemp by the police but not Sarah because _ fled during the field raid.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica was arrested for growing hemp by the police but not Sarah because _ stayed during the field raid.", + "gold_answer": "Jessica", + "os_answer": "Sarah", + "os_eval": "Incorrect", + "mcq_answer": "B. Sarah", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "At the ballgame, Matthew was really thirsty and Aaron was not. _ took his beverage.", + "gold_answer": "Matthew", + "os_answer": "Aaron", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer thought it was important to neuter a dog and Rachel did not because _ knew lots of animals become homeless.", + "gold_answer": "Jennifer", + "os_answer": "Jennifer", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joseph loved to smoke cigarettes while Derrick did not although _ hated to use a hookah.", + "gold_answer": "Joseph", + "os_answer": "both", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The woman didn't need an apprasial for the desk, but wondered how much the table was worth, because the _ appeared to be common.", + "gold_answer": "desk", + "os_answer": "desk", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "John could not hear his alarm clock when he was sleeping with a headphone on his head because the _ is closer.", + "gold_answer": "headphone", + "os_answer": "headphone", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John could not hear his alarm clock when he was sleeping with a headphone on his head because the _ is farther.", + "gold_answer": "clock", + "os_answer": "sound", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The teacher was helping us study carpentry instead of studying the cooking today. The _ was mandatory.", + "gold_answer": "carpentry", + "os_answer": "lesson", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily was nine months pregnant but Tanya was not pregnant at all. _ had a beautiful baby girl.", + "gold_answer": "Emily", + "os_answer": "Emily", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan ordered the salad with added avocado, but Randy passed, because _ wasn't ok with the $3 upcharge.", + "gold_answer": "Randy", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan ordered the salad with added avocado, but Randy passed, because _ was ok with the $3 upcharge.", + "gold_answer": "Ryan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya was an adult while Samantha was young and still had room to grow , so _ gave her her old clothes.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya was an adult while Samantha was young and still had room to grow , so _ took her old clothes.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The hiking group had more food than water, so they tried to conserve the _ .", + "gold_answer": "water", + "os_answer": "water", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The hiking group had less food than water, so they tried to conserve the _ .", + "gold_answer": "food", + "os_answer": "food", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary used the lotion instead of the cream because her skin was glowing when she used the _ .", + "gold_answer": "lotion", + "os_answer": "lotion", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I wore the pants and the shirt together, but got more compliments on the _ because the shirt was uglier.", + "gold_answer": "pants", + "os_answer": "pants", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John cannot listen to his music with the volume of the television his cousin is watching. The _ is quiet.", + "gold_answer": "music", + "os_answer": "television", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The honey flows out slower from the bottle than the oil. The _ is viscous.", + "gold_answer": "honey", + "os_answer": "honey", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence volunteered to donate blood to help others, but Steven was unable to, since _ was healthy.", + "gold_answer": "Lawrence", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Reading poetry and rhymes was very entertaining for Derrick but boring for Logan, since _ was a mathematician.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura never feared anything like Erin because _ didn't have a very strong and very powerful mind.", + "gold_answer": "Erin", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Laura never feared anything like Erin because _ had a very strong and very powerful mind.", + "gold_answer": "Laura", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The farmer had more corn to harvest than yams because his cows liked eating the _ .", + "gold_answer": "yams", + "os_answer": "corn", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The farmer had more corn to harvest than yams because his cows hated eating the _ .", + "gold_answer": "corn", + "os_answer": "yams", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Adam asked Dennis to always remember to flush the toilet because _ doesn't flush it.", + "gold_answer": "Dennis", + "os_answer": "Dennis", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine knew how to make wings with better flavor than Maria, so _ waited for supper.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The shoddy bridge held secure for when the cars were getting passengers across the town to their destinations on time. However the _ were cautious.", + "gold_answer": "passengers", + "os_answer": "drivers", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The shoddy bridge held secure for when the cars were getting passengers across the town to their destinations on time. However the _ were racing.", + "gold_answer": "cars", + "os_answer": "buses", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Buying a swimming pool was great for Adam but not for Christopher because _ had a large back yard.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ann liked using oil paint rather than acrylic on canvas because _ had a shortened working time.", + "gold_answer": "acrylic", + "os_answer": "acrylic", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia was happy to give Patricia the politics section of the newspaper, because _ had little interest in the election results.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Only the bag got melted and not the wood when they were inside the flame. The _ is soft.", + "gold_answer": "bag", + "os_answer": "bag", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Only the bag got melted and not the wood when they were inside the flame. The _ is hard.", + "gold_answer": "wood", + "os_answer": "wood", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie always arrived to work after Cynthia, as _ had a shorter driving commute in the mornings.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy left smears all over the surface after cleaning Kayla's sink, because _ didn't supervise very much.", + "gold_answer": "Kayla", + "os_answer": "Kayla", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian could learn to swim with the right instruction, but it was hard to tell whether lifeguard Matthew was qualified to provide it, since _ had never swum before.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I slowly poured the milk over my bowl of cereal until the _ was gone.", + "gold_answer": "milk", + "os_answer": "milk", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They disagreed over what dog to adopt as Mary wanted a yorkie while Maria wanted a labrador. _ loved small dogs.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Devin got sick after eating the sausage, so he laid on the couch and later moved to the bed because the _ was more comfortable.", + "gold_answer": "bed", + "os_answer": "bed", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer has more money than Amy, so _ became a homeowner at a young age.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael had a unhappy relationship and was jealous because Lawrence had a great one only to find out the reason was _ slacked in adhering to standard marriage advice.", + "gold_answer": "Michael", + "os_answer": "Michael", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The salesman would only feature nice things in the house like the pool but not the wiring because the _ was fine.", + "gold_answer": "pool", + "os_answer": "wiring", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The boxes were too heavy for Benjamin to carry alone, so he asked Matthew for help. After he said yes, _ felt regret.", + "gold_answer": "Matthew", + "os_answer": "Matthew", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jasmine wanted to put the emerald on the ring but it would not fit. The _ was minuscule.", + "gold_answer": "ring", + "os_answer": "setting", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jasmine wanted to put the emerald on the ring and it would not fit. The _ was colossal.", + "gold_answer": "emerald", + "os_answer": "emerald", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John was glad the file was kept in the box before the fire outbreak started because the _ is inflammable.", + "gold_answer": "box", + "os_answer": "box", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sandra tried out a new conditioner for her hair that makes it curly, but was upset with the results because the _ was too straight.", + "gold_answer": "hair", + "os_answer": "outcome", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sandra tried out a new conditioner for her hair that makes it curly, but was upset with the results because the _ was too mild.", + "gold_answer": "conditioner", + "os_answer": "effect", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia had to pay less tax than Cynthia because _ made more money in the year.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia had to pay less tax than Cynthia because _ made less money in the year.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian's plants are showing a lot more growth than Logan's, because _ used better fertilizer.", + "gold_answer": "Brian", + "os_answer": "Brian", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James always feel weak whenever he walked the length of his street so he decided walking just the length of the lawn. The _ is long.", + "gold_answer": "street", + "os_answer": "lawn", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James always feel weak whenever he walked the length of his street so he decided walking just the length of the lawn. The _ is short.", + "gold_answer": "lawn", + "os_answer": "lawn", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The living room was cleaner than the kitchen, because we spend leess time in in the _ .", + "gold_answer": "living room", + "os_answer": "kitchen", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The living room was cleaner than the kitchen, because we spend more time in the the _ .", + "gold_answer": "kitchen", + "os_answer": "kitchen", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The girl broke Leslie's heart but not Kenneth's because _ was never in love with her.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The girl broke Leslie's heart but not Kenneth's because _ used to be in love with her.", + "gold_answer": "Leslie", + "os_answer": "Leslie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica suspected that Rebecca had become an alcoholic, but _ predicted an intervention to address the problem.", + "gold_answer": "Rebecca", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The skateboard got broken under the weight of the fat boy and his luggage. The _ is light.", + "gold_answer": "skateboard", + "os_answer": "luggage", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Lawrence was always gaining weight while Dennis was losing it as _ liked to eat too little.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stone still thudded on the floor even though it was dropped on the pillow. The _ is too light.", + "gold_answer": "pillow", + "os_answer": "pillow", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel touches the cool looking bulletproof vest of Kayla due to _ being on an investigation.", + "gold_answer": "Kayla", + "os_answer": "Kayla", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Rachel touches the cool looking bulletproof vest of Kayla due to _ being on a ride along.", + "gold_answer": "Rachel", + "os_answer": "her", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Remodeling the kitchen came naturally to Michael but not William because _ had experience being a carpenter's apprentice.", + "gold_answer": "Michael", + "os_answer": "Michael", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Selena wanted the hairdresser to cut her hair with a razor instead of a clipper, because the _ always gave an edgier look.", + "gold_answer": "razor", + "os_answer": "razor", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil cut trees down into lumber every year unlike Logan because _ lives in the city.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "B. Logan", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil cut trees down into lumber every year unlike Logan because _ lives out in the countryside.", + "gold_answer": "Neil", + "os_answer": "Neil", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We couldn't extract the blood but got the plasma out, since the _ was reachable by the needle.", + "gold_answer": "plasma", + "os_answer": "vein", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Happiness was most important to Nick but money was most important to William. _ valued a good life.", + "gold_answer": "Nick", + "os_answer": "Both", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sound of the foot was clearly audible from the street because the _ is quiet.", + "gold_answer": "street", + "os_answer": "area", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "To remove the stain he reached for soap first, then got up and got a bowl. The _ was close by.", + "gold_answer": "soap", + "os_answer": "bowl", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "To remove the stain he reached for soap first, then got up and got a bowl. The _ was far away.", + "gold_answer": "bowl", + "os_answer": "bowl", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle asked Brett for some tips on healthy eating because _ has recently lost weight.", + "gold_answer": "Brett", + "os_answer": "Brett", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The architect tried to build the room inside the house but the _ was too large.", + "gold_answer": "room", + "os_answer": "space", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The architect tried to build the room inside the house but the _ was too small.", + "gold_answer": "house", + "os_answer": "space", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "William was a huge animal rights activist but Randy couldn't care less so _ hated leather.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "A. William", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William was a huge animal rights activist but Randy couldn't care less so _ loved leather.", + "gold_answer": "Randy", + "os_answer": "Randy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The school needed a new auditorium and a new teacher's lounge. They built the _ first because it benefited the faculty more.", + "gold_answer": "teacher's lounge", + "os_answer": "lounge", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cashier was trained that real $100 bills had sharp lines and counterfeit ones might be blurry, so she accepted the _ bill.", + "gold_answer": "sharp", + "os_answer": "real", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The pressure of finding new jobs is harder than finding new apartments. The _ are high in numbers.", + "gold_answer": "apartments", + "os_answer": "jobs", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "She couldn't wear the bra, unlike the shirt, because the _ was the right size.", + "gold_answer": "shirt", + "os_answer": "shirt", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria wanted to play poker with Jennifer because _ was a better player and she won a lot of money.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Angela was a homebody while Amy loved to travel the world whenever they could. _ took a vacation to the beach over the summer.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela was a homebody while Amy loved to travel the world whenever they could. _ took a staycation at home over the summer.", + "gold_answer": "Angela", + "os_answer": "Angela", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth was really scared to have surgery but Neil was very brave about it. _ was under a lot of stress.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel went to Michael 's house and consumed a lot of alcohol, so _ had to ride back home as a passenger.", + "gold_answer": "Joel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the new restaurant, Betty convinced Lindsey to try fried brussel sprouts. _ was relieved when she tried new things.", + "gold_answer": "Betty", + "os_answer": "Lindsey", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jane received a pet tortoise and an aquarium as a birthday gift, but the _ was too small.", + "gold_answer": "aquarium", + "os_answer": "aquarium", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She chose the black car over the green car, because the _ has more brighter color.", + "gold_answer": "green car", + "os_answer": "green", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + } +] \ No newline at end of file