diff --git "a/Large/Claude/Winogrande.json" "b/Large/Claude/Winogrande.json" new file mode 100644--- /dev/null +++ "b/Large/Claude/Winogrande.json" @@ -0,0 +1,11405 @@ +[ + { + "question": "Sarah was a much better surgeon than Maria so _ always got the easier cases.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah was a much better surgeon than Maria so _ always got the harder cases.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They were worried the wine would ruin the bed and the blanket, but the _ was't ruined.", + "gold_answer": "bed", + "os_answer": "bedspread", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Terry tried to bake the eggplant in the toaster oven but the _ was too big.", + "gold_answer": "eggplant", + "os_answer": "vegetable", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At night, Jeffrey always stays up later than Hunter to watch TV because _ wakes up late.", + "gold_answer": "Jeffrey", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cat of Sarah has some mouth problems, so she takes it to see Maria. _ is a responsible cat owner.", + "gold_answer": "Sarah", + "os_answer": "Sarah", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The home that my parents had when I was in school was a lot nicer than my house now because the _ was sophisticated.", + "gold_answer": "home", + "os_answer": "d\u00e9cor", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The home that my parents had when I was in school was a lot nicer than my house now because the _ is trashy.", + "gold_answer": "house", + "os_answer": "neighborhood", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie has a rich husband and lots of money, Jennifer is poor _ needs to make her clothes.", + "gold_answer": "Jennifer", + "os_answer": "and", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe immediately went to bakery before the bank because the _ had a limited supply of what he wanted.", + "gold_answer": "bakery", + "os_answer": "bakery", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe immediately went to bakery before the bank because the _ had a substantial supply of what he wanted.", + "gold_answer": "bank", + "os_answer": "bakery", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I had to read an entire story for class tomorrow. Luckily, the _ was canceled.", + "gold_answer": "class", + "os_answer": "class", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I had to read an entire story for class tomorrow. Luckily, the _ was short.", + "gold_answer": "story", + "os_answer": "passage", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He had enough time between classes to go to a cafe or to the library. He went to the _ because his paper could wait.", + "gold_answer": "cafe", + "os_answer": "cafe", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He had enough time between classes to go to a cafe or to the library. He went to the _ because his paper was due soon.", + "gold_answer": "library", + "os_answer": "library", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey like to read graphic novels but Natalie liked classic literature to read. _ bought the new Frank Miller comic at the book store.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael just bought brand new wheels for his truck unlike Leslie because _ wheels were new and perfect.", + "gold_answer": "Leslie", + "os_answer": "his", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael just bought brand new wheels for his truck unlike Leslie because _ wheels were old and used.", + "gold_answer": "Michael", + "os_answer": "her", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Leslie was nervous around parrots but Neil was not, since _ was bitten by a bird early in life.", + "gold_answer": "Leslie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christmas was a special holiday to Eric but not Adam since _ was a Jew.", + "gold_answer": "Adam", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "To make frosting I needed pudding that was at a store 15 minutes away but pre-made frosting was at a store 5 minutes away. The _ was closer.", + "gold_answer": "frosting", + "os_answer": "store", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin was chosen instead of Brett to be the makeup artist for the play because _ was less experienced.", + "gold_answer": "Brett", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia violated the rights of Amy, because _ had too much passivity with other people.", + "gold_answer": "Amy", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They had to eat a lot to gain the strength they had lost and be able to work, the _ was too much.", + "gold_answer": "work", + "os_answer": "fatigue", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They had to eat a lot to gain the strength they had lost and be able to work, the _ was too little.", + "gold_answer": "strength", + "os_answer": "ration", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The roof of Rachel's home is old and falling apart, while Betty's is new. The home value of _ is lower.", + "gold_answer": "Rachel", + "os_answer": "Rachel's", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "All the clutter in the house excited Leslie but not Derrick because cleaning energized _ very much.", + "gold_answer": "Leslie", + "os_answer": "her", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The portions of food today were bigger than the sizes yesterday because the _ fed more people.", + "gold_answer": "portions", + "os_answer": "caterers", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Since Craig threw aluminum cans in the trash and Benjamin recycled, _ was environmentally irresponsible.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine was going to Jessica's house to do some cleaning in the kitchen, because _ was a energetic person.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The students were at their desks taking tests with pencils, they used the _ to hold the papers.", + "gold_answer": "desks", + "os_answer": "paperweights", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary thought poodles were a cool dog but Rachel thought Great Danes were cooler. _ bought a small dog bed for their pet.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary thought poodles were a cool dog but Rachel thought Great Danes were cooler. _ bought a gigantic dog bed for their pet.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Leslie had a lot of issues that Kyle was tired of dealing with, so _ felt abandoned when they finally moved out.", + "gold_answer": "Leslie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica enjoyed a simple, basic life with Betty, but _ was bored having a quiet existence.", + "gold_answer": "Betty", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I wanted to build a bathroom on the third floor of the house but I couldn't because the _ would be too full.", + "gold_answer": "floor", + "os_answer": "rafters", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Joel researched laws and helped to open a preschool for Eric. Because _ is very good with kids.", + "gold_answer": "Eric", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya told Emily she couldn't come to work because her cat had an infection, but _ was lying.", + "gold_answer": "Tanya", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela thinks her husband might be cheating with Lindsey, and _ confesses at the dinner party.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald's understanding of math isn't as good as Joseph's, so _ is more likely a professor.", + "gold_answer": "Joseph", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian was jealous of Brett's new car because _ couldn't afford to buy a new car.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man used his eyes to read the letters but the _ were too small.", + "gold_answer": "letters", + "os_answer": "words", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jill was on a budget so she only bought a new dress for the ceremony and wore an old hat. She figured the _ would be less noticeable.", + "gold_answer": "hat", + "os_answer": "hat", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jill was on a budget so she only bought a new dress for the ceremony and wore an old hat. She figured the _ would be more noticeable.", + "gold_answer": "dress", + "os_answer": "dress", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "On Monday, Patricia made Felicia eggs for an early breakfast, but _ does not like fried eggs.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Since Craig wears clear contacts and William wears colored ones, it is safe to assume that _ loves the color of their eyes.", + "gold_answer": "Craig", + "os_answer": "William", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Since Craig wears clear contacts and William wears colored ones, it is safe to assume that _ dislikes the color of their eyes.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easy for Angela to become a vegetarian although Kayla couldn't do it. _ really missed the taste of chicken.", + "gold_answer": "Kayla", + "os_answer": "She", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter was a better baker than Logan so _ made the kitchen a mess when they tried to make an apple pie.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya spent more on the children's birthday party than Amy. _ thought a magician was a good use of funds.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Judy bought new brushes to paint the etched glasses crack but it didn't fit. The _ was too wide.", + "gold_answer": "brush", + "os_answer": "crack", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Judy bought new brushes to paint the etched glasses crack but it didn't fit. The _ was too narrow.", + "gold_answer": "crack", + "os_answer": "aperture", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I look forward to the Sunday newspaper so I can look at the comics. This is the only reason I still get the _ in this day and age.", + "gold_answer": "newspaper", + "os_answer": "newspaper", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer was more of a morning person than Natalie although _ always went to bed early and got a good night's rest.", + "gold_answer": "Natalie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer was more of a morning person than Natalie because _ always went to bed early and got a good night's rest.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Alcohol is a love of Matthew's, but Ryan can't stand the stuff because _ is a sober alcoholic.", + "gold_answer": "Ryan", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe brought the horse out to the country quite a distance and gave him food but the _ was too much.", + "gold_answer": "distance", + "os_answer": "exertion", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Randy gave their heart to Brian, and _ soon told them that they should have kept their heart to themselves.", + "gold_answer": "Brian", + "os_answer": "Brian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nick wanted to play a game on the floor, but Dennis was hesitant because of his knees. _ was disappointed.", + "gold_answer": "Nick", + "os_answer": "Nick", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Although she was being prosecuted, Monica was welcomed into the sanctuary of the church by Samantha because _ was a sinful criminal.", + "gold_answer": "Monica", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The battle was less fierce than the great war, because the _ lasted one year.", + "gold_answer": "war", + "os_answer": "conflict", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura used too much super glue on Erins hands, so _ needed to get to the doctor to separate their hands.", + "gold_answer": "Erin", + "os_answer": "they", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James panicked when his phone fell on the table thinking it will break but the _ is soft.", + "gold_answer": "table", + "os_answer": "tablecloth", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James panicked when his phone fell on the table thinking it will break but the _ is strong.", + "gold_answer": "phone", + "os_answer": "screen protector", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "John cannot touch the cup as it was just brought out of the refrigerator. He wanted some air to blow around it. The _ is very warm.", + "gold_answer": "air", + "os_answer": "air", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The fireman used several rags to polish the nozzles on the fire hose; when he was done the _ were dirty.", + "gold_answer": "rags", + "os_answer": "rags", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary wanted to get another piercing in her ear, but the _ was much too tiny.", + "gold_answer": "ear", + "os_answer": "lobe", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Mary wanted to get another piercing in her ear, but the _ was much too huge.", + "gold_answer": "piercing", + "os_answer": "gauge", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura just loved the taste of green beans but Felicia hated the taste of them. _ didn't have a second serving.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The bartender cut Carrie off but continued to serve Emily because _ was too drunk.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Blaze always wore a t-shirt instead of a shirt because he thought that the _ was stuffy and old fashioned.", + "gold_answer": "shirt", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The paint would melt in the sun, so we used a varnish instead, since the _ was susceptible to heat.", + "gold_answer": "paint", + "os_answer": "former", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I tried to make mini lamps by using glow sticks in mason jars, but had to get larger jars because the _ were too big.", + "gold_answer": "glow sticks", + "os_answer": "sticks", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel always liked to turn the heater up higher than Joseph did for the reason that _ was never cold.", + "gold_answer": "Joseph", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Joel always liked to turn the heater up higher than Joseph did for the reason that _ was always cold.", + "gold_answer": "Joel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The teen found the new hat was no substitute for his cool shirt. The _ was just cool to wear to school.", + "gold_answer": "shirt", + "os_answer": "shirt", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary was helping Patricia's daughter put on makeup but _ watches a lot of makeup tutorials.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Mary was helping Patricia's daughter put on makeup because _ watches a lot of makeup tutorials.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He wanted to kill time at the house instead of the playground, because everyone at the _ was fun.", + "gold_answer": "house", + "os_answer": "latter", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron didn't know Dennis had a peanut allergy, so when _ made peanut chicken an ambulance was called.", + "gold_answer": "Aaron", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron didn't know Dennis had a peanut allergy, so when _ ate peanut chicken an ambulance was called.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "God liked to control the day and the night, but the _ was too bright.", + "gold_answer": "day", + "os_answer": "sun", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Brett asked Joel for advice and guidance about waxing his mustache, and afterwards _ felt burdened.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The filter in the living room needed to be changed more often than the one in the bedroom because the _ was dirtier.", + "gold_answer": "living room", + "os_answer": "air", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The filter in the living room needed to be changed more often than the one in the bedroom because the _ was cleaner.", + "gold_answer": "bedroom", + "os_answer": "air", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy went over to the waiting room at the hospital to calm Samantha because _ was placid.", + "gold_answer": "Amy", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Megan forgot to buy deodorant at the store so they borrowed Jessica's deodorant and _ never found out.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan forgot to buy deodorant at the store so they borrowed Jessica's deodorant and _ hoped they never found out.", + "gold_answer": "Megan", + "os_answer": "secretly", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy thought she was the mirror image of Natalie , but _ could not be convinced to see the similarity.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy thought she was the mirror image of Natalie , but _ could not persuade her to see the similarity.", + "gold_answer": "Amy", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I helped my sister find her gold necklace. She couldn't wear her woven necklace to the ball because the _ was so casual.", + "gold_answer": "woven necklace", + "os_answer": "style", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily never had as much money to spend as Carrie, because _ had a good job.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wooden doors at my friends work are worse than the wooden desks at my work, because the _ material is cheaper.", + "gold_answer": "doors", + "os_answer": "door", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The wooden doors at my friends work are worse than the wooden desks at my work, because the _ material is stronger.", + "gold_answer": "desks", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The arrow stuck to the bark but not the stone because the _ was flimsy.", + "gold_answer": "bark", + "os_answer": "arrow", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The arrow stuck to the bark but not the stone because the _ was hard.", + "gold_answer": "stone", + "os_answer": "stone", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The leg of the pig body stuck out of the grave where it was buried because the _ is large.", + "gold_answer": "body", + "os_answer": "femur", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The sheet recovered can easily be hiding between the space in the door. The _ is thin.", + "gold_answer": "sheet", + "os_answer": "sheet", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sheet recovered can easily be hiding between the space in the door. The _ is wide.", + "gold_answer": "space", + "os_answer": "gap", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mike doesn't like the table in his living room as much as the couch. The _ resonates with the other decorations.", + "gold_answer": "couch", + "os_answer": "couch", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven believes they can buy happiness but Craig thinks otherwise as _ is very realistic.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven believes they can buy happiness but Craig thinks otherwise as _ is very materialistic.", + "gold_answer": "Steven", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They brought the cornhole supplies to the camp site so they could play while adults cooked dinner. The boys really enjoyed the _ after the game.", + "gold_answer": "dinner", + "os_answer": "s'mores", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The game of chess was easy to play for Angela but not Rebecca because _ had a analytical mind.", + "gold_answer": "Angela", + "os_answer": "Angela", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The game of chess was easy to play for Angela but not Rebecca because _ did not have an analytical mind.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "To pay for dinner, he used the credit card rather than cash. The _ was not available.", + "gold_answer": "cash", + "os_answer": "latter", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The plan devised by Christine to get Kayla to like them failed, as _ did not really try it.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Since the diabetic woman had to limit her sugar intake, she ignored the pie and had a cookie instead because the _ was full of sugar.", + "gold_answer": "pie", + "os_answer": "pie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor offered to treat the patient's illness quickly with surgery or slowly with diet, and the patient refused the _ because he felt it was dangerous.", + "gold_answer": "surgery", + "os_answer": "surgery", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Throughout the practice Rachel pushed the limits of Megan to get ready for the game because _ was the coach.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Throughout the practice Rachel pushed the limits of Megan to get ready for the game because _ was the athlete.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah was quickly promoted to manager over Kayla, because _ excelled at angering other people.", + "gold_answer": "Kayla", + "os_answer": "Kayla", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett was browsing the internet while he found the information unlike Randy, _ prefers using books.", + "gold_answer": "Randy", + "os_answer": "who", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis knows that Jeffrey is an animal lover and _ knows he wants to go to the zoo to see them.", + "gold_answer": "Dennis", + "os_answer": "also", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty drank chocolate shakes while Elena drank carrot juice, and _ had a very healthy diet.", + "gold_answer": "Elena", + "os_answer": "Elena", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty drank chocolate shakes while Elena drank carrot juice, and _ had a very unhealthy diet.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie posted their sofa for sale on Craigslist, and had received an offer they had to decline because the _ is valuable.", + "gold_answer": "sofa", + "os_answer": "antique", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I picked up some leaves to put in the books and dry, but they didn't fit because the _ were too small.", + "gold_answer": "books", + "os_answer": "books", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I picked up some leaves to put in the books and dry, but they didn't fit because the _ were too massive.", + "gold_answer": "leaves", + "os_answer": "leaves", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The president had their speech at the auditorium rather than the park because the _ was bigger.", + "gold_answer": "auditorium", + "os_answer": "capacity", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The president had their speech at the auditorium rather than the park because the _ was smaller.", + "gold_answer": "park", + "os_answer": "venue", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Steven found that their T-shirt had shrunk in the laundry, Robert's first reaction was to laugh, and _ then became angry.", + "gold_answer": "Steven", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Steven found that their T-shirt had shrunk in the laundry, Robert's first reaction was to laugh, and _ became apologetic.", + "gold_answer": "Robert", + "os_answer": "then", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "She counted her calories for her diet and found she needed more so she ate a brownie instead of an apple since the _ has fewer.", + "gold_answer": "apple", + "os_answer": "apple", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia liked wearing glasses more than braces because she could take the _ off after two years.", + "gold_answer": "braces", + "os_answer": "glasses", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia liked wearing glasses more than braces because she could take the _ off every day.", + "gold_answer": "glasses", + "os_answer": "glasses", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Randy's hair is dry when compared to Ian's due to _ using a strong conditioner.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam was a crook and not a law-abiding citizen like Joseph, so it was surprising that _ was the one with a restraining order against him.", + "gold_answer": "Joseph", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam was law-abiding and not a crook like Joseph, so it was surprising that _ was the one with a restraining order against him.", + "gold_answer": "Adam", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wages at the factory were lower than the wages at the plant since it was more safe to work at the _ .", + "gold_answer": "factory", + "os_answer": "factory", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The health of Joel was stronger than that of William due to _ being a cigar smoker.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easy for Amy but not Rachel to create a meal because _ had taken woodshop in school.", + "gold_answer": "Rachel", + "os_answer": "Amy", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Ann's babies were crying, and she could give them a bottle or a rattle. She tried the _ first in case they were bored.", + "gold_answer": "rattle", + "os_answer": "rattle", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rebecca thought Disney movies were the best thing to watch but Samantha like horror movies better. _ rented Saw from Redbox.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The house of Aaron took some damage from the storm but not Michael's house, because _ lived farther away.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer dragged Felicia along to a self help workshop about how to succeed, because _ wanted some company.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary can read the clock in the room at night without the light even though the _ is dark.", + "gold_answer": "room", + "os_answer": "room", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan reads a lot, while Donald almost never picks up a book because _ is a plumber.", + "gold_answer": "Donald", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan reads a lot, while Donald almost never picks up a book because _ is a student.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle wanted to crush Ryan 's dreams of becoming a movie actor. _ was a threat to him.", + "gold_answer": "Ryan", + "os_answer": "He", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wind during the last hurricane tried to knock over their new house, but the _ was too strong.", + "gold_answer": "house", + "os_answer": "foundation", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty made the choice to reduce Samantha's salary after _ started cutting back on efficiency.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "During the rescue mission, Maria pulled Rebecca away from the minefield since _ was a civilian.", + "gold_answer": "Rebecca", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The jewelry sold for less than the baseball card did since the _ was very common.", + "gold_answer": "jewelry", + "os_answer": "jewelry", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura brought extensions to Monica at the salon, so that _ could get their dreads treated professionally.", + "gold_answer": "Laura", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Laura brought extensions to Monica at the salon, so that _ could treat their dreads professionally.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The installation process was simpler for the cable over the internet because the man had never installed the _ previously.", + "gold_answer": "internet", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The installation process was simpler for the cable over the internet because the man had already installed the _ previously.", + "gold_answer": "cable", + "os_answer": "hardware", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica wanted Mary to help them decorate their new house because _ asked them not to do it alone.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William went on the ride more than Matthew did because _ thought it was scary.", + "gold_answer": "Matthew", + "os_answer": "Matthew", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan took Monica to a wood shack in the mountains, because _ was a kidnapper trying to hide.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the beauty salon, Angela preferred to work on her eyebrows instead of her eyelashes because the _ were already worked on.", + "gold_answer": "eyelashes", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samuel tried unsuccessfully to get Brett to skip school because _ was a truant that didn't follow the rules.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kayla prepared a foot soak bath for Cynthia for their birthday so _ is pouring in water.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man looked at the sundial since a watch or clocktower was not at his disposal, having lost the _ .", + "gold_answer": "watch", + "os_answer": "former", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter chose to eat a banana for breakfast every morning but Michael did not because _ is unconcerned about their health.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The IRS sent Tim a letter informing him of the audit, which could occure at the house or the office. Tim chose a comfortable setting of the _ .", + "gold_answer": "house", + "os_answer": "house", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia decided to buy Felicia dinner because they had been through a lot and _ just inherited some money.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Patricia decided to buy Felicia dinner because they had been through a lot and _ just lost some money.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah thought that Elena was overpacking for Hawaii, because _ had a very full suitcase.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William liked to be outside more than Kyle so _ spent time arguing against getting a pool.", + "gold_answer": "Kyle", + "os_answer": "Kyle", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William liked to be outside more than Kyle so _ spent time arguing for getting a pool.", + "gold_answer": "William", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "John never mentioned his canoe, but had a long conversation with Ron about the raft, because John rarely used the _ .", + "gold_answer": "canoe", + "os_answer": "canoe", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica gives Jessica a book about posture, because _ has been trying to get better at ballet dancing.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My gun was inspected with a cloth to make sure it worked fine. The _ was hard.", + "gold_answer": "gun", + "os_answer": "wipe", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My gun was inspected with a cloth to make sure it worked fine. The _ was soft.", + "gold_answer": "cloth", + "os_answer": "cloth", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the estate sale, John saw the hammer was more affordable than the screwdriver, because the _ was used.", + "gold_answer": "hammer", + "os_answer": "hammer", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "At the estate sale, John saw the hammer was more affordable than the screwdriver, because the _ was brand new.", + "gold_answer": "screwdriver", + "os_answer": "screwdriver", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The temperature in winter is much different than summer, the _ is always lower.", + "gold_answer": "winter", + "os_answer": "temperature", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sliding glass door was broken when Eric pushed Ian through it because _ is a pushover.", + "gold_answer": "Ian", + "os_answer": "it", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman used a gentle technique when painting the urn but applied more pressure when painting the vase, because the _ was less fragile.", + "gold_answer": "Vase", + "os_answer": "vase", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman used a gentle technique when painting the urn but applied more pressure when painting the vase, because the _ was more fragile.", + "gold_answer": "Urn", + "os_answer": "urn", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tina made a schedule to keep track of her work and school obligations. She preferred to focus on the _ because she wanted to learn.", + "gold_answer": "school", + "os_answer": "academics", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica wants to protect herself from infectious diseases so she goes to doctor Samantha, because _ is careful.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kerry was running later when he took his car to work than when he took a taxi because he ran into more traffic in the _ .", + "gold_answer": "car", + "os_answer": "evening", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The history of the village is more intriguing than the history of the city because the _ is very new.", + "gold_answer": "city", + "os_answer": "city", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel told Patricia to pick up some baby powder at the store because _ had sweaty feet.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel told Patricia to pick up some baby powder at the store but _ had sweaty feet too.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil looked all over the neighborhood for their missing dog until Samuel called and _ got their dog back.", + "gold_answer": "Neil", + "os_answer": "found", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I did not buy the color pink rose flowers for my wedding because the _ is too bright.", + "gold_answer": "color", + "os_answer": "hue", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I started playing drums young. Sometimes I played in the garage and sometimes my room, but my parents preferred knowing I was in the _ .", + "gold_answer": "garage", + "os_answer": "house", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At work, Mary uses a broiler a lot, but Rebecca uses a chainsaw. That's because _ is a tree cutter.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sand and water in the fish tank were very dirty, so the _ needed to be filtered.", + "gold_answer": "water", + "os_answer": "water", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sand and water in the fish tank were very dirty, so the _ needed to be scrubbed.", + "gold_answer": "sand", + "os_answer": "aquarium", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Warts appeared on Jerry's limbs after he went through the jungle because the _ were infectious.", + "gold_answer": "warts", + "os_answer": "microbes", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Pete preferred to use the sheet to the blanket, because the _ was much hotter.", + "gold_answer": "blanket", + "os_answer": "weather", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She preferred a globe of the world made of PVC instead of plastic, because the _ made it look expensive.", + "gold_answer": "PVC", + "os_answer": "material", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "People think _ is embarassed, because Samantha made snide comments about the shirt Rebecca was wearing.", + "gold_answer": "Rebecca", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam's mindset was a lot stronger than William's because _ was able to control it.", + "gold_answer": "Adam", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The puncture healed quicker than the cut because the _ was a more superficial wound.", + "gold_answer": "puncture", + "os_answer": "puncture", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the beach, Emily collected some seashells for her mother Maria. _ polished the seashells before giving them away.", + "gold_answer": "Emily", + "os_answer": "She", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Using a needle to sew together both the leather and silk was difficult. The _ was hard get through.", + "gold_answer": "leather", + "os_answer": "leather", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The maid took away a cozy blanket from Lawrence but not Nick because _ was very hot.", + "gold_answer": "Lawrence", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The maid took away a cozy blanket from Lawrence but not Nick because _ was very cold.", + "gold_answer": "Nick", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The photo came out of the Polaroid camera and fell onto the tray, so now the _ is lighter.", + "gold_answer": "camera", + "os_answer": "exposure", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Brett asked Nelson where they were because _ had no idea after he fell asleep.", + "gold_answer": "Brett", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett asked Nelson where they were because _ had had been driving after he fell asleep.", + "gold_answer": "Nelson", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Leslie coughed more when they were eating their food than Adam although there was more seasoning in the food of _ .", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig gifted Eric a new picnic table, because _ borrowed some money a while ago.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Craig gifted Eric a new picnic table, because _ lent him some money a while ago.", + "gold_answer": "Eric", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria was eager to make the big sale to Sarah , as _ needed the money that day.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria was eager to make the big sale to Sarah , as _ had the money that day.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Robert took voice lessons from Randy, because _ was known to be on American Idol.", + "gold_answer": "Randy", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Whilst on the beach Cynthia loved to wear a bikini but Laura did not because _ had a flat stomach.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Whilst on the beach Cynthia loved to wear a bikini but Laura did not because _ had a fat stomach.", + "gold_answer": "Laura", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Paint was applied to the chairs but not the tables, since the _ were new.", + "gold_answer": "tables", + "os_answer": "tables", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Paint was applied to the chairs but not the tables, since the _ were old.", + "gold_answer": "chairs", + "os_answer": "chairs", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "In high school Matthew was most popular among the teachers as were Steven was among the students, _ was liked by adolescents.", + "gold_answer": "Steven", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The shoe james bought got pinched by a nail while jogging because the _ is soft.", + "gold_answer": "shoe", + "os_answer": "sole", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence liked watching foreign movies with subtitles unlike Jason because _ criticized the original language of the film.", + "gold_answer": "Jason", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence liked watching foreign movies with subtitles unlike Jason because _ appreciated the original language of the film.", + "gold_answer": "Lawrence", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The fishing line snagged and broke on a rock because the _ was too heavy.", + "gold_answer": "rock", + "os_answer": "sinker", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Johnny likes fruits more than vegetables in his new keto diet because the _ are saccharine.", + "gold_answer": "fruits", + "os_answer": "fruits", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria was still grieving the death of a friend more than Elena, because _ had a more distant relationship with the friend.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria was still grieving the death of a friend more than Elena, because _ had a very close relationship with the friend.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The bill had extra charges for past due and hookup. I owe the _ for being a new customer.", + "gold_answer": "hookup", + "os_answer": "company", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia had a much harder life than Amy, so when _ said life was good, it was an unusual sentiment.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The courage of Ian was a lot stronger than Michael because _ had been through a lot in life.", + "gold_answer": "Ian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The chef fried less mushrooms than tomatoes because the _ were ordered frequently at the restaurant.", + "gold_answer": "tomatoes", + "os_answer": "tomatoes", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence dealt the cards to Joseph at the blackjack table, because _ was a professional player.", + "gold_answer": "Joseph", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "You can grow cilantro in a garden or buy it at the store, but the _ variety will taste bland because it will be older.", + "gold_answer": "store", + "os_answer": "store-bought", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "You can grow cilantro in a garden or buy it at the store, but the _ variety will taste better because it will be fresh.", + "gold_answer": "garden", + "os_answer": "homegrown", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha strictly followed their diet while Sarah ate what they felt like, and _ ate chicken and broccoli all week.", + "gold_answer": "Samantha", + "os_answer": "they", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It seemed more likely that Brett would wear a fedora rather than Justin because _ was known to dress stylishly.", + "gold_answer": "Brett", + "os_answer": "Brett", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It seemed more likely that Brett would wear a fedora rather than Justin because _ did not often dress stylishly.", + "gold_answer": "Justin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William did not mind if it took them a while to prepare a meal but Adam did because _ was very meticulous.", + "gold_answer": "William", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The wall of the house looks nicer than the one in the garage despite that the _ was painted more recently.", + "gold_answer": "garage", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kevin ate large amounts of food but not Adam. _ didn't have to get checked to see if they had a tapeworm.", + "gold_answer": "Adam", + "os_answer": "Kevin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The computer of Victoria ran faster than that of Carrie because _ downloaded less files.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The computer of Victoria ran slower than that of Carrie because _ downloaded less files.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "My face was more familiar than it was at the bar than the gym because I went to the _ very rarely.", + "gold_answer": "gym", + "os_answer": "gym", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My face was more familiar than it was at the bar than the gym because I went to the _ several times a week.", + "gold_answer": "bar", + "os_answer": "bar", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Randy showed Samuel the abused horse that he rescued from the shelter. _ was proud of his friend.", + "gold_answer": "Samuel", + "os_answer": "He", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena enjoyed yoga classes while Amy preferred other forms of exercise; this was because _ was flexible.", + "gold_answer": "Elena", + "os_answer": "Elena", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena enjoyed yoga classes while Amy preferred other forms of exercise; this was because _ was inflexible.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cake that Lawrence tried to bake for Ryan didn't rise, and _ felt forgiving abut it.", + "gold_answer": "Ryan", + "os_answer": "neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie took a longer time to take a bath than Jennifer because _ liked relaxing in the tub.", + "gold_answer": "Natalie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily said that Victoria's hijab was silly and old fashioned. _ heard some very offensive things.", + "gold_answer": "Victoria", + "os_answer": "Victoria", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily said that Victoria's hijab was silly and old fashioned. _ said some very offensive things.", + "gold_answer": "Emily", + "os_answer": "Emily", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary was more reliable and hardworking than Rachel, but to be fair, _ had a better foundation as a child.", + "gold_answer": "Mary", + "os_answer": "the", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "It is likely that Donald but not Jason would get the job promotion because _ never stayed late and never did extra work.", + "gold_answer": "Jason", + "os_answer": "Jason", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "A background check was performed on Natalie by Lindsey due to _ being a nanny.", + "gold_answer": "Natalie", + "os_answer": "her", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We reached a settlement with the company but were roadblocked by the court. The _ was just more inflexible in its dealings.", + "gold_answer": "court", + "os_answer": "judiciary", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man paid cash for the phone but purchased the tablet with credit because the _ was pricy.", + "gold_answer": "Tablet", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man paid cash for the phone but purchased the tablet with credit because the _ was inexpensive.", + "gold_answer": "Phone", + "os_answer": "phone", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "There are lots of pills in the home of Neil, but none in the house of Logan, so _ must be healthy.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie asked Betty where the children were on the playground because _ could not see them.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "the region was too crowded for our comfortable stay for all the people sent there , the _ were too small..", + "gold_answer": "region", + "os_answer": "quarters", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Samantha had to get car insurance and Jessica did not because _ just got a new car.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stain was lighter on Jason's shirt than Donald's because _ spilled red wine and not white wine.", + "gold_answer": "Donald", + "os_answer": "Donald", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The stain was darker on Jason's shirt than Donald's because _ spilled red wine and not white wine.", + "gold_answer": "Jason", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily decided to eat a lot more yucca than Carrie did. _ was still hungry.", + "gold_answer": "Carrie", + "os_answer": "She", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily decided to eat a lot more yucca than Carrie did. _ was no longer hungry.", + "gold_answer": "Emily", + "os_answer": "She", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian needed to adjust the mirror and Craig did not because _ was shorter than the owner of the car.", + "gold_answer": "Ian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian needed to adjust the mirror and Craig did not because _ was the same height as the owner of the car.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The commodities trader decided to buy wool and sell cotton because the _ was priced low.", + "gold_answer": "wool", + "os_answer": "former", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The commodities trader decided to buy wool and sell cotton because the _ was priced high.", + "gold_answer": "cotton", + "os_answer": "former", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I was told my eyes are failing so I need to get glasses or contacts. I don't think I'll get the contacts since the _ seem less comfortable.", + "gold_answer": "contacts", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It is an article of faith that the paper is more important than the exam , even though the _ weighs less heavily on the grade.", + "gold_answer": "paper", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The teenager got a job at the supermarket instead of at the diner because he had to work during school at the _ .", + "gold_answer": "diner", + "os_answer": "diner", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The tip of James pencil was breaking while writing on the paper sheet. The _ is weak.", + "gold_answer": "pencil", + "os_answer": "lead", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William lived in a rougher part of town than Eric, so _ trained their dog as a guard dog.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman moved the urn in front of the vase on the shelf because the _ was attractive.", + "gold_answer": "urn", + "os_answer": "juxtaposition", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jennifer returned the pan to Sarah because _ had borrowed it from her for the potluck party.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer returned the pan to Sarah because _ had loaned it to her for the potluck party.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor told Kevin to exercise more often but not Neil. _ had always been lazy and unmotivated.", + "gold_answer": "Kevin", + "os_answer": "Kevin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor told Kevin to exercise more often but not Neil. _ had always been active and self-motivated.", + "gold_answer": "Neil", + "os_answer": "Neil", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I always wonder how people prefer reading in a library instead of at the house because the lack of people at the _ would make it easier to concentrate.", + "gold_answer": "house", + "os_answer": "house", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I always wonder how people prefer reading in a library instead of at the house because the amount of people at the _ would make it hard to concentrate.", + "gold_answer": "library", + "os_answer": "library", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The blood sample on the slide was more helpful than the one in the vial, because the _ had been kept pristine.", + "gold_answer": "slide", + "os_answer": "slide", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Ryan had to use a calculator on the test but Michael didn't because _ was very bad at math.", + "gold_answer": "Ryan", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The air in the shop was better than in the garage, because the _ was highly purified.", + "gold_answer": "shop", + "os_answer": "ventilation", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He went to put his pocket watch into his pocket, but realized the chain had broke. Without it, the _ doesn't function correctly.", + "gold_answer": "pocket watch", + "os_answer": "fob", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason was easily scared, so he watched sci-fi movies instead of horror movies because the _ were not scary.", + "gold_answer": "sci-fi movies", + "os_answer": "aliens", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine accepted the over night challenge from Laura, because _ had a better chance of winning.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman kept the bikini but returned the top, because the _ was the right size.", + "gold_answer": "bikini", + "os_answer": "bottom", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman kept the bikini but returned the top, because the _ was the wrong size.", + "gold_answer": "top", + "os_answer": "top", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria taught Elena how to count in Malay for their trip, because _ was a visitor of the island.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela beat Mary in the weightlifting competition, but it wasn't fair. _ had been taking steroids.", + "gold_answer": "Angela", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty assisted Kayla with the daily analysis task they were assigned and then _ ask for help herself.", + "gold_answer": "Betty", + "os_answer": "proceeded", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The store sold Michael a fake phone but not Eric so _ could still make a call.", + "gold_answer": "Eric", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The juice from the mango fruit could not fill up the cup because the _ is small.", + "gold_answer": "mango", + "os_answer": "quantity", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jeri was deciding what to bring to a potluck and picked cookies over a pie because the _ could be shared with fewer people.", + "gold_answer": "pie", + "os_answer": "pie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Brian asked Nick to feed their rabbit,because _ was planning on going on vacation to Disney for a week.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James listened carefully to the conversation from the other room but all he could hear was the clock tickling. The _ is pretty loud.", + "gold_answer": "clock", + "os_answer": "ticking", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dog that Laura found was dirtier than Amy's dog, since _ dog lived in the street.", + "gold_answer": "Laura", + "os_answer": "Laura's", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The ambulance went to the hospital without Nelson inside but with Ryan because _ drove there in a car.", + "gold_answer": "Nelson", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig was a very selfish individual but Kenneth was very generous. _ had a lot of good friends.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It took a less time for Katrina to read the book than Cynthia since _ was a better reader.", + "gold_answer": "Katrina", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Bobby had to use his pen to finish the exam rather than the pencil because the _ was full of ink.", + "gold_answer": "pen", + "os_answer": "pen", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easy for Matthew but not Logan to practice yoga because _ wanted to improve their mind and body.", + "gold_answer": "Matthew", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia was called back for a second interview but not Victoria, as _ had passed the background check.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia was called back for a second interview but not Victoria, as _ had failed the background check.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Harold liked to play with dolls more than cars because the _ talked back to him.", + "gold_answer": "dolls", + "os_answer": "dolls", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "There was more dirt on the car than the bike because the _ was kept inside.", + "gold_answer": "bike", + "os_answer": "bike", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "There was more dirt on the car than the bike because the _ was kept outside.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael was a very calm person with yoga but Jeffrey was hyper so, _ decided to take a yoga class.", + "gold_answer": "Jeffrey", + "os_answer": "Jeffrey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Going to a restaurant is something that Patricia does very often but Carrie rarely goes to one because _ is a very bad cook.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Going to a restaurant is something that Patricia does very often but Carrie rarely goes to one because _ is a very good cook.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Eric went to Leslie's house to play with the new dog, but there was no answer. _ was at the park.", + "gold_answer": "Leslie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica spends a lot more money on frivolous things than Rachel because _ has more disposable income.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin showed Maria to use the fork and knife in a proper manner as _ attended etiquette school.", + "gold_answer": "Erin", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Ian won a fish from Kenneth at the carnival so _ bagged it up and sent it home.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The hotline was staffed by Christine when Tanya called in because _ was a volunteer.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven helped Derrick do research on the paper because _ did not have access to the internet.", + "gold_answer": "Derrick", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven helped Derrick do research on the paper because _ had access to the internet.", + "gold_answer": "Steven", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel got advice on buying stocks from his cousin Bob while Eric used a broker. _ had a virtually worthless portfolio of companies.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rebecca asked Kayla to turn the lights out but _ did not want to go to sleep.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis is changing the sand in a pool filter for Joseph, because _ is a bit lazy.", + "gold_answer": "Joseph", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter gave Justin two weeks to respond after sending him a demand letter. .After that _ will sue him in the court.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The mediation and medication both helped me be patient. I lost my temper when the _ got rescheduled.", + "gold_answer": "mediation", + "os_answer": "mediation", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason considers he and Benjamin to be friends so _ puts a lot of effort into their relationship.", + "gold_answer": "Jason", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason considers he and Benjamin to be friends even though _ puts little effort into their relationship.", + "gold_answer": "Benjamin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It took a minute longer to melt the chocolate in the microwave than the caramel, because the _ was very soft.", + "gold_answer": "caramel", + "os_answer": "caramel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It took a minute longer to melt the chocolate in the microwave than the caramel, because the _ was very firm.", + "gold_answer": "chocolate", + "os_answer": "chocolate", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They discussed the company's budget at the business meeting but the _ was boring and the meeting was ran long.", + "gold_answer": "budget", + "os_answer": "agenda", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "They discussed the company's budget at the business meeting but the _ was boring and the topic of the budget ran long.", + "gold_answer": "meeting", + "os_answer": "agenda", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sponges performed worse at cleaning the tub in the bathroom when compared with the cloths. It's because the _ are cheaper.", + "gold_answer": "sponges", + "os_answer": "sponges", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Randy only ever added a little bit of hot sauce to his food, especially compared to Adam, as _ was much more sensitive to spice.", + "gold_answer": "Randy", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Matt wanted to change either the plain bathroom or the colorful bedroom, but the _ was already colorful.", + "gold_answer": "bedroom", + "os_answer": "bedroom", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Matt wanted to change either the plain bathroom or the colorful bedroom, but the _ was already plain.", + "gold_answer": "bathroom", + "os_answer": "bathroom", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The snow came down so much that Michael had to go plow Kevins driveway because _ agreed to take care of his neighbors.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The snow came down so much that Michael had to go plow Kevins driveway because _ needed the help of his neighbors.", + "gold_answer": "Kevin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The girl used the comb to try and brush her hair but the _ was too soft.", + "gold_answer": "comb", + "os_answer": "bristles", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Police arrested Maria but let Cynthia go as _ had some paint on their hand from the spray paint used for graffiti.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Police arrested Maria but let Cynthia go as _ had no paint on their hand from the spray paint used for graffiti.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter bought a vehicle to commute in but not Dennis because _ had a driving distance to work.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey went to the doctor to treat their ailments but not Robert so _ became sicker.", + "gold_answer": "Robert", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria asked Cynthia if she could borrow some fuel for her car, as _ had a shortage of it.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In the accident the vehicle of Nelson received more damage than that of Justin, since _ vehicle was smaller.", + "gold_answer": "Nelson", + "os_answer": "his", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "In the accident the vehicle of Nelson received more damage than that of Justin, since _ vehicle was bigger.", + "gold_answer": "Justin", + "os_answer": "Justin's", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela did a bunch of crunches and sit-ups but Cynthia didn't, consequentially _ had six- pack abs.", + "gold_answer": "Angela", + "os_answer": "Angela", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica is looking to buy some new furniture and Carrie just bought some, so _ is starting to anticipate their purchase arrival.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron showed Donald how to use google play on an android because _ owned an apple phone.", + "gold_answer": "Donald", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina turned out to be much more spoiled than Felicia because _ did not have wealthy or generous parents.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina turned out to be much more spoiled than Felicia because _ had wealthy and generous parents.", + "gold_answer": "Katrina", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah rolls her eyes as Monica extolls the virtues of vinegar as a cleaning solution for everything since _ is bored.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nelson always had the best friendships except with Neil since _ was always so polite.", + "gold_answer": "Nelson", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Derrick really liked working in Human Resources and William wanted to work at the same company, and _ subsequently offered a position.", + "gold_answer": "Derrick", + "os_answer": "was", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Derrick really liked working in Human Resources and William wanted to work at the same company, and _ subsequently accepted a position.", + "gold_answer": "William", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The room at the hotel cost more to stay in than the room at the inn because the _ was nastier.", + "gold_answer": "inn", + "os_answer": "inn", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The room at the hotel cost more to stay in than the room at the inn because the _ was nicer.", + "gold_answer": "hotel", + "os_answer": "accommodations", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman practiced for her interview and not for the sport since the _ was expedient.", + "gold_answer": "interview", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The boot was removed from the car tire and put on the truck tire, since the _ was now illegally parked.", + "gold_answer": "truck", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The boot was removed from the car tire and put on the truck tire, since the _ was now legally parked.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I have both glasses and contacts, but the cleaning solution was empty so I wore the _ today.", + "gold_answer": "glasses", + "os_answer": "glasses", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He found it harder to write the letter than the e-mail because the _ had so few words.", + "gold_answer": "e-mail", + "os_answer": "tweet", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jane loved travelling internationally. The current country she was in preferred wine over tea because the _ was less available.", + "gold_answer": "tea", + "os_answer": "water", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer wanted to get romance in a relationship while Elena did not because _ liked to watch romantic comedies.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam loved dogs but Jason was afraid of them, so only _ petted the poodle.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena brought the horse to the stables owned by Cynthia, so _ could buy the animal.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena brought the horse to the stables owned by Cynthia, so _ could sell the animal.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Brett wanted to get a massage but Kenneth did not. This is because _ was feeling relaxed.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kevin was worried about Eric's infections so _ decided to go to an emergency clinic.", + "gold_answer": "Eric", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The bird squawked at Mary's rushed approached and quieted when Jennifer came in since _ was threatening.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan was always behind Donald in high school because _ had a diagnosed learning disability.", + "gold_answer": "Ryan", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "People do not want to eat James burnt cake but they love his burger because the _ is tasteless.", + "gold_answer": "cake", + "os_answer": "former", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had problems with dry skin but not Hunter since _ used a soothing skin lotion.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had problems with dry skin but not Hunter because _ used an irritating skin lotion.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie loves putting sugar in coffee as opposed to Laura because _ thinks the coffee tastes better.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett was actively engaged in weight loss whereas Benjamin was trying to gain weight, so _ maximized their caloric intake.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ben had to drain both water and oil down the sink, but the _ was too viscous.", + "gold_answer": "oil", + "os_answer": "oil", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ben had to drain both water and oil down the sink, but the _ was too fluid.", + "gold_answer": "water", + "os_answer": "latter", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "John painted the pole red close to the color of the wall and painted the frame white and now the _ is contrasting.", + "gold_answer": "frame", + "os_answer": "pole", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John painted the pole red close to the color of the wall and painted the frame white and now the _ is similar.", + "gold_answer": "pole", + "os_answer": "contrast", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mark preferred his drinks in paper cups over styrofoam cups because the _ are strong.", + "gold_answer": "paper cups", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica had trouble paying off their loan unlike Sarah because _ was an infrequent gambler.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Derrick was sad that Robert did not show up, _ forgot they had an agreement to meet each other.", + "gold_answer": "Robert", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She suspected that her old makeup had expired after she put it on her skin because her _ was harder.", + "gold_answer": "makeup", + "os_answer": "complexion", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kevin drew the blood from Ian's arm, because _ was giving it to do some tests.", + "gold_answer": "Ian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sookie roasted a turkey and served it with potatoes instead of carrots, because everyone in her family would have hated the _ .", + "gold_answer": "carrots", + "os_answer": "carrots", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "They were wanting to move the bed thru the door. The _ was way to small.", + "gold_answer": "door", + "os_answer": "doorway", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty learned to play the cello well but Erin did not because _ was very impatient.", + "gold_answer": "Erin", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan ended the one-side relationship they were having with Robert, which made _ feel relieved.", + "gold_answer": "Logan", + "os_answer": "him", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin was eating more than Betty was eating for dinner because _ had a big lunch.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin was eating more than Betty was eating for dinner because _ had skipped lunch.", + "gold_answer": "Erin", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I chose to drive the car over the truck because the _ had a small amount of gas.", + "gold_answer": "truck", + "os_answer": "latter", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I chose to drive the car over the truck because the _ had a large amount of gas.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The diary of Carrie is boring, and the one Jennifer writes is interestin. _ has lived a simple life.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian's hair is being worked on by Craig, so it's more likely _ is the customer.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan didn't care for the comedians show but Patricia thought it was brilliant. _ hung out for the comedian's second set.", + "gold_answer": "Patricia", + "os_answer": "Neither", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He liked filling the bucket with the hose better than the faucet, because the _ provided extra water pressure.", + "gold_answer": "hose", + "os_answer": "hose", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine was watching makeup tutorials while Amy was not because _ wanted to forget how to put blush on correctly.", + "gold_answer": "Amy", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Diana went to the laundromat and she used the washer but not the dryer because she only had enough money for the _ .", + "gold_answer": "washer", + "os_answer": "washer", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ben wanted to propose to his girlfriend by hiding the ring in either cake or water. He decided to hide it in the _ because she drank the water fast.", + "gold_answer": "cake", + "os_answer": "cake", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman avoided the hole but easily stepped over the pit, because the _ was very deep.", + "gold_answer": "hole", + "os_answer": "hole", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The woman avoided the hole but easily stepped over the pit, because the _ was very shallow.", + "gold_answer": "pit", + "os_answer": "pit", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After I soaked the roller in the paint container, the _ had less paint on it.", + "gold_answer": "container", + "os_answer": "roller", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The lease in the city was more than the lease in the country because the value of the property in the _ was higher.", + "gold_answer": "city", + "os_answer": "city", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The refrigerator was acting up again, so we called a technician to repair the part. The _ was fine when he showed up.", + "gold_answer": "refrigerator", + "os_answer": "appliance", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Erin has a teenager whereas Patricia has toddler-age children because _ became a mother later.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Erin has a teenager whereas Patricia has toddler-age children because _ became a mother first.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kayla was very civil when dealing with Emily so that _ would be accepted by her.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin ordered a martini when Tanya only ordered a tonic water with lemon, because _ was pregnant.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The employee tried to put the extra clothes in the closets but the _ were too small.", + "gold_answer": "closets", + "os_answer": "closets", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald has a problem with hearing in his ears unlike Benjamin because _ worked in a quiet area.", + "gold_answer": "Benjamin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil was a very popular kid in school unlike Jeffrey, because _ was very extroverted.", + "gold_answer": "Neil", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I loved my old gifts but not the new dishes, because the _ were so beautiful.", + "gold_answer": "gifts", + "os_answer": "former", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty used glue to fix Megan's toy because _ was too young to use superglue.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason but not Craig asked the company if they were currently hiring because _ has a job.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The game on television was very important for Ian but not Dennis because _ was into music instead.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The virus stuck to the clothes better than it stuck to the walls, because the _ had less deterrents on them.", + "gold_answer": "clothes", + "os_answer": "fabrics", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The virus stuck to the clothes better than it stuck to the walls, because the _ had more deterrents on them.", + "gold_answer": "walls", + "os_answer": "walls", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "At their high school's homecoming dance, Natalie stayed on the floor for the slow dance while Maria got food during it, because _ had broken up with her significant other.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At their high school's homecoming dance, Natalie stayed on the floor for the slow dance while Maria got food during it, because _ currently had a significant other.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam always spent all of the free time watching Tv unlike Hunter who volunteered, due to _ being lazy.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "So _ ignored their ear because Jessica has a ear infection and Felicia was fine.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha had to use the potty while Felicia used the restroom because _ is a grownup.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After walking barefooted, James washed his foot in the bowl of water and the _ got dirty.", + "gold_answer": "water", + "os_answer": "water", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Benjamin put the family into debt, Adam filed for divorce; then the judge gave _ a sympathetic look.", + "gold_answer": "Adam", + "os_answer": "him", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Benjamin put the family into debt, Adam filed for divorce; then the judge gave _ a withering look.", + "gold_answer": "Benjamin", + "os_answer": "him", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin read a book to Monica because _ was old enough to be able to read.", + "gold_answer": "Erin", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The box slid down James hand when he was wearing a glove, hence he removed it and lift it again. The _ is dry.", + "gold_answer": "hand", + "os_answer": "skin", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The box slid down James hand when he was wearing a glove, hence he removed it and lift it again. The _ is slippery.", + "gold_answer": "glove", + "os_answer": "glove", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The building's ancient foundation was re-enforced with a steel alloy during the remodel because the _ was strengthening.", + "gold_answer": "steel", + "os_answer": "purpose", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When we go hiking I bring my backpack because it has built in water bottles and places for snacks. Today I forgot to fill the _ and was dehydrated.", + "gold_answer": "water bottles", + "os_answer": "bottles", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When we go hiking I bring my backpack because it has built in water bottles and places for snacks. Today I forgot to bring the _ and was starving.", + "gold_answer": "snacks", + "os_answer": "backpack", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She wanted to learn how to pair wine so she bought book instead of using a magazine because the _ was too broad.", + "gold_answer": "magazine", + "os_answer": "scope", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya read the contract carefully before signing it but Patricia didn't. _ didn't get ripped off by the shady merchant.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The garbage can smells much worse than the recycling, so the _ is probably a lot more sterile.", + "gold_answer": "recycling", + "os_answer": "recycling", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My pain was not nearly as bad as Joe's burn because the _ Joe had was uncontrollable.", + "gold_answer": "burn", + "os_answer": "agony", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The hotel had a terrible gym but a nice restaurant; the _ was something management attended to.", + "gold_answer": "restaurant", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Refraining from drinking was easy for Kyle but not Eric, as _ never enjoyed the taste of alcohol.", + "gold_answer": "Kyle", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia ate all of the dessert while Sarah did not have any since _ was not trying to lose any weight.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary went to the office to receive a new card with her photo on it and discarded a sticker because the _ was temporary.", + "gold_answer": "sticker", + "os_answer": "adhesive", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The new cream didn't remove the warts like the last lotion, because the _ was not powerful enough.", + "gold_answer": "cream", + "os_answer": "concentration", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kenneth is accused of destroying drywall in Jeffrey's house, _ is leasing out the house.", + "gold_answer": "Jeffrey", + "os_answer": "who", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth is accused of destroying drywall in Jeffrey's house, _ is renting the house.", + "gold_answer": "Kenneth", + "os_answer": "who", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Adam was cold and Michael was hot so _ removed a heavy jacket to withstand the freezing weather.", + "gold_answer": "Michael", + "os_answer": "Adam", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "After a short time we stopped pouring the tea glass in the pot because the _ was full.", + "gold_answer": "pot", + "os_answer": "saucer", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After a short time we stopped pouring the tea glass in the pot because the _ was empty.", + "gold_answer": "glass", + "os_answer": "teapot", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "When the dog behaves I like to give him a sausage otherwise I give him a ball. I gave him the _ since he was bad.", + "gold_answer": "ball", + "os_answer": "ball", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John decided to grow a new breed of plant in his garden but the _ is big.", + "gold_answer": "plant", + "os_answer": "risk", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin was sick of the pests like Amy always cutting out their internet, so _ decided to lay low.", + "gold_answer": "Amy", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "William wanted to go biking but Aaron wanted to stay home, so _ went out by themselves.", + "gold_answer": "William", + "os_answer": "they", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela loved to wear sun glasses but Jessica didn't. _ bought a fancy new pair of shoes.", + "gold_answer": "Jessica", + "os_answer": "She", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica was caught napping in class more often than Katrina because _ stayed up all night.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The highlands were a lot colder than the beaches because the _ were lower down in elevation.", + "gold_answer": "beaches", + "os_answer": "beaches", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine had really good grammar but Cynthia didn't have good grammar because _ studied math in college.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jessica was given a sapphire ring by Christine for her birthday because _ really likes sapphires.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The waist of Joel measured more inches than that of Kevin because _ ate much less.", + "gold_answer": "Kevin", + "os_answer": "Kevin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The lips on Cynthia were much bigger than Monica because _ got hit with a softball in the mouth.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The lips on Cynthia were much smaller than Monica because _ got hit with a softball in the mouth.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Mary goes around telling everyone that Christine is too clingy because _ likes to be touched..", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The parakeet flew to Hunter but flew past Samuel because _ had some bird seed in their hand.", + "gold_answer": "Hunter", + "os_answer": "Hunter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John opened the window for air to come him when he was sweating in his bedroom. The _ is cold.", + "gold_answer": "air", + "os_answer": "breeze", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Even though Ian had less of a sweet tooth than Robert, _ liked chocolate more.", + "gold_answer": "Ian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James walked into a ditch while trying to catch the ball thrown at him. The _ is farther.", + "gold_answer": "ball", + "os_answer": "distance", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Caroline works in the catering and food wholesale industries, but enjoys food preparation more, so she prefers her work in the _ industry.", + "gold_answer": "catering", + "os_answer": "catering", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Caroline works in the catering and food wholesale industries, but enjoys food distribution more, so she prefers her work in the _ industry.", + "gold_answer": "food wholesale", + "os_answer": "wholesale", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria never received flowers from the customers unlike Monica, by virtue of _ being polite.", + "gold_answer": "Monica", + "os_answer": "her", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hugh scrubbed the mold in his apartment with a cleaner but had to call a pro because the _ was too weak.", + "gold_answer": "cleaner", + "os_answer": "cleaner", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christopher tried to empty all the water from the tank in the yard because Michael had asked him to, but _ wasn't able to get it all out.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The watch could not fit on the arm properly because it had been cut by a blade. The _ was short.", + "gold_answer": "Watch", + "os_answer": "strap", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "A very active Randy injured their elbow playing basketball against Lawrence, so _ said sorry.", + "gold_answer": "Lawrence", + "os_answer": "Lawrence", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John sold the three chairs and used the money to buy twelve shoes. The _ were cheaper.", + "gold_answer": "shoes", + "os_answer": "shoes", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John sold the three chairs and used the money to buy twelve shoes. The _ were more expensive.", + "gold_answer": "chairs", + "os_answer": "chairs", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The barista loved to make all types of coffee including iced and hot. The _ coffee was popular in the cooler weathers.", + "gold_answer": "hot", + "os_answer": "hot", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The barista loved to make all types of coffee including iced and hot. The _ coffee was popular in the hotter weathers.", + "gold_answer": "iced", + "os_answer": "iced", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The apartment that Samantha lived in was a lot smaller than Megan, because _ had a little salary.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The girl put her money in the bag instead of her pocket although the bully would look in the _ .", + "gold_answer": "bag", + "os_answer": "purse", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The girl put her money in her bag instead of her pocket because the bully looked in the _ .", + "gold_answer": "pocket", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "So _ ignores Google to search for information because Betty trusts in it and Cynthia doesn't.", + "gold_answer": "Cynthia", + "os_answer": "ANSWER: Betty", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Irena didn't like other people living in something before her so she felt more comfortable buying the house instead of the mansion as the _ was old.", + "gold_answer": "mansion", + "os_answer": "house", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kevin was not able to run fast compared to William because _ had no broken bones in his body.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I did not see the sign on the billboard on the highway because the _ was too huge.", + "gold_answer": "billboard", + "os_answer": "advertisement", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I did not see the sign on the billboard on the highway because the _ was too tiny.", + "gold_answer": "sign", + "os_answer": "text", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After Logan pitched a ball that got clobbered for a home run by Justin in a baseball game, _ felt exultant.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela thought that Elena talked too slowly, and _ had a hard time being understood when they spoke.", + "gold_answer": "Elena", + "os_answer": "both", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel complained to Ian about the condition of the house. _ preferred a messy space.", + "gold_answer": "Ian", + "os_answer": "He", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At Jan's home, she dusted the dresser more frequently than the fan, because the _ was easier to reach.", + "gold_answer": "dresser", + "os_answer": "dresser", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At Jan's home, she dusted the dresser more frequently than the fan, because the _ was more difficult to reach.", + "gold_answer": "fan", + "os_answer": "fan", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor suggested alternating between ice and a heating pad when I strained a muscle, but he warned me to not let the _ get too warm.", + "gold_answer": "pad", + "os_answer": "pad", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor suggested alternating between ice and a heating pad when I strained a muscle, but he warned me to not let the _ get too cold.", + "gold_answer": "ice", + "os_answer": "ice", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "When other people were smoking, Kayla was more disgusted than Erin because _ had always avoided smoke.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin has a spouse and Kyle is single after being divorced, so _ is celebrating their independence this year.", + "gold_answer": "Kyle", + "os_answer": "Kyle", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christopher taught Hunter to play go fish so that _ had someone to play with.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie was helping Patricia diet and exercise at the gym to lose weight because _ used to be overweight.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I had to rake more leaves at the house than at the office because there were more trees at the _ .", + "gold_answer": "house", + "os_answer": "house", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The quality of music produced largely depends on the instrument used. The _ is vital.", + "gold_answer": "Instrument", + "os_answer": "instrument", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael made pickled eggs for Kenneth, but _ really loved his own and wanted to share them.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Henry wanted to stop yelling and start using a more effective type of communication because the _ was nice.", + "gold_answer": "communication", + "os_answer": "therapist", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tommy was able to carry the tripod himself, but his friend had to help him carry the camera because the _ was heavier.", + "gold_answer": "camera", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tommy was able to carry the tripod himself, but his friend had to help him carry the camera because the _ was lighter.", + "gold_answer": "tripod", + "os_answer": "tripod", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dog ran into the bedroom during the rainstorm while we stayed in the kitchen because the rain was louder in the _ .", + "gold_answer": "kitchen", + "os_answer": "bedroom", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The dog ran into the bedroom during the rainstorm while we stayed in the kitchen because the rain was softer in the _ .", + "gold_answer": "bedroom", + "os_answer": "bedroom", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Maria gave Samantha the blue floral pants, because _ didn't fit into them very well.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey was considered more masculine than Amy because every year _ went into the woods to French kiss deer.", + "gold_answer": "Amy", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "He was late for the party but on time for the sleepover because the _ had just finished.", + "gold_answer": "party", + "os_answer": "party", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Cynthia had to pee after one large coffee but Betty did not as _ had a very big bladder.", + "gold_answer": "Betty", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia had to pee after one large coffee but Betty did not as _ had a very small bladder.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The remote control worked better than the toy car because the batteries in the _ were fresher.", + "gold_answer": "remote control", + "os_answer": "remote", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily bought a piece of jewelry from Natalie, later _ thought she sold too low but kept a cool attitude.", + "gold_answer": "Natalie", + "os_answer": "the", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Robert was simply not as stoic as Joel , as _ tended to handle things gracefully.", + "gold_answer": "Joel", + "os_answer": "the", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron drank plenty of water before the hike, but Christopher forgot to, so _ ended up staying hydrated.", + "gold_answer": "Aaron", + "os_answer": "Aaron", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron drank plenty of water before the hike, but Christopher forgot to, so _ ended up getting dehydrated.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The TV that Samantha bought costs more than that of Carrie, because _ was poor.", + "gold_answer": "Carrie", + "os_answer": "Carrie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The TV that Samantha bought costs more than that of Carrie, because _ was rich.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie had an easier time crawling through the narrow tunnel than Patricia because _ was larger.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia gave a rabbit as a companion to Carrie because _ thought they were lonely.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia gave a rabbit as a companion to Carrie because _ explained they were lonely.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Smoke still rose from the house but had subsided at the barn. The fire was doused at the _ .", + "gold_answer": "barn", + "os_answer": "barn", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Although William liked animals less overall than Justin, _ couldn't stand to be around hamsters.", + "gold_answer": "Justin", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Katrina drove Emily to the prison, so that _ could say goodbye to them before they went to jail.", + "gold_answer": "Katrina", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Ian was tired of trying new diets while Steven had luck with one, so _ decided to do their own thing.", + "gold_answer": "Ian", + "os_answer": "each", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian was tired of trying new diets while Steven had luck with one, so _ stuck to their routine.", + "gold_answer": "Steven", + "os_answer": "both", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina wanted to build a new picture frame for Samantha's portrait because _ was an inexperienced woodworker.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Nick struggled with unresolved trauma that Ian couldn't understand, since _ had frequently experienced childhood abuse.", + "gold_answer": "Ian", + "os_answer": "Nick", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Nick struggled with unresolved trauma that Ian couldn't understand, since _ had never experienced childhood abuse.", + "gold_answer": "Nick", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Victoria decided to adopt a Yorkie, but Elena wouldn't even consider it, because _ loved small dogs.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Carrie kept written records of their expenses but not Laura because _ had a faulty memory.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Carrie kept written records of their expenses but not Laura because _ had a sharp memory.", + "gold_answer": "Laura", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My employer offers a bonus of either a phone or a television, but unfortunately the _ is just way too large to be useful.", + "gold_answer": "phone", + "os_answer": "television", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My employer offers a bonus of either a phone or a television, but unfortunately the _ is just way too small to be useful.", + "gold_answer": "television", + "os_answer": "screen", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The stain in the bucket could not be cleaned with the brush because the _ is soft.", + "gold_answer": "brush", + "os_answer": "bristle", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stain in the bucket could not be cleaned with the brush because the _ is tough.", + "gold_answer": "stain", + "os_answer": "stain", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha was not interested in hearing about Tanya awesome marriage, because _ was happy all the time.", + "gold_answer": "Tanya", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha wanted to reduce smoking by relying on a new nicotine patch and therapy video, but the _ was boring.", + "gold_answer": "video", + "os_answer": "video", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha wanted to reduce smoking by relying on a new nicotine patch and therapy video, but the _ was addictive.", + "gold_answer": "patch", + "os_answer": "habit", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had a slower running phone than Logan because _ had more apps running on theirs.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Craig had a faster running phone than Logan because _ had more apps running on theirs.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The roof would have to be repaired using tarps or shingles before the storm comes. The _ are a temporary fix, though.", + "gold_answer": "tarps", + "os_answer": "tarps", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty had more burns on their hands than Amy because _ worked as a welder.", + "gold_answer": "Betty", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary wanted to surprise Cynthia with a puppy for Christmas, so _ asked about allergies to dogs.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Keeping the doors closed and the windows opened kept the apartment cool , because the _ let out the heat.", + "gold_answer": "windows", + "os_answer": "breeze", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Keeping the doors closed and the windows opened kept the apartment cool , because the _ kept out the heat.", + "gold_answer": "doors", + "os_answer": "insulation", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The student tried to write down the notes on the papers but the _ were too long.", + "gold_answer": "notes", + "os_answer": "lectures", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samuel had a shorter expected lifespan than Kenneth, so _ procrastinated in following all their dreams.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The personal trainer gave Laura but not Victoria the more difficult exercise because _ was in shape.", + "gold_answer": "Laura", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The personal trainer gave Laura but not Victoria the more difficult exercise because _ was out of shape.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "When the car was brought up into the shop, the brake was replaced when the wheel wasn't, since the _ was fixed.", + "gold_answer": "wheel", + "os_answer": "caliper", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the dance, Adam asked the girl to dance before Donald, so _ is angry with himself.", + "gold_answer": "Donald", + "os_answer": "Donald", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "If I want to build a swing should I build it out of wood or use a tire? It seems like the _ would get dirty and gross inside.", + "gold_answer": "tire", + "os_answer": "tire", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "If I want to build a swing should I build it out of wood or use a tire? It seems like the _ would get rotten eventually.", + "gold_answer": "wood", + "os_answer": "wood", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The beef tasted better than the pork did although the _ had been slightly undercooked.", + "gold_answer": "beef", + "os_answer": "latter", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The chef added butter to the pan on the stove and it began to melt right away because the _ was hot.", + "gold_answer": "pan", + "os_answer": "stove", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The chef added butter to the pan on the stove and it began to melt right away because the _ was soft.", + "gold_answer": "butter", + "os_answer": "butter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie had a pig while Jennifer had a cow so _ thought mines smaller so its better.", + "gold_answer": "Natalie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sink in the bathroom looked good but the toilet was leaking so James kept the _ .", + "gold_answer": "sink", + "os_answer": "plumber", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Rebecca slept in the hammock in the backyard while Tanya gardened because _ was tired.", + "gold_answer": "Rebecca", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The bagel shop was closer to Michael than Joel because _ lived in a different area of town.", + "gold_answer": "Joel", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel but not Christine was tracked down by police because _ made it to the hideout.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel but not Christine was tracked down by police because _ did not make it to the hideout.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Benjamin had less piercings than Jeffrey did so it was harder for _ to get a job.", + "gold_answer": "Jeffrey", + "os_answer": "him", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Rachel wanted children, but Megan had no interest, so _ looked for someone else to have babies with.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel wanted children, but Megan had no interest, so _ looked for someone else to have freedom with.", + "gold_answer": "Megan", + "os_answer": "Rachel", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Joe drank his milk and tried to dunk his cookie in the glass but the _ was too small.", + "gold_answer": "glass", + "os_answer": "diameter", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe drank his milk and tried to dunk his cookie in the glass but the _ was too big.", + "gold_answer": "cookie", + "os_answer": "cookie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Anxiety is a feeling Rebecca gets when she has face Erin who is a probation officer, _ does not a fear of authority.", + "gold_answer": "Erin", + "os_answer": "but", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Adam cried when Donald had a stubbed toe since _ had a look of pain on his face.", + "gold_answer": "Donald", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The bank permitted Michael to open a checking account, but not Matthew, because _ was employed.", + "gold_answer": "Michael", + "os_answer": "Michael", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The bank permitted Michael to open a checking account, but not Matthew, because _ was unemployed.", + "gold_answer": "Matthew", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The children were not vaccinated, which was fine with Betty but annoyed Mary. _ knew they didn't make kids autistic.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The children were not vaccinated, which was fine with Betty but annoyed Mary. _ believed they made kids autistic.", + "gold_answer": "Betty", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Firing a shotgun came more naturally for Megan than Tanya because _ grew up around them.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "So _ ignored drinking milk from the bottle because Rachel was thirsty and Erin already drank some water.", + "gold_answer": "Erin", + "os_answer": "Rachel", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "So _ drank milk from the bottle because Rachel was thirsty and Erin already drank some water.", + "gold_answer": "Rachel", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donna needed dentures or implants for her bad teeth. She chose the _ because they are cheaper.", + "gold_answer": "dentures", + "os_answer": "dentures", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donna needed dentures or implants for her bad teeth. She chose the _ because they are permanent.", + "gold_answer": "implants", + "os_answer": "implants", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We were going fishing out on the dock later in the day after we couldn't all fit in the boat, because the _ was confined.", + "gold_answer": "boat", + "os_answer": "space", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie tended to wear their hair in a ponytail, while Maria wasn't able to, because _ had long hair.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The pine trees were still green in December, but the oak trees were not, because the _ keep their leaves in fall.", + "gold_answer": "pine trees", + "os_answer": "pines", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The pine trees were still green in December, but the oak trees were not, because the _ lose their leaves in fall.", + "gold_answer": "oak trees", + "os_answer": "oaks", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Fiction books were interesting and easy to read for Logan but not Brett because _ enjoyed real tales.", + "gold_answer": "Brett", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel had many extra possesions while Neil didn't, so _ had to rent a storage shed.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel had many extra possesions while Neil didn't, so _ didn't have to rent a storage shed.", + "gold_answer": "Neil", + "os_answer": "Neil", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey thought Craig probably had gum and asked for a piece, because _ had fresh breath.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey thought Craig probably had gum and asked for a piece, because _ had bad breath.", + "gold_answer": "Jeffrey", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin was able to use their device for longer than Steven because _ remembered to bring their charger.", + "gold_answer": "Benjamin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura was thrilled to get their lip pierced but Rachel was pretty scared. _ had theirs done and cried.", + "gold_answer": "Rachel", + "os_answer": "She", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wound responded quickly to the rubbing alcohol, but slowly to the ointment because the _ is more efficient.", + "gold_answer": "rubbing alcohol", + "os_answer": "former", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He tried to use the rag to clean the bacteria off the table but the _ was too large.", + "gold_answer": "table", + "os_answer": "colony", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "She decided to report the accident and the burglary, but the _ required much more investigation.", + "gold_answer": "burglary", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She decided to report the accident and the burglary, but the _ required much less investigation.", + "gold_answer": "accident", + "os_answer": "accident", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Brian informed Aaron that their coach had scheduled an extra event on Saturday morning since _ was present at yesterday's practice.", + "gold_answer": "Brian", + "os_answer": "neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "For work I can either get there by car or bicycle. I'm going to take the _ today because the weather is supposed to be rainy.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "No one would have noticed the spot on that skin because the _ is small.", + "gold_answer": "spot", + "os_answer": "blemish", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Because William developed a sore knee during his race against against Kyle, _ won the race.", + "gold_answer": "Kyle", + "os_answer": "Kyle", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I couldn't figure out what my costume would be for Halloween Peter Pan or Snow White. The _ costume I'd have to wear a dress.", + "gold_answer": "Snow White", + "os_answer": "latter", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I couldn't figure out what my costume would be for Halloween Peter Pan or Snow White. The _ costume I'd have to make myself a boy.", + "gold_answer": "Peter Pan", + "os_answer": "either", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James passport was kept inside the purse. He never knew the _ is that small.", + "gold_answer": "passport", + "os_answer": "size", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "James passport was kept inside the purse. He never knew the _ is that big.", + "gold_answer": "purse", + "os_answer": "size", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Of the two owners, Jessica was far worse than Jennifer, because _ like to treat the dogs.", + "gold_answer": "Jennifer", + "os_answer": "ANSWER: neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Of the two owners, Jessica was far worse than Jennifer, because _ like to beat the dogs.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The handle of the spoon was submerged in the cup of tea because the _ is short.", + "gold_answer": "spoon", + "os_answer": "cup", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tom recently was approved for botox therapy. He had a choice between near the office or near his house and went with his weekday convenience of the _ .", + "gold_answer": "office", + "os_answer": "office", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The water in the car was cooler than the water in the truck because the engine in the _ had run more recently.", + "gold_answer": "truck", + "os_answer": "truck", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The water in the car was hotter than the water in the truck because the engine in the _ had run more recently.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The color of the paint was quite pleasing to Jessica however Natalie believed it to be too bright. _ painted their room with a subdued color paint.", + "gold_answer": "Natalie", + "os_answer": "They", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Research came easy to Monica as compared to Erin because _ 's father was a landscaper.", + "gold_answer": "Erin", + "os_answer": "Monica", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Because of his rash, he opted not to wash with soap but with oil, as the _ would soothe it.", + "gold_answer": "oil", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James took out a seat from his office to create more space. The _ is too big.", + "gold_answer": "seat", + "os_answer": "room", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "His addiction was getting bad so they handed him over to therapy and stopped taking medicine since the _ was cheaper.", + "gold_answer": "therapy", + "os_answer": "rehab", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easier for the diner to follow their budget than the food truck because the _ had more money to spend.", + "gold_answer": "diner", + "os_answer": "diner", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easier for the diner to follow their budget than the food truck because the _ had less money to spend.", + "gold_answer": "food truck", + "os_answer": "diner", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Donald stuck his nose up and scoffed at William's ragged outfit, because _ looked like the working class.", + "gold_answer": "William", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We didn't get the biscuits this morning before school, so I ordered an omelet instead of a hash brown as the _ would make me hungry.", + "gold_answer": "hash brown", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We didn't get the biscuits this morning before school, so I ordered an omelet instead of a hash brown as the _ would make me full.", + "gold_answer": "omelet", + "os_answer": "protein", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett threw away all the soda and junk food to reduce Leslie's dependence on unhealthy foods because _ cares for his health.", + "gold_answer": "Brett", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Gem needed both therapy and medicines to cope with her broken leg. She preferred the _ because it was painless.", + "gold_answer": "medicine", + "os_answer": "therapy", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Neil told Lawrence that he was training to be a race car driver. _ was excited.", + "gold_answer": "Neil", + "os_answer": "Lawrence", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Neil told Lawrence that he was training to be a race car driver. _ was worried about him.", + "gold_answer": "Lawrence", + "os_answer": "Lawrence", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "the water poured freely into the hole until it disappeared , the _ was little.", + "gold_answer": "water", + "os_answer": "trickle", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "the water poured freely into the hole until it disappeared , the _ was deep.", + "gold_answer": "hole", + "os_answer": "abyss", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena was an excellent flight attendant when Sarah boarded the plane with a fear of flying because, _ was able to overcome their fears.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She wanted to sew a shirt from silk she bought and a jacket in denim from old jeans so the _ was recycled.", + "gold_answer": "denim", + "os_answer": "fabric", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty reluctantly confided in Rebecca that she was suffering from memory loss. _ was distraught.", + "gold_answer": "Betty", + "os_answer": "Betty", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Carla start doing sit-ups and pushups for her weak spots. The _ are for her abs.", + "gold_answer": "sit-ups", + "os_answer": "sit-ups", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carla start doing sit-ups and pushups for her weak spots. The _ are for her chest.", + "gold_answer": "pushups", + "os_answer": "pushups", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christopher was getting ready to wash Joel's hair,so _ got out shampoo by the sink and sat in the chair.", + "gold_answer": "Joel", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis invited Joseph on a trip to the hatchery tomorrow morning because _ was also interested in fish.", + "gold_answer": "Joseph", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man finally decided to become a guardian for the child at the orphanage because the _ was loving.", + "gold_answer": "guardian", + "os_answer": "Here is the correct word to fill in the blank:\n\nyoungster", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela's room was a lot lighter than Rebecca's room, because the light of _ went out.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca's", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan wrote on the paper with a pencil unlike Jennifer who wrote with a pen, because _ wanted to erase it later.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan wrote on the paper with a pencil unlike Jennifer who wrote with a pen, because _ wanted to keep it for later.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Laura asked Rachel if she could borrow some clothes because _ loved her fashion sense.", + "gold_answer": "Laura", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When you buy food for your cat, choose dry instead of wet as the crunchy texture of the _ is better for their teeth.", + "gold_answer": "dry", + "os_answer": "kibble", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It was easier to get the soil loosened up with the pick than with the shovel, because the _ was solid.", + "gold_answer": "pick", + "os_answer": "ground", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin knew the perfect gift for the wedding shower, but Samantha had to do some research, because _ was slightly acquainted with the bride.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The gothic lolita style suited Victoria better than Sarah because _ looked the worst in frilly dresses.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha couldn't see any alternatives, but Emily could, because _ wasn't nearly as open minded.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joseph wanted to sell lemonade at a stand in the summer months instead of the spring months since people in the _ would be thirstier.", + "gold_answer": "summer", + "os_answer": "summer", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After a boring meeting, Monica closed her eyes and dozed while Carrie took a walk, as _ had gone to bed late the night before.", + "gold_answer": "Monica", + "os_answer": "both", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After a boring meeting, Monica closed her eyes and dozed while Carrie took a walk, as _ had gone to bed early the night before.", + "gold_answer": "Carrie", + "os_answer": "neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My mom didn't fit the shape into the painting, because the _ was too awkward.", + "gold_answer": "shape", + "os_answer": "composition", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "My mom didn't fit the shape into the painting, because the _ was too complete.", + "gold_answer": "painting", + "os_answer": "composition", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My mom always had training at the house, but not today because the _ was unavailable.", + "gold_answer": "house", + "os_answer": "trainer", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin frequently suffered from hair loss while Samantha had healthy hair, as _ was never stressed out.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason was at practice all the time to try and get better than Christopher. _ needed more practice.", + "gold_answer": "Jason", + "os_answer": "He", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The team won a trophy instead of a plaque as a result of hard times as the _ was cheap to make.", + "gold_answer": "trophy", + "os_answer": "trophy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The creatures attacked Derrick while ignoring Ryan, because _ remembered to put on the repellent.", + "gold_answer": "Ryan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan liked to read a book good more than Samantha because _ liked the peace and quiet.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan liked to read a book good more than Samantha because _ hated the peace and quiet.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Late at night, Rebecca was more tired than Jessica so _ was unable to go right to sleep.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Late at night, Rebecca was more tired than Jessica so _ was able to go right to sleep.", + "gold_answer": "Rebecca", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman pierced the customer's tongue with a needle before piercing his nose because the _ was numb.", + "gold_answer": "tongue", + "os_answer": "tongue", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The woman pierced the customer's tongue with a needle before piercing his nose because the _ was still sensitive.", + "gold_answer": "nose", + "os_answer": "nostril", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Starting the engine of the car took less time unlike the truck since the _ 's engine was working at the time.", + "gold_answer": "car", + "os_answer": "car", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil used a chainsaw to cut down the tree instead of a regular saw like William, because _ believed in modern equipment.", + "gold_answer": "Neil", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The shirts were straighter than the pants because the _ were hanging on the hanger.", + "gold_answer": "shirt", + "os_answer": "shirts", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The shirts were straighter than the pants although the _ were hanging on the hanger.", + "gold_answer": "pants", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man thought lifting the rock, not the log, would give him a hernia because the _ was lighter.", + "gold_answer": "log", + "os_answer": "log", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria was able to keep their weight off long term, unlike Felicia, because _ followed a healthy diet.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Maria was able to keep their weight off long term, unlike Felicia, because _ followed a crash diet.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The dog was more suspicious of the locker than of the package because the drugs were in the _ .", + "gold_answer": "locker", + "os_answer": "locker", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin usually paid for the gas when Craig always said he was broke. _ was generous.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin loved people and wanted to help them while Katrina loved to help animals. _ volunteered at the local shelter.", + "gold_answer": "Katrina", + "os_answer": "Katrina", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis did not enjoy their afternoon but Hunter did because _ left work after the sunset.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Dennis did not enjoy their afternoon but Hunter did because _ left work after the sunrise.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We were making orange jack o lanterns and bought candles to put in the oranges, the candles did not fit. The _ were too big.", + "gold_answer": "candles", + "os_answer": "oranges", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "We were making orange jack o lanterns and bought candles to put in the oranges, the candles did not fit. The _ were too small.", + "gold_answer": "oranges", + "os_answer": "holes", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie committed a bunch of good deeds in Samantha's name, because _ wanted all the credit.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Natalie committed a bunch of good deeds in Samantha's name, because _ didn't want the credit.", + "gold_answer": "Natalie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "She wanted to shop for more clothes and ultimately decided on the velvet dress instead of the denim jacket because the _ was more casual.", + "gold_answer": "jacket", + "os_answer": "jacket", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil put the finishing touches on the android as he sold it off to Brian because _ was an engineer.", + "gold_answer": "Neil", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura didn't buy anything at all for Betty's birthday, because _ forgot to mention it.", + "gold_answer": "Betty", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel plans to go to Latin America next year where Dennis is currently living, _ has never been to Latin America.", + "gold_answer": "Joel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Beautiful to Angela means something physical, while it's mental to Emily, so _ is deeper.", + "gold_answer": "Emily", + "os_answer": "beauty", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Beautiful to Angela means something physical, while it's mental to Emily, so _ is shallower.", + "gold_answer": "Angela", + "os_answer": "Angela", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason really wanted to get the job, but he felt like he flunked the interview. The manager called and said he could try the _ again next week.", + "gold_answer": "interview", + "os_answer": "interview", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I was wearing wool socks when I went to try on my new boots but I couldn't get them on because the _ were too small.", + "gold_answer": "boots", + "os_answer": "boots", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I was wearing wool socks when I went to try on my new boots but I couldn't get them on because the _ were too large.", + "gold_answer": "socks", + "os_answer": "socks", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The library always had more books than computers, most likely because the _ are smaller.", + "gold_answer": "books", + "os_answer": "books", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The library always had more books than computers, most likely because the _ are bigger.", + "gold_answer": "computers", + "os_answer": "budgets", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The hair stylist gave Laura hair extensions and not Katrina because _ had very short hair.", + "gold_answer": "Laura", + "os_answer": "Laura", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Monica did not need a recipe in order to mix a cake but Angela did because _ was an instinctive baker.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had cereal for breakfast while Dennis had a shake, so _ finished drinking their breakfast.", + "gold_answer": "Dennis", + "os_answer": "Dennis", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had cereal for breakfast while Dennis had a shake, so _ finished eating their breakfast.", + "gold_answer": "Craig", + "os_answer": "both", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Logan ended up calling the police over an incident involving Jason because _ was scratched by them.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Carl needed a new top after ripping his epaulette shirt. He wanted a flannel shirt because the _ is old.", + "gold_answer": "epaulette shirt", + "os_answer": "trend", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Garrett was always feeling fatigued because of the energy his job demands. The _ of the job is too much.", + "gold_answer": "demand", + "os_answer": "rigor", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Ben had to respect his toys and his books to ensure they last long. However, it was difficult to respect the _ because they were fun.", + "gold_answer": "toys", + "os_answer": "toys", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He made a few dishes to serve. One was a salad and the other was a steak. The _ was healthy.", + "gold_answer": "salad", + "os_answer": "salad", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Although Angela was overall a nicer person than Natalie, _ often did practice humility very regularlly.", + "gold_answer": "Natalie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia has a pond in their backyard, but Carrie cannot afford one, which means _ lives in the richer neighborhood.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil's cat was terrified of thunderstorms but Kyle's wasn't bothered by them. _ found their cat hiding under the bed after the loud crackle of thunder.", + "gold_answer": "Neil", + "os_answer": "Neil", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jay could comfort sad people better instead of happy people because the _ people weren't realistic.", + "gold_answer": "happy", + "os_answer": "nostalgic", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Eric often thought of his annoying habits, like hitting his pen on his desk, and asked Ryan if it bothered him; _ said he was sorry he had done it.", + "gold_answer": "Eric", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya wanted poppies for her wedding flowers but Carrie said that was an odd choice. _ pointed out it was a wedding and tradition mattered.", + "gold_answer": "Carrie", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin shaved his beard, but Nick had just grown one, so _ gave them all his old oils.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I got more use in the gym than at the playground because the _ had more things to do.", + "gold_answer": "gym", + "os_answer": "gym", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica can speak English and German but Samantha can only speak English because _ is trilingual.", + "gold_answer": "Samantha", + "os_answer": "neither", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "All of the bands were not able to march on the fields at the same time because the _ were massive.", + "gold_answer": "bands", + "os_answer": "crowds", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Marty needed some sport and dress shoes, but could only buy one pair. He went with the _ since he would be going to a wedding.", + "gold_answer": "dress", + "os_answer": "dress", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I like to drink mineral water over tap water when I travel outside of the USA because the _ water in other countries is safe.", + "gold_answer": "mineral", + "os_answer": "bottled", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Pine trees were a big part of Erin s Christmas tree farm while Megan was jewish but helped _ celebrate anyhow.", + "gold_answer": "Erin", + "os_answer": "Erin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Eating spicy foods better suited Robert and not Adam because _ never got acid reflux from salsa.", + "gold_answer": "Robert", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel hated their new in-laws, but tried to keep it secret from Monica. Eventually _ told them.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Samantha was pretty good at math while Natalie was better at English. _ enrolled in a storytelling class this semester.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth had worse skin than Craig so _ had to use more of the moisturizer.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth had better skin than Craig so _ had to use more of the moisturizer.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cat Natalie owned would snuggle up on Jessica's lap because _ was nice to it all the time.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian always tried to find ways to be productive at work unlike Kenneth, because _ was a hard worker.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya loved pepperoni on their pizza and Katrina loved sausage, so when it had just sausage _ was not very happy.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya loved pepperoni on their pizza and Katrina loved sausage, so when it had just pepperoni _ was not very happy.", + "gold_answer": "Katrina", + "os_answer": "Katrina", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jen planned a retreat to a mountain or the park. She chose the _ because it was warmer.", + "gold_answer": "park", + "os_answer": "park", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin bought a new RV but Lawrence liked his old one, so _ decided to buy it.", + "gold_answer": "Lawrence", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin bought a new RV but Lawrence liked his old one, so _ decided to sell it.", + "gold_answer": "Justin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya was unrecognizable after Sarah was done beating them, so _ ended up going to jail.", + "gold_answer": "Sarah", + "os_answer": "Sarah", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Frank wanted to put the burger on the barbecue, but the _ wasn't formed yet.", + "gold_answer": "burger", + "os_answer": "patty", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "All the glaciers that fell from the top of the mountains were found at the bottom. The _ were large.", + "gold_answer": "Glaciers", + "os_answer": "fragments", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The student liked writing their signature with a pen instead of a pencil, because the _ showed up lighter.", + "gold_answer": "pencil", + "os_answer": "pencil", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The student liked writing their signature with a pen instead of a pencil, because the _ showed up darker.", + "gold_answer": "pen", + "os_answer": "ink", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick showed Jason how to cut the tiles for their kitchen, and _ was shown appreciation for their help.", + "gold_answer": "Derrick", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "So _ avoids eating carrots for their eye health because Emily needs good eyesight while Monica doesn't.", + "gold_answer": "Monica", + "os_answer": "neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The medical waste was moved from the bag to the bucket, so the _ soon became sterilized.", + "gold_answer": "bag", + "os_answer": "bag", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Sarah but not Erin would get a retirement pension because _ had a 30 year work career.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick had been working on his script for years and refused to get any other job, much to Logan's dismay. _ was worried and upset.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Connie likes to cook at home and decided to forgo a roast in favor of tofu because the _ is useless for a vegetarian meal.", + "gold_answer": "roast", + "os_answer": "meat", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He has a much harder time with this fever compared to the flu, because the _ took one week to get over.", + "gold_answer": "fever", + "os_answer": "latter", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I couldn't decide if I should pressure cook or smoke the pig feet. After looking outside, I decided the weather was poor enough to _ them.", + "gold_answer": "pressure cook", + "os_answer": "braise", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I couldn't decide if I should pressure cook or smoke the pig feet. After looking outside, I decided the weather was good enough to _ them.", + "gold_answer": "smoke", + "os_answer": "smoke", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The computer ran faster than the tablet because the files on the _ were larger.", + "gold_answer": "tablet", + "os_answer": "tablet", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Gem had a husky breed named Ben. Ben liked both bones and toys. However, he liked the _ the best because it was inedible.", + "gold_answer": "toys", + "os_answer": "toys", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian agreed to buy soap for Kenneth while at the store, and _ paid them back the following day for the errand.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The company wanted to increase labor productivity with its new machinery and camera, but the _ had faulty screws.", + "gold_answer": "machinery", + "os_answer": "equipment", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter prepared the documents and data tables for Matthew's scientific research because _ is his assistant.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samuel was blown away to find out from Lawrence that goldfish are a type of carp, so _ decided to fact check his friend.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The professor's eyes could not see clearly because of the sunglasses he had. The _ were poor.", + "gold_answer": "Sunglasses", + "os_answer": "optics", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "For her birthday gifts, Sarah was upset with the pearls, but felt the opposite about the rings she received. The _ were fancier.", + "gold_answer": "rings", + "os_answer": "rings", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jody wanted new mascara and eyeliner, either black or brown, but the _ was too light.", + "gold_answer": "brown", + "os_answer": "shade", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jody wanted new mascara and eyeliner, either black or brown, but the _ was too heavy.", + "gold_answer": "black", + "os_answer": "traffic", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aaron wanted to go the gym but the others wanted to go to the park because the _ did require membership.", + "gold_answer": "gym", + "os_answer": "park", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The doctor couldn't treat the arm infection, but was able to handle the ear ache. The _ was more petty.", + "gold_answer": "ear ache", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael had a cat as a pet but Nelson didn't have any pets because _ had little allergies in their system.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Maria mimicked everything that Christine did at work because _ was like a fan to her.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kyle paid Craig to board the family dog at the kennel for a week, because _ was going on vacation.", + "gold_answer": "Kyle", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria told Monica they looked too sick to go to work and asked if they had a fever. _ went to the Doctor.", + "gold_answer": "Monica", + "os_answer": "They", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stove was left on after Matthew used it, so Nelson turned it off. _ was careful.", + "gold_answer": "Nelson", + "os_answer": "Nelson", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica found the heavy load at work overwhelming but not Katrina because _ did a poor job at planning their work.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The brutal boxing match was suitable for Christopher but not Samuel because _ did damage to his opponent.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The brutal boxing match was suitable for Christopher but not Samuel because _ did not damage his opponent.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Going on a diet was easier for Benjamin but not Donald because _ did not know about any different programs.", + "gold_answer": "Donald", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer got about with a seeing-eye dog but Mary did not because _ was blind.", + "gold_answer": "Jennifer", + "os_answer": "Jennifer", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer got about with a seeing-eye dog but Mary did not because _ was sighted.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dog loved Kevin but hated Derrick, so _ started bringing the dog treats to change its mind.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dog hated Kevin but loved Derrick, so _ started bringing the dog treats to change its mind.", + "gold_answer": "Kevin", + "os_answer": "Kevin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The kitty ran away from Kayla and not Felicia because the kitty had known _ for many years.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "During the summer, I like visiting the zoo more than the aquarium because the _ is inside.", + "gold_answer": "aquarium", + "os_answer": "aquarium", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The market was going out of business so they sold their products but not the lots as the _ were useful.", + "gold_answer": "lots", + "os_answer": "premises", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The market was going out of business so they sold their products but not the lots as the _ were useless.", + "gold_answer": "products", + "os_answer": "fixtures", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Patricia has a trouble with training her horse and wants Tanya's help, because _ wants her horse to behave.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samuel had to recently recover from a stroke unlike William because _ was living an unhealthy lifestyle.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Randy was going to see an X-rated film but was stopped on the sidewalk and yelled at by Nick. The anger showed on _ 's face.", + "gold_answer": "Nick", + "os_answer": "Nick", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Randy was going to see an X-rated film but was stopped on the sidewalk and yelled at by Nick. The shame showed on _ 's face.", + "gold_answer": "Randy", + "os_answer": "Randy", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela noticed the lumps on Amy 's arms that she had failed to notice, _ is just oblivious that way.", + "gold_answer": "Amy", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Joel ran out of toilet paper, so he asked Dennis in the stall next to him for some. _ was relieved when he agreed.", + "gold_answer": "Joel", + "os_answer": "He", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kayla was the subject of a secret crush from Rebecca. _ was aware they were a secret admirer.", + "gold_answer": "Rebecca", + "os_answer": "Neither", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Tanya was the most powerful person in the world, and Sarah admired them, because _ was something to aspire to.", + "gold_answer": "Tanya", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian was supposed to be babysitting for Dennis but didn\u2019t show up because _ was forgotten.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald was able to catch the Frisbee thrown by Eric, then _ was thrown the Frisbee back.", + "gold_answer": "Eric", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald was able to catch the Frisbee thrown by Eric, then _ threw the Frisbee back.", + "gold_answer": "Donald", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I was driving my car and tried to get through the intersection, but the light turned red. The _ is too fast.", + "gold_answer": "light", + "os_answer": "timer", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe brought his books to school in a suitcase instead of a backpack because the _ was bigger.", + "gold_answer": "suitcase", + "os_answer": "suitcase", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joe brought his books to school in a suitcase instead of a backpack because the _ was smaller.", + "gold_answer": "backpack", + "os_answer": "backpack", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "During the earthquake, the boy hid under the desk instead of the table because the _ was sturdy.", + "gold_answer": "desk", + "os_answer": "desk", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "While playing soccer, Robert got kicked in the head and Joel laughed at him causing the coach to look at _ with pity.", + "gold_answer": "Robert", + "os_answer": "Robert", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald had to wax a lot more frequently than Ian because _ had blonde colored hair.", + "gold_answer": "Ian", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Joseph asked Robert to clean the floor with a mop nearby because _ needs to work.", + "gold_answer": "Robert", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Christine took all the money while Mary told her to save the money for herself. _ only knows to take.", + "gold_answer": "Christine", + "os_answer": "ANSWER: Christine", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig grew frustrated trying to coach Nick in soccer, as _ lacked the aptitude needed for the task.", + "gold_answer": "Nick", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig grew frustrated trying to coach Nick in soccer, as _ lacked the patience needed for the task.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Getting a divorce as soon as possible suited Victoria but not Lindsey because _ was no longer in love.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The musician liked playing at the auditorium more than at the park because he sounded quieter at the _ .", + "gold_answer": "park", + "os_answer": "park", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The musician liked playing at the auditorium more than at the park because he sounded louder at the _ .", + "gold_answer": "auditorium", + "os_answer": "auditorium", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Wanting to impress his boss, the man put the brandy away and served scotch instead because the _ was expensive.", + "gold_answer": "Scotch", + "os_answer": "latter", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Wanting to impress his boss, the man put the brandy away and served scotch instead because the _ was cheap.", + "gold_answer": "Brandy", + "os_answer": "brandy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Pho needs cilantro and beef to be tasty. However, the _ can be too bitter.", + "gold_answer": "cilantro", + "os_answer": "cilantro", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Pho needs cilantro and beef to be tasty. However, the _ can be too savory.", + "gold_answer": "beef", + "os_answer": "broth", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty's blanket was much thicker than Jessica's blanket, so _ felt cold all night in bed.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christopher declined when asked by Ian to play a game of chess because _ liked to play intellectual games.", + "gold_answer": "Ian", + "os_answer": "neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie had a phobia about crossing over high bridges but Tanya didn't. _ had to re-route their trip to avoid bridges.", + "gold_answer": "Natalie", + "os_answer": "They", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth explained to Ryan that he was dressed like this because he was going to a disco party. _ was excited.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth did not like Hunter because he was not a good manager. But he still respected _ because he was his superior.", + "gold_answer": "Hunter", + "os_answer": "him", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rebecca had a way of minimizing risks whereas Mary usually did not. This made _ want to assist.", + "gold_answer": "Rebecca", + "os_answer": "me", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Paolo tries to remember what he read in the textbook, but all he can think of is the email from his friend because he read the _ ages ago.", + "gold_answer": "textbook", + "os_answer": "textbook", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "If you are trying to get rid of blood spots from clothes use cold water instead of hot water the _ releases the stain.", + "gold_answer": "cold water", + "os_answer": "heat", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "If our relationship just started, should I get her a card or gift for Christmas? She might think I'm cheap if I give the _ .", + "gold_answer": "card", + "os_answer": "card", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "More people attended the funeral of Joel than of Derrick because _ was a mean person.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cleavage had to be hidden for this event's clothing because the _ was inappropriate.", + "gold_answer": "cleavage", + "os_answer": "d\u00e9colletage", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam decided to shave Denniss beard before the reuinion, because _ thought it was too long.", + "gold_answer": "Adam", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Adam decided to shave Denniss beard before the reuinion, but _ thought it was too short.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rebecca had a sneezing reflex unlike Monica, so when they took the cinnamon challenge _ won.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John tried to clean the juice that spilled on the carpet with a towel but it has sunk deep. The _ is still dry.", + "gold_answer": "towel", + "os_answer": "stain", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The landscaping looked better at the house than at the cottage because the _ owners used a hardworking company.", + "gold_answer": "house", + "os_answer": "former", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily had always loved kids and Jessica felt the opposite, so _ was surprised to become a pediatrician.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The intelligence agency ordered new computers for the workers and kept the same peripherals because the _ were at risk.", + "gold_answer": "computers", + "os_answer": "data", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria planned to spring clean this weekend and told Katrina they should help too. _ purposely left home very early.", + "gold_answer": "Katrina", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria planned to spring clean this weekend and told Katrina they should help too. _ expected her help.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nelson wanted to be an actor so Neil got them an audition because _ had poor connections in the movie industry.", + "gold_answer": "Nelson", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "During the charity drive, they decided to donate the couch but not the bed because the _ was broken.", + "gold_answer": "bed", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man decided to use a nail instead of a screw because the _ would be looser in the wood.", + "gold_answer": "screw", + "os_answer": "screw", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jen made charcoal to use as a mask and as toothpaste, but using the _ made her skin very black.", + "gold_answer": "mask", + "os_answer": "charcoal", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jen made charcoal to use as a mask and as toothpaste, but using the _ made her teeth very white.", + "gold_answer": "toothpaste", + "os_answer": "charcoal", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven was disappointed as Logan asked him if he had any herb. _ was a stoner.", + "gold_answer": "Logan", + "os_answer": "Logan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven was disappointed as Logan asked him if he had any herb. _ was let down.", + "gold_answer": "Steven", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Robert usually didn't like fish as much as Kyle however _ had a disliking for sardines on pizza.", + "gold_answer": "Kyle", + "os_answer": "both", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica painted the porch for Kayla so the neighbor berated _ for being so lazy.", + "gold_answer": "Kayla", + "os_answer": "Kayla", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis made their weight loss goal before Eric, because _ only ate a healthy diet.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya looked for an escape route while Elena did not because _ liked to live in the moment.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya looked for an escape route while Elena did not because _ liked to be aware of all the surroundings.", + "gold_answer": "Tanya", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael was on a diet, but cheated by eating junk food with Christopher. _ felt bad for ruining his plan.", + "gold_answer": "Christopher", + "os_answer": "He", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Elena waited patiently for Angela, as _ arrived early to meet at their prearranged spot.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In her newly purchased house, Patricia was upset to discover a woodworm infestation and called the realtor Victoria. _ called the sellers to ask them pay for an exterminator.", + "gold_answer": "Victoria", + "os_answer": "Victoria", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In her newly purchased house, Patricia was upset to discover a woodworm infestation and called the realtor Victoria. _ wanted the sellers to pay for an exterminator.", + "gold_answer": "Patricia", + "os_answer": "She", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We set up the treasure hunt, but the treasure chest was found easily on the path because the _ was big.", + "gold_answer": "chest", + "os_answer": "footprint", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "We set up the treasure hunt, but the treasure chest was found easily on the path because the _ was short.", + "gold_answer": "path", + "os_answer": "route", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald took medication for their anxiety, but Craig went to therapy because _ was open with their feelings.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald took medication for their anxiety, and Craig went to therapy because _ was private with their feelings.", + "gold_answer": "Donald", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Hunter found they no longer returned Joseph's love in their marriage, therefore _ received divorce papers.", + "gold_answer": "Joseph", + "os_answer": "they", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In order to grow his plants naturally, he bought fertilizer and water. The _ was lacking with nutrients.", + "gold_answer": "water", + "os_answer": "soil", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In order to grow his plants naturally, he bought fertilizer and water. The _ was filled with nutrients.", + "gold_answer": "fertilizer", + "os_answer": "fertilizer", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kayla threw the phone to Rebecca, then _ asked for it to be thrown back.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael had less money than Samuel did because _ liked to shop and spend money too much.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Michael had more money than Samuel did because _ like to shop and spend money too much.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After a nasty breakup, Kayla needed a restraining order from Samantha because _ was scary to them.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I didn't do well on my exam even though I did all the problems in the textbook correctly. I guess the questions in the _ were just too hard.", + "gold_answer": "exam", + "os_answer": "exam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At dinner time, Tanya ate Erin's serving of peas even though _ really likes green vegetables.", + "gold_answer": "Erin", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sally knew the exam would be hard so she developed a study schedule. The _ was 4 weeks long.", + "gold_answer": "schedule", + "os_answer": "schedule", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sally knew the exam would be hard so she developed a study schedule. The _ was 4 weeks away.", + "gold_answer": "exam", + "os_answer": "exam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey brushed their teeth quite regularly but Brian did not. _ rarely had to go to a dentist.", + "gold_answer": "Jeffrey", + "os_answer": "Jeffrey", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey brushed their teeth quite regularly but Brian did not. _ had to go to a dentist often.", + "gold_answer": "Brian", + "os_answer": "Brian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The kid looked terrible in the ancient Egyptian dress because the _ was too small.", + "gold_answer": "kid", + "os_answer": "tunic", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica was worried that Mary might be caught in a scam when they started their new job, but _ decided to trust their friend's judgement.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian taught Michael how to feed a rabbit greens because _ had rabbits as a kid.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "i had to walk closer to the board to see the phone numbers, only the monogram of the company is visible from a distance. The _ is bold.", + "gold_answer": "monogram", + "os_answer": "logo", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "He was having an asthma attack but forgot his inhaler so someone recommended coffee as the _ was unavailable.", + "gold_answer": "inhaler", + "os_answer": "alternative", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Amy tried to spread the cake icing all over the cake but the _ was not enough.", + "gold_answer": "icing", + "os_answer": "icing", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia teaches Kindergarten students, Christine teaches High School students therefore _ doesn't read aloud a lot.", + "gold_answer": "Christine", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia teaches Kindergarten students, Christine teaches High School students therefore _ reads aloud a lot.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey has dark lips unlike Elena due to _ remembering to put on chapsticks at night.", + "gold_answer": "Elena", + "os_answer": "not", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey has dark lips unlike Elena due to _ forgetting to put on chapsticks at night.", + "gold_answer": "Lindsey", + "os_answer": "her", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Joseph has an allergy to mangoes, but Nelson does not, so _ has to be very careful.", + "gold_answer": "Joseph", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin went with Donald to the game because _ wanted to be the designated driver.", + "gold_answer": "Justin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mike wanted to make the picture with the Photoshop software instead of the Paintshop software because the _ was more reliable.", + "gold_answer": "Photoshop software", + "os_answer": "former", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason missed his work shift in order to finish his research paper, because the _ was less important.", + "gold_answer": "work shift", + "os_answer": "priority", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The paper bags got torn when James was using it to move the groceries. The _ are weak.", + "gold_answer": "bags", + "os_answer": "bags", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven was worried about the height requirements for the rollercoaster more than Dennis was since _ was short.", + "gold_answer": "Steven", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven was worried about the height requirements for the rollercoaster more than Dennis was since _ was tall.", + "gold_answer": "Dennis", + "os_answer": "Dennis", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The quill was used by the writer much more than the pen for the job since the _ is heavy.", + "gold_answer": "pen", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel has experience driving large vehicles and Lawrence doesn't. _ drives their RV with accuracy.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She used vinegar to wipe down the cabinets hourly and a wood cleaner monthly. The _ was overused.", + "gold_answer": "vinegar", + "os_answer": "vinegar", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Despite the fact that Joseph was sick and Craig was healthy, _ still stayed home from work that day.", + "gold_answer": "Craig", + "os_answer": "Joseph", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The teacher asked for the homework. Elena played games the night before and Tanya did not, so _ got an F.", + "gold_answer": "Elena", + "os_answer": "Elena", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The teacher asked for the homework. Elena played games the night before and Tanya did not, so _ got an A.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William had a fear about nothing unlike Benjamin, because _ had a horrible childhood growing up.", + "gold_answer": "Benjamin", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The smell in the kitchen of the home is unbearable, while the laundry room smells fine. The _ must have been cleaned longer ago.", + "gold_answer": "kitchen", + "os_answer": "kitchen", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The clothing in the north was warmer than the clothing in the south because there was more snow in the _ .", + "gold_answer": "north", + "os_answer": "north", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The clothing in the north was warmer than the clothing in the south because there was more sun in the _ .", + "gold_answer": "south", + "os_answer": "south", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan grew the houseplant from seed, but Matthew bought a plastic plant instead, because _ tended to neglect plants.", + "gold_answer": "Matthew", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The thief tried to escape over the fence, but the _ was too short for him to climb over.", + "gold_answer": "thief", + "os_answer": "ladder", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The rib-eye steak needed some artisan pepper to season it because the _ was flavorful.", + "gold_answer": "pepper", + "os_answer": "meat", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The rib-eye steak needed some artisan pepper to season it because the _ was bland.", + "gold_answer": "steak", + "os_answer": "steak", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil introduced William, who is very shy, to his friends, but _ was being very embarrassing.", + "gold_answer": "Neil", + "os_answer": "William", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil introduced William, who is very shy, to his friends, but _ was being very quiet.", + "gold_answer": "William", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The gas was not smelling out of the tank but out of the hose because the _ is leaky.", + "gold_answer": "hose", + "os_answer": "nozzle", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The gas was not smelling out of the tank but out of the hose because the _ is sealed.", + "gold_answer": "tank", + "os_answer": "tank", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura had a much better body than Katrina, because _ spent all of their time at the ice cream shop.", + "gold_answer": "Katrina", + "os_answer": "Katrina", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My home is closer to the store than John's house, because the _ of me is next door.", + "gold_answer": "home", + "os_answer": "residence", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Samantha believed in life after death while Christine did not, so _ never tried to talk to spirits.", + "gold_answer": "Christine", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James always had to wash his shoe after jogging on the street but it is not always the same when jogging on the lawn. The _ is clean.", + "gold_answer": "lawn", + "os_answer": "lawn", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "While at the store, Logan grabbed a head of lettuce for Eric to use for dinner, but _ already had some at home.", + "gold_answer": "Eric", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "While at the store, Logan grabbed a head of lettuce for Eric to use for dinner because _ knew there was none at home.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In the hotel laundry room, Felicia burned Mary's shirt while ironing it, so the manager wrote _ up.", + "gold_answer": "Felicia", + "os_answer": "Felicia", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In the hotel laundry room, Felicia burned Mary's shirt while ironing it, so the manager gave _ a refund.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey asked Hunter when was the date set for the wedding because _ was getting married.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jeffrey asked Hunter when was the date set for the wedding because _ was his best man.", + "gold_answer": "Jeffrey", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig had never learned handwriting in school but Michael had learned beautiful script so, _ always typed all their correspondence.", + "gold_answer": "Craig", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia did laundry by hand, but Lindsey used the electric washer, because _ wore clothes made of delicate fabrics.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dancer would leave the stage and enter the hall after her dance was finished, as the _ was where she belonged during the dance.", + "gold_answer": "stage", + "os_answer": "stage", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick needed Kenneth to go to the store and get a baby bib, but _ said the one they had was still ok.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "His hands were a lot rougher than his thighs, because he used the _ for nothing.", + "gold_answer": "thighs", + "os_answer": "hands", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Christine told Samantha at court their reasons for their expired license, since _ had the responsibility to attend.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine told Samantha at court their reasons for their expired license, since _ had the responsibility to judge.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig was all about self-publishing his first album, but a PRO rep Lawrence advised against it. _ advocated for a very hands-on approach to publishing.", + "gold_answer": "Craig", + "os_answer": "Lawrence", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig was all about self-publishing his first album, but a PRO rep Lawrence advised against it. _ advocated for a very hands-off approach to publishing.", + "gold_answer": "Lawrence", + "os_answer": "Lawrence", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cleaning crew always used rags instead of washcloths, although the _ tended to wear out quickly.", + "gold_answer": "rags", + "os_answer": "former", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I hated the project this year compared to the essay last year, because the _ required more work.", + "gold_answer": "project", + "os_answer": "project", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "While waiting for the movie to begin, Natalie bought popcorn and drinks for Lindsey, since _ had little money.", + "gold_answer": "Lindsey", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christopher was able to travel abroad, while William only travelled domestically, as _ had never applied for a passport.", + "gold_answer": "William", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The rubber resisted the rock but snapped on the concrete, as the _ was abrasive.", + "gold_answer": "concrete", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The rubber resisted the rock but snapped on the concrete, as the _ was smooth.", + "gold_answer": "rock", + "os_answer": "surface", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Al got solar panels and a small generator installed at his house for electricity as the _ would be his main power supply.", + "gold_answer": "panels", + "os_answer": "panels", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The newborns in the nursery were very frail because they were fed the _ calorie food during the high and low calorie experiment..", + "gold_answer": "low", + "os_answer": "low", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The newborns in the nursery were very hardy because they were fed the _ calorie food during the high and low calorie experiment.", + "gold_answer": "high", + "os_answer": "high", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jane's hair was bound by a band until the band was cut because the _ is bulky.", + "gold_answer": "hair", + "os_answer": "bun", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The patient put in a special request for Brett instead of Kyle because _ was always stern.", + "gold_answer": "Kyle", + "os_answer": "Kyle", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel decided on adopting a young puppy but Megan didn't because _ didn't want to train a pupply.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin became very ill with pneumonia, so Matthew made him some soup; then _ finally went home.", + "gold_answer": "Matthew", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Applying to dance in music videos was great for Erin but not Lindsey because _ was a beginner dancer.", + "gold_answer": "Lindsey", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The landlord said she had violated her lease by allowing a dog into the apartment. She said that the dog did not violate the _ at all.", + "gold_answer": "lease", + "os_answer": "lease", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin asked Samuel to buy them a puppy, because _ could not have a pet.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The jeans fit worse than the shirt because I had tried the _ on at the store.", + "gold_answer": "shirt", + "os_answer": "shirt", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nelson teased Christopher about needing to find a homecoming date because _ could not find one.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nelson teased Christopher about needing to find a homecoming date because _ already had one.", + "gold_answer": "Nelson", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The athletes on the team of Christine were more tired than those on the team of Monica because the ones with _ did less laps.", + "gold_answer": "Monica", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The athletes on the team of Christine were less tired than those on the team of Monica because the ones with _ did less laps.", + "gold_answer": "Christine", + "os_answer": "Christine", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John could not buy anything from the store than night and he went to the kiosk to buy some things because the _ is opened.", + "gold_answer": "kiosk", + "os_answer": "kiosk", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "In order to increase her estrogen, Jenny started eating carrots instead of donuts because the _ were not junky.", + "gold_answer": "carrots", + "os_answer": "carrots", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It smelled a lot better near the pool than it did near the compost because there was no garbage in the _ .", + "gold_answer": "pool", + "os_answer": "pool", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James was able to hide the book inside his jacket because the _ is small.", + "gold_answer": "book", + "os_answer": "volume", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James was able to hide the book inside his jacket because the _ is big.", + "gold_answer": "jacket", + "os_answer": "pocket", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian laughs at Ryan because of the small Christmas tree they picked out. _ wants a table top tree.", + "gold_answer": "Ryan", + "os_answer": "Ryan", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian laughs at Ryan because of the small Christmas tree they picked out. _ wants a six foot tree.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Betty gave the full pitcher to Rachel so _ could fill her glass with water.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett looks as if they are aging at half the rate of Craig because _ has lived a rough lifestyle.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel's date was shorter than she, so she wore her shoes rather than her boots, because the _ had high heels.", + "gold_answer": "boots", + "os_answer": "former", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Rachel's date was shorter than she, so she wore her shoes rather than her boots, because the _ had low heels.", + "gold_answer": "shoes", + "os_answer": "shoes", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The store had 80 platters but only 2 bowls left in stock because the _ were in high demand.", + "gold_answer": "bowls", + "os_answer": "bowls", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The store had 80 platters but only 2 bowls left in stock because the _ were in low demand.", + "gold_answer": "platters", + "os_answer": "bowls", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Sarah had to call in an expert unlike Erin because _ had no knowledge on the subject.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sarah had to call in an expert unlike Erin because _ had vast knowledge on the subject.", + "gold_answer": "Erin", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica really enjoys a vodka drink, but Felicia prefers whiskey because _ likes dark liquors.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica really enjoys a vodka drink, but Felicia prefers whiskey because _ likes clear liquors.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The knee injury of Samantha has healed much quicker than Katrina's. _ 's injury was minor.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia felt very thirsty but Sarah did not feel thirsty. _ bought a bag of chips.", + "gold_answer": "Sarah", + "os_answer": "Cynthia", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha failed on the test but Mary got very good marks because _ had been very lazy.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle wanted to write to Aaron every day, because _ enjoyed sending letters to friends.", + "gold_answer": "Kyle", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle wanted to write to Aaron every day, because _ enjoyed receiving letters from friends.", + "gold_answer": "Aaron", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The toddler kicked the soft furniture and hard toy, but only the _ caused pain.", + "gold_answer": "toy", + "os_answer": "toy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The toddler kicked the hard furniture and soft toy, but only the _ caused pain.", + "gold_answer": "furniture", + "os_answer": "furniture", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica saw Laura constantly flirt with men in the office. _ thought it was normal in a place of business and she was admired by their coworkers.", + "gold_answer": "Laura", + "os_answer": "Neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Much to the dismay of Christopher, Jeffrey learned of their evil plan, and _ was stopped before it succeeded.", + "gold_answer": "Christopher", + "os_answer": "it", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The student wanted to be respectful to the teacher so he got her a book instead of an apple because the _ was old.", + "gold_answer": "apple", + "os_answer": "stereotype", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha's main artistic medium was paint, while Patricia preferred to work with clay, since _ was trained as a sculptor.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil asked Brian to hand him the measuring tape, but _ already measured the wall to center the picture.", + "gold_answer": "Brian", + "os_answer": "he'd", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The creams didn't work as well on my skin as the lotions did because the _ were new.", + "gold_answer": "lotions", + "os_answer": "formulas", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kiwis are a favorite of Ryan, while Derrick can't eat them. _ has sensitive teeth.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Although Amy worked harder and longer than Rebecca, _ was a more wealthy person overall.", + "gold_answer": "Rebecca", + "os_answer": "Rebecca", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James wanted to write a list of what he can do for Christmas and he ended up using all the pages in the notepad. The _ is long.", + "gold_answer": "list", + "os_answer": "list", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James wanted to write a list of what he can do for Christmas and he ended up using all the pages in the notepad. The _ is short.", + "gold_answer": "page", + "os_answer": "list", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha gifted her new bathrobe to Betty because it felt very comfortable for _ when she tried it on.", + "gold_answer": "Betty", + "os_answer": "her", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha gifted her new bathrobe to Betty because it felt very itchy for _ when she tried it on.", + "gold_answer": "Samantha", + "os_answer": "her", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The chopstick were better to eat the noodles with than the fork as the _ was repaired.", + "gold_answer": "chopstick", + "os_answer": "latter", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "James was finding a space on the couch for the box to be placed but he could not find it because the _ is big.", + "gold_answer": "box", + "os_answer": "box", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael loved eating many different vegetables but not Brett because _ was on a vegetarian diet.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "It was painful for Justin to break up with Jason, but _ wasn't ready to move on.", + "gold_answer": "Jason", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Needing a boost Emily asked Rachel to put them on their shoulders in order to reach the roof, _ is tall in height.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Bill had complicated feelings about getting a car after his motorcycle died because the _ possessed a lot of new features.", + "gold_answer": "car", + "os_answer": "vehicle", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Bill had complicated feelings about getting a car after his motorcycle died because the _ possessed a lot of sentimental value.", + "gold_answer": "motorcycle", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "As a marine, Emily looks down on civilians like Maria, so _ is a bit saddened.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle makes a lot more money than Nelson can make at his job, as _ is a cashier.", + "gold_answer": "Nelson", + "os_answer": "Nelson", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The food that Hunter ate was spoiled but not that of Brett because _ left his food outside.", + "gold_answer": "Hunter", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The food that Hunter ate was spoiled but not that of Brett because _ left his food in the fridge.", + "gold_answer": "Brett", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura held the steel for their project while Carrie used the blowtorch, because _ was more skilled.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy recognized the man in the waiting room before Monica did, because _ had met the man only once.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Nick smelled much worse than Kenneth after the baseball game although _ was wearing deodorant.", + "gold_answer": "Nick", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Mark wanted to lose some weight by starting a diet and workout routine. He focused mainly on the _ because he was lazy.", + "gold_answer": "diet", + "os_answer": "diet", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The drink was rich in caffeine and low in sugar because the _ was suffice in keeping the drinker awake.", + "gold_answer": "caffeine", + "os_answer": "caffeine", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The drink was rich in caffeine and low in sugar because the _ was not enough to keep the drinker awake.", + "gold_answer": "sugar", + "os_answer": "caffeine", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The tree fell down sooner than the sapling because the roots of the _ were stronger.", + "gold_answer": "tree", + "os_answer": "sapling", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The tree fell down after the sapling because the roots of the _ were weaker.", + "gold_answer": "sapling", + "os_answer": "sapling", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The man with the fever came over and talked to Carrie and not Lindsey because _ was a patient.", + "gold_answer": "Lindsey", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Samantha told Lindsey to be careful with the porcelain doll; when she ignored her and dropped the doll, _ was very sorry.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The Windows software attempted to install the upgrades onto the computer, but the _ exceeded data capacity.", + "gold_answer": "software", + "os_answer": "download", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The Windows software attempted to install the upgrades onto the computer, but the _ was outdated.", + "gold_answer": "computer", + "os_answer": "hardware", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James could not lift the bottle of water up to the table top because the _ is tall.", + "gold_answer": "table", + "os_answer": "table", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria gave birth to Katrina, so after the process was over, _ was a brand new mother.", + "gold_answer": "Maria", + "os_answer": "Maria", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jan planted her herbs in small growing bags, but she worried that the _ would be too shallow for them to put down roots.", + "gold_answer": "bags", + "os_answer": "soil", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jan planted her herbs in small growing bags, but she worried that the _ would be too stifled to put down roots.", + "gold_answer": "herbs", + "os_answer": "soil", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Writing came easily to Carrie but was difficult for Natalie because _ had taken engineering in college.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina asked Rachel to change the diapers for the babies this morning because _ is handling the stove.", + "gold_answer": "Katrina", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina asked Rachel to change the diapers for the babies this morning because _ isn't doing anything.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brett took more medicines than Aaron did although _ was suffering from many more diseases.", + "gold_answer": "Aaron", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The life of Christine was pretty basic until they met Maria , _ is a is lover of excitement .", + "gold_answer": "Maria", + "os_answer": "who", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin lied to Logan because _ was so upset about the money that was missing.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha decided to mix the mortar while Rebecca applied it to the wall. _ was not good at the finishing touches.", + "gold_answer": "Samantha", + "os_answer": "Neither", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick greeted Craig at the event but he did not respond to him because _ is humble.", + "gold_answer": "Derrick", + "os_answer": "Craig", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Derrick greeted Craig at the event but he did not respond to him because _ is arrogant.", + "gold_answer": "Craig", + "os_answer": "Craig", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica chose Kayla as the winning contestant on the reality show because _ was a contestant on the show.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael swam in the pond for longer than Derrick because _ thought the algae was okay.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth worked hard at training martial arts but not Samuel. _ couldn't made their dream come true of fighting in the UFC octagon.", + "gold_answer": "Samuel", + "os_answer": "they", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Because Megan wanted to be a welder and Patricia wanted to be a engineer, _ went to university instead of trade school.", + "gold_answer": "Patricia", + "os_answer": "Patricia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Because Megan wanted to be a welder and Patricia wanted to be a engineer, _ went to trade school instead of university.", + "gold_answer": "Megan", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man took longer to pay for the shoes than the shirt because he paid for the _ in coins.", + "gold_answer": "shoes", + "os_answer": "shoes", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The man took longer to pay for the shoes than the shirt although he paid for the _ in coins.", + "gold_answer": "shirt", + "os_answer": "shoes", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James was able to hide to gift he brought wit him in his pocket because the _ is big.", + "gold_answer": "pocket", + "os_answer": "pocket", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James was able to hide to gift he brought wit him in his pocket because the _ is small.", + "gold_answer": "gift", + "os_answer": "gift", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Sometimes I write in my journal with a pencil instead of a pen, but the _ can be run dry.", + "gold_answer": "pen", + "os_answer": "eraser", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John cannot run the entire length of the track, he had been used to the field. The _ is short.", + "gold_answer": "field", + "os_answer": "track", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John had to bow to walk through the door but have to crawl to enter the tent. The _ is taller.", + "gold_answer": "door", + "os_answer": "door", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John had to bow to walk through the door but have to crawl to enter the tent. The _ is shorter.", + "gold_answer": "tent", + "os_answer": "tent", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Adam's blushed a deep red when Jeffrey saw him fall off his horse, but _ tried to pretend it didn't hurt.", + "gold_answer": "Adam", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Leslie told Aaron he only wanted to eat food that was healthy, he was laughed at. The teacher comforted _ immediately.", + "gold_answer": "Leslie", + "os_answer": "him", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Leslie told Aaron he only wanted to eat food that was healthy, he was laughed at. The teacher scolded _ immediately.", + "gold_answer": "Aaron", + "os_answer": "Aaron", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor treated Natalie, but refused to see Tanya, because _ has an incredible insurance plan.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica asked Rebecca to go see a new horror movie even though _ knew she would likely to decline the invitation.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It doesn't take much to shift between ice and water. The _ is hard and strong when its cold.", + "gold_answer": "ice", + "os_answer": "ice", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "It doesn't take much to shift between ice and water. The _ is fluid and flexible when its warm.", + "gold_answer": "water", + "os_answer": "molecule", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy's being taught how to pay it forward by Kayla, so _ is likely the younger person.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Steven asked Joseph to have their stomach examined after _ had a night full of really bad gas issues.", + "gold_answer": "Joseph", + "os_answer": "they", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The assertive commander told the privates to change their boots but not their shirts because the _ were disgusting.", + "gold_answer": "boots", + "os_answer": "boots", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The assertive commander told the privates to change their boots but not their shirts because the _ were fine.", + "gold_answer": "shirts", + "os_answer": "shirts", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The chef decided to omit the chicken from his signature dish for the party, because the _ needed to be vegetarian.", + "gold_answer": "dish", + "os_answer": "entree", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Timmy bought a transporter for his cat so he could take him on the plane but the _ was too small.", + "gold_answer": "transporter", + "os_answer": "carrier", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia was given a leather belt from Betty to clean it, because _ knows how to do it.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia was given a leather belt from Betty to clean it, because _ doesn't know how to clean it.", + "gold_answer": "Betty", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Eric replaced his long hair with a new hat for the summer time, the _ was old.", + "gold_answer": "hair", + "os_answer": "haircut", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hunter had low tire pressure and asked Eric to fill the tires; when he said no, _ filled the tires.", + "gold_answer": "Hunter", + "os_answer": "Hunter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie tried to convince Cynthia that the cat needed a microchip because _ was concerned about the cat getting lost.", + "gold_answer": "Carrie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The doctor felt more sympathy for Aaron than Ryan because _ had a curable illness and great insurance.", + "gold_answer": "Ryan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily delivered the daily newspaper to Samantha promptly, so _ gave a nice Christmas bonus.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily delivered the daily newspaper to Samantha promptly, so _ expected a nice Christmas bonus.", + "gold_answer": "Emily", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jack wanted to start a game, but couldn't decide between baseball or basketball. The _ game would needed fewer of friends.", + "gold_answer": "basketball", + "os_answer": "former", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jack wanted to start a game, but couldn't decide between baseball or basketball. The _ game would call for more friends.", + "gold_answer": "baseball", + "os_answer": "former", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James wanted to wear the corsage but it wouldn't fit around his wrist because his _ was too small.", + "gold_answer": "corsage", + "os_answer": "buttonhole", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James wanted to wear the corsage but it wouldn't fit around his wrist because the _ was too big.", + "gold_answer": "wrist", + "os_answer": "band", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Laura was climbing down from the roof and Katrina was below so, _ was holding the ladder.", + "gold_answer": "Katrina", + "os_answer": "Katrina", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Bill could only go out to the restaurants rather than the bars because going to the _ required a minimum age.", + "gold_answer": "bars", + "os_answer": "bars", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina demanded that Jessica get off of their property, because _ was in the neighborhood for visiting.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Katrina demanded that Jessica get off of their property, because _ wasn't in the mood for visiting.", + "gold_answer": "Katrina", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the hospital, Kenneth tended to Randy 's wounds as _ was learning to contain an infection.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Justin admired the art hung on the wall by Nick, so _ asked if he would like to take something home.", + "gold_answer": "Nick", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The man chose medication for his infection rather than the ointment, because the _ was ineffective.", + "gold_answer": "ointment", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary felt a great deal of guilt for stealing various items from Rachel so _ forgave her.", + "gold_answer": "Rachel", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis warned Craig if they were late to work agian they would suffer termination, _ works for the boss at the local factory.", + "gold_answer": "Craig", + "os_answer": "Dennis", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Patricia bought Christine a watch for their birthday because _ was tired of asking about the time.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The teenager chose a jeweled pin for her belly piercing, but the _ was too tiny.", + "gold_answer": "piercing", + "os_answer": "clasp", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The teenager chose a jeweled pin for her belly piercing, but the _ was too huge.", + "gold_answer": "pin", + "os_answer": "gauge", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After visiting their tenth college, Kevin asked Donald to just make up his mind, because _ just didn't have time for more.", + "gold_answer": "Kevin", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "After visiting their tenth college, Kevin demanded that Donald to just make up _ 's mind, because he just didn't have time for more.", + "gold_answer": "Donald", + "os_answer": "his", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the store, John signed a warranty contract for the tablet, but did not purchase insurance for the phone, because the _ was unlikely to be damaged.", + "gold_answer": "phone", + "os_answer": "tablet", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the store, John signed a warranty contract for the tablet, but did not purchase insurance for the phone, because the _ was likely to be damaged.", + "gold_answer": "tablet", + "os_answer": "tablet", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Bob had a love and hate relationship with gambling and the _ grew as he won more money.", + "gold_answer": "love", + "os_answer": "addiction", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine was tired of Maria being a pain in the neck after _ laid down the prank trap.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When Derrick told Christopher about quitting school to provide for their family, _ started panicking.", + "gold_answer": "Derrick", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The food Katrina made was very bland, so Victoria added some salt; _ felt bad and vowed not to season again.", + "gold_answer": "Victoria", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "She was the prettiest in the room, wearing a pretty dress and jewelry. The _ was sparkling.", + "gold_answer": "jewelry", + "os_answer": "jewelry", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason hired his coworker to paint the house instead of hiring a painting company, because the _ will do it for more money.", + "gold_answer": "painting company", + "os_answer": "painting company", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The crops in the facility grew better than in the greenhouse since the _ was bright inside.", + "gold_answer": "facility", + "os_answer": "lighting", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Beautiful roses were bought by Jason for Dennis because _ is a receiver in general.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The battery of the the phone died faster than the laptop battery, because the _ was always off.", + "gold_answer": "laptop", + "os_answer": "charger", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The battery of the the phone died faster than the laptop battery, because the _ was always on.", + "gold_answer": "phone", + "os_answer": "screen", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia ran out of shirts and borrowed one from Patricia, but _ didn't ask permission ahead of time.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I wanted to use pomade on my hair instead of hairspray but it was old so the _ was unusable.", + "gold_answer": "pomade", + "os_answer": "pomade", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan picked up some olive oil for Felicia because _ hated to cook but loved to eat.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Megan picked up some olive oil for Felicia because _ loved to cook but hated to eat.", + "gold_answer": "Felicia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ian always got ready quickly in the morning and ended up waiting for Christopher, _ was always punctual.", + "gold_answer": "Ian", + "os_answer": "who", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kayla always wears sunscreen outdoors but Natalie doesn't because _ isn't concerned about getting neck wrinkles.", + "gold_answer": "Natalie", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Felicia wanted to be pampered by Emily, so _ went to the jewelry store and bought an expensive ring.", + "gold_answer": "Emily", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The man couldn't stop thinking about the violin and the crossbow he lost when he was younger. He used to love to shoot _ .", + "gold_answer": "crossbow", + "os_answer": "arrows", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mastering the game of chess was easier for Brian than William because _ had an analytical mind.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The gerbil came over to Laura but not Monica because _ was holding a hockey stick.", + "gold_answer": "Monica", + "os_answer": "Monica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The gerbil came over to Laura but not Monica because _ was holding a carrot stick.", + "gold_answer": "Laura", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle loved to camp in the wilderness but Justin preferred a nice hotel. _ booked a trip to New York City.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle loved to camp in the wilderness but Justin preferred a nice hotel. _ booked a trip to Yellowstone Park.", + "gold_answer": "Kyle", + "os_answer": "They", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The _ car was a pleasure to drive but the red car was not as the blue car was very expensive.", + "gold_answer": "blue", + "os_answer": "blue", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The blue car was a pleasure to drive but the _ car was not as the red car was very cheap.", + "gold_answer": "red", + "os_answer": "red", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Samantha wanted to use a valet to park the car but Carrie did not because _ was generous with money.", + "gold_answer": "Samantha", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The trumpet part overpowered the reeds but could not be heard over the strings, as the _ were just too quiet .", + "gold_answer": "reeds", + "os_answer": "dynamics", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "James forgot to put the food in the freezer so he had to eat the fruits the next day because the _ is rotting.", + "gold_answer": "food", + "os_answer": "fruit", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The patient took calcium to fix his broken bone but the _ was too weak.", + "gold_answer": "bone", + "os_answer": "dosage", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The patient took calcium to fix his broken bone but the _ was too strong.", + "gold_answer": "calcium", + "os_answer": "dosage", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Emily has never struggled with blood clots like Victoria has, because _ lives a sedentary, gluttonous lifestyle.", + "gold_answer": "Victoria", + "os_answer": "Victoria", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "On the playground at school during recess, Monica called Emily a chicken because _ was capable of climbing the ladder.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "On the playground at school during recess, Monica called Emily a chicken because _ was scared of climbing the ladder.", + "gold_answer": "Emily", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hannah had to get a lawyer to help her understanding of the contract language because the _ the contract had was too complex.", + "gold_answer": "language", + "os_answer": "legalese", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary loved to make baked potatoes, but Monica couldn't stand the smell; _ asked her to only make them when she was alone.", + "gold_answer": "Monica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary loved to make baked potatoes, but Monica couldn't stand the smell; _ only made them when she was alone.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The fisherman wanted to put the rock in the pond but the _ was too small.", + "gold_answer": "pond", + "os_answer": "hole", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Joe did a lot worse on the quiz last week than he did on the test today, because the _ was a surprise.", + "gold_answer": "quiz", + "os_answer": "quiz", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena was asked by Jessica to put patches in the holes in her pants; _ gave her some she bought at the store.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Elena was asked by Jessica to put patches in the holes in her pants; _ used some she already had at home.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Learning a new form of karate was difficult for Logan but not William because _ was not athletic.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian wanted a horse but not Nick because _ raised cattle in their spare time.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Elena liked lizards more than Rachel did, so _ was appalled to receive a pet gecko for her birthday.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan preferred to snowboard while Kyle wanted to do biathlon so _ went up the hill.", + "gold_answer": "Logan", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She watered the rose but not the cactus, because the soil of the _ was already wet.", + "gold_answer": "cactus", + "os_answer": "cactus", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She watered the rose but not the cactus, because the soil of the _ was already dry.", + "gold_answer": "rose", + "os_answer": "cactus", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Nick did not like sauces made from tomato, only creamy sauces. Ryan knew this so he only made white sauce when _ came over.", + "gold_answer": "Nick", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The ingredients that I use are tastier than the available toppings because the _ are old.", + "gold_answer": "toppings", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel knew exactly how to treat the injured person's wound but not Emily because _ took a woodworking class in high school.", + "gold_answer": "Emily", + "os_answer": "Rachel", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The dress could use either velcro or a zipper to close, the _ would last longer.", + "gold_answer": "zipper", + "os_answer": "zipper", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The class was going on a bus on a field trip to a local museum. The _ had to close at 4.", + "gold_answer": "museum", + "os_answer": "museum", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kelly was embarrassed when his toga fell off at the party and people saw his underwear because the _ was too tight.", + "gold_answer": "underwear", + "os_answer": "cincture", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kelly was embarrassed when his toga fell off at the party and people saw his underwear because the _ was too loose.", + "gold_answer": "toga", + "os_answer": "knot", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kayla was always thinner than Rachel because _ enjoyed eating brioche and butter every morning.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Robert has no regret for punching Justin in the nose even though _ was the victim of injustice.", + "gold_answer": "Justin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Robert has no regret for punching Justin in the nose because _ was the victim of injustice.", + "gold_answer": "Robert", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The dark circles under Erin's eyes were darker than Cynthia's due to _ being older.", + "gold_answer": "Erin", + "os_answer": "her", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cake got burnt under the heat applied to it. It appears the _ is too small.", + "gold_answer": "cake", + "os_answer": "pan", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Harper wanted to wear a cowboy hat and a bolero tie to her party, but the _ didn't fit her head.", + "gold_answer": "hat", + "os_answer": "hat", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura put fruit in their pie for Lindsey to eat, and _ ate half the pie after that one was done baking.", + "gold_answer": "Lindsey", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I started a program for youth that worked better than the old system, because the _ is new.", + "gold_answer": "program", + "os_answer": "approach", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William was very comfortable entering Kenneth 's personal domain any time, as _ was very self-assured.", + "gold_answer": "William", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Tanya recently finished filling out a job application but not Megan because _ is currently unemployed.", + "gold_answer": "Tanya", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Tanya recently finished filling out a job application but not Megan because _ is currently working.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence had lost a lot of weight on their diet but Hunter wasn't nearly as succesful. _ was now heavy.", + "gold_answer": "Hunter", + "os_answer": "He", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey did not know how to make a good impression for an interview with Tanya. _ was surprised when she did not get the job.", + "gold_answer": "Lindsey", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya wanted to audition for the show that Sarah was casting, so _ watched her routine very carefully.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "When it came to taking care of elderly people, Adam was suited for the job more than Brian because _ lived with younger people longer.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Felicia experienced a tummy ache while Tanya did not because _ had not eaten any food.", + "gold_answer": "Tanya", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Erin was self-conscious of her legs and Katrina didn't help by making fun of them, but _ went to the gym to try and help her.", + "gold_answer": "Katrina", + "os_answer": "Erin", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "While shopping at the mall, Kevin asked Benjamin to help find a red shirt to wear because _ was great at clothing budgeting.", + "gold_answer": "Benjamin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "As a parent, Catherine doesn't let her kids watch movies, but they can watch some TV shows. Catherine thinks the _ are too violent.", + "gold_answer": "movies", + "os_answer": "movies", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lindsey loves dogs and doesn't have one of her own. So when Amy visits with her dog, _ gives it treats and spoils it.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "the scanning tool could not get through the cervix because the _ was too big.", + "gold_answer": "tool", + "os_answer": "fetus", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "the scanning tool could not get through the cervix because the _ was too small.", + "gold_answer": "cervix", + "os_answer": "os", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary didn't know what the currency of Mexico was but Lindsey knew _ had never been to Mexico before.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan sentenced Jennifer to probation for stealing from the grocery store, _ obeys the laws that are written.", + "gold_answer": "Megan", + "os_answer": "thereby", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary thinks Sarah has beautiful skin, even though _ actually has the better complexion of the two.", + "gold_answer": "Mary", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia loved the smell of Rachel's shampoo, so she asked where to buy it. _ gave her a bottle the next day.", + "gold_answer": "Rachel", + "os_answer": "Rachel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald had to drive Matthew to the doctor immediately because _ was feeling lightheaded and dizzy.", + "gold_answer": "Matthew", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The apartment Brett rented was owned by Jason, so _ sent the rent for the apartment each month.", + "gold_answer": "Brett", + "os_answer": "Brett", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The apartment Brett rented was owned by Jason, so _ received the rent for the apartment each month.", + "gold_answer": "Jason", + "os_answer": "Jason", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I don't want to use that iron on my new shirt, and, yes, it's because the _ is too expensive.", + "gold_answer": "shirt", + "os_answer": "fabric", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I don't want to use that iron on my new shirt, and, yes, it's because the _ is too cheap.", + "gold_answer": "iron", + "os_answer": "brand", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The wound caused by the bullet needed more care than the one caused by the knife because the _ wound was superficial.", + "gold_answer": "knife", + "os_answer": "knife", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle was in a lot of pain after running the marathon in place of Brian, but _ appreciated the support of his cause.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy asked Maria how to make homemade candles to give as gifts. _ knew she had a lot of experience making them.", + "gold_answer": "Amy", + "os_answer": "She", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Patricia liked to lie around in a hammock all day but Megan did not because _ was very sedentary.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Hank was eating cereal and spilt milk on his hot pants and decided to get his pleated pants. He needed to change into new leggings because the _ are clean.", + "gold_answer": "pleated pants", + "os_answer": "pleated", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sara's cat got fleas so she bought a treatment and put it on the cat's neck. The cat was unhappy and tried to lick it off the _ .", + "gold_answer": "neck", + "os_answer": "fur", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick always wanted to wash when they woke up but Benjamin rarely bothered. _ was a very dirty person.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Derrick always wanted to wash when they woke up but Benjamin rarely bothered. _ was a very clean person.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie is a forest ranger, Jessica is a cook therefore _ probably can't tell you how to plant your pine tree.", + "gold_answer": "Jessica", + "os_answer": "Jessica", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin brought a a saw and hammer to prepare making a cupboard for Benjamin because _ is his employer.", + "gold_answer": "Benjamin", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia was on a diet and did not eat the cookies Rebecca baked for her. _ was jealous.", + "gold_answer": "Patricia", + "os_answer": "Rebecca", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Kenneth's back is being tended to by Derrick at the office, so _ is the client in this situation.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin used a stencil on their presentation lettering but Derrick did not. _ had a very sloppy looking presentation.", + "gold_answer": "Derrick", + "os_answer": "Derrick", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Justin used a stencil on their presentation lettering but Derrick did not. _ had a very neat looking presentation.", + "gold_answer": "Justin", + "os_answer": "Justin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The mirror didn't lie when it showed how overweight Patricia was and how emaciated Felicia was, so _ needed to go on diet.", + "gold_answer": "Patricia", + "os_answer": "neither", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stores used posters instead of flyers, because the overall cost of distribution for the _ was cheaper.", + "gold_answer": "posters", + "os_answer": "posters", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stores used posters instead of flyers, but the overall cost of distribution for the _ was cheaper.", + "gold_answer": "flyers", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "With my ankle sprain, I am not able to put my foot in my shoe because the _ is too fat.", + "gold_answer": "sprain", + "os_answer": "swelling", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan could eat gluten while Adam could not, and _ always had a smaller variety of foods to choose from.", + "gold_answer": "Adam", + "os_answer": "therefore", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria wasn't aware that Erin was coming up behind them, because _ was generally sneaky.", + "gold_answer": "Erin", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael was a better employer than Joel so _ had to worry about retaining employees.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael was a better employer than Joel so _ did not have to worry about retaining employees.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James was suffering from nausea and decided to drink ginger tea but the _ was too meek.", + "gold_answer": "tea", + "os_answer": "flavor", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Two friends wanted a tan look but Joel was impatient while Robert wasn't. _ used bronzer to get a tan look.", + "gold_answer": "Joel", + "os_answer": "Joel", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Playing basketball came easier for Cynthia than Jennifer but _ had more control of their body movements.", + "gold_answer": "Jennifer", + "os_answer": "Jennifer", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Playing basketball came easier for Cynthia than Jennifer but _ had less control of their body movements.", + "gold_answer": "Cynthia", + "os_answer": "Jennifer", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The lady was blushing when she walked passed Amy but not Carrie because _ was intrigued by her.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Dennis's home just burned down, but luckily Donald's was spared. So, now _ is grateful.", + "gold_answer": "Donald", + "os_answer": "Dennis", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan focused more on proper posture than Lindsey because _ wanted to become a model.", + "gold_answer": "Megan", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Megan focused less on proper posture than Lindsey because _ wanted to become a model.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria had no issues with Achilles Tendinitis unlike Betty because _ never wore sneakers with cushion.", + "gold_answer": "Betty", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Katrina did not value the antique pictures as much as Lindsey because _ was a history buff.", + "gold_answer": "Lindsey", + "os_answer": "Lindsey", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan's boil cleared up right away while Christopher's boil got infected due to _ applying medicine later.", + "gold_answer": "Christopher", + "os_answer": "his", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jason went zooming down Brett's street way too fast on his motorcycle, causing _ great excitement.", + "gold_answer": "Jason", + "os_answer": "quite", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Angela wanted to find a partner, but Victoria wanted to stay single, because _ was lonely.", + "gold_answer": "Angela", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My teeth hurt more after eating the cake than the pie because the _ was not as sweet.", + "gold_answer": "pie", + "os_answer": "latter", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "My teeth hurt more after eating the cake than the pie because the _ was sweeter tasting.", + "gold_answer": "cake", + "os_answer": "cake", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "On Valentine's Day, Brian receives no flowers, but Kevin gets a lot. _ is probably dating someone.", + "gold_answer": "Kevin", + "os_answer": "Kevin", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael had to learn how to speak Chinese for his job unlike Matthew, because _ worked in China.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael had to learn how to speak Chinese for his job unlike Matthew, because _ worked in England.", + "gold_answer": "Matthew", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The boards were used to build the houses instead of the bricks as the _ were sparse.", + "gold_answer": "bricks", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Betty avoided getting attacked in the dark alley where Elena was mugged, because _ ignored their intuition.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The actors practiced the scenes in the parking lot more than the scenes in the morgue, because the _ scenes are full of silence.", + "gold_answer": "morgue", + "os_answer": "morgue", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Victoria was interested in babies, but Katrina thought they were annoying, so _ preferred visiting the nursery.", + "gold_answer": "Victoria", + "os_answer": "Victoria", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The laws of the government are a lot worse than the rules of schools, because the _ are strict.", + "gold_answer": "laws", + "os_answer": "laws", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The kids at camp liked the activities with water, but avoided the sand, because the _ was cleansed.", + "gold_answer": "water", + "os_answer": "water", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "When gambling in Las Vegas, Christine usually bets less playing poker than Elena because _ is more cautious.", + "gold_answer": "Christine", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Natalie is extremely shy, but Lindsey is good at talking to strangers, which makes _ worse at telemarketing.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin thought Android was the superior phone system but Ian thought IOS was better. _ bought a new Note 9 from Verizon.", + "gold_answer": "Benjamin", + "os_answer": "Benjamin", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Benjamin thought Android was the superior phone system but Ian thought IOS was better. _ bought a new iPhone 9 from Verizon.", + "gold_answer": "Ian", + "os_answer": "Ian", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jill bought a slip to go with her new skirt but the _ was too short and it hung out the bottom.", + "gold_answer": "skirt", + "os_answer": "slip", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Jill bought a slip to go with her new skirt but the _ was too long and it hung out the bottom.", + "gold_answer": "slip", + "os_answer": "hem", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan kept a store of ammo in their house but Brian did not as _ approved of hunting.", + "gold_answer": "Logan", + "os_answer": "neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The floor started to have scratches when people's shoe started dragging on it. The _ was rough.", + "gold_answer": "shoe", + "os_answer": "finish", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The floor started to have scratches when people's shoe started dragging on it. The _ was smooth.", + "gold_answer": "floor", + "os_answer": "floor", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Craig made sure to stretch before working out but Christopher never did, so _ frequently got injuries.", + "gold_answer": "Christopher", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Elena is concerned that Megan might have a Twitter addiction, but _ is probably worrying about nothing.", + "gold_answer": "Elena", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Donald was chosen to be a model while Dennis was passed over, because _ was exceptionally tall.", + "gold_answer": "Donald", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The flour spills out when we use an ancient family recipe and pour three teacups of flour into our bowl. The _ is too small.", + "gold_answer": "bowl", + "os_answer": "bowl", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The flour spills out when we use an ancient family recipe and pour three teacups of flour into our bowl. The _ is too big.", + "gold_answer": "teacup", + "os_answer": "quantity", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The pharmacy offered a product that could cure any disease, made of a new chemical and container, but the _ was not FDA approved.", + "gold_answer": "chemical", + "os_answer": "compound", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The pharmacy offered a product that could cure any disease, made of a new chemical and container, but the _ could hold few drugs.", + "gold_answer": "container", + "os_answer": "vial", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cracker that was given to me was worse than the cookie, because the _ was stale.", + "gold_answer": "cracker", + "os_answer": "former", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Aria tried to fix the fence in his garden by using new paint and wood, but the _ had termites.", + "gold_answer": "wood", + "os_answer": "fence", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia bought a plant for Natalie to put in her garden, so _ sent a thank you card.", + "gold_answer": "Natalie", + "os_answer": "Natalie", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "April gets stressed when she goes waterskiing more than swimming. The _ is filled with relaxation for her.", + "gold_answer": "swimming", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I handed the documents over to immigration with the passports, but they only accepted the passports, because the _ were complete.", + "gold_answer": "passports", + "os_answer": "documents", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia is a great nurse and Cynthia is a famous doctor, blood is normal to them, _ get assisted in operations.", + "gold_answer": "Cynthia", + "os_answer": "they", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Logan checked Samuel's garage to see if the car was there. It was missing so _ was gone.", + "gold_answer": "Samuel", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica was arrested for growing hemp by the police but not Sarah because _ fled during the field raid.", + "gold_answer": "Sarah", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jessica was arrested for growing hemp by the police but not Sarah because _ stayed during the field raid.", + "gold_answer": "Jessica", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "At the ballgame, Matthew was really thirsty and Aaron was not. _ took his beverage.", + "gold_answer": "Matthew", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer thought it was important to neuter a dog and Rachel did not because _ knew lots of animals become homeless.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joseph loved to smoke cigarettes while Derrick did not although _ hated to use a hookah.", + "gold_answer": "Joseph", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The woman didn't need an apprasial for the desk, but wondered how much the table was worth, because the _ appeared to be common.", + "gold_answer": "desk", + "os_answer": "veneer", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "John could not hear his alarm clock when he was sleeping with a headphone on his head because the _ is closer.", + "gold_answer": "headphone", + "os_answer": "eardrum", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John could not hear his alarm clock when he was sleeping with a headphone on his head because the _ is farther.", + "gold_answer": "clock", + "os_answer": "distance", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The teacher was helping us study carpentry instead of studying the cooking today. The _ was mandatory.", + "gold_answer": "carpentry", + "os_answer": "substitution", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Emily was nine months pregnant but Tanya was not pregnant at all. _ had a beautiful baby girl.", + "gold_answer": "Emily", + "os_answer": "Emily", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan ordered the salad with added avocado, but Randy passed, because _ wasn't ok with the $3 upcharge.", + "gold_answer": "Randy", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ryan ordered the salad with added avocado, but Randy passed, because _ was ok with the $3 upcharge.", + "gold_answer": "Ryan", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya was an adult while Samantha was young and still had room to grow , so _ gave her her old clothes.", + "gold_answer": "Tanya", + "os_answer": "Tanya", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Tanya was an adult while Samantha was young and still had room to grow , so _ took her old clothes.", + "gold_answer": "Samantha", + "os_answer": "Samantha", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The hiking group had more food than water, so they tried to conserve the _ .", + "gold_answer": "water", + "os_answer": "water", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The hiking group had less food than water, so they tried to conserve the _ .", + "gold_answer": "food", + "os_answer": "food", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Mary used the lotion instead of the cream because her skin was glowing when she used the _ .", + "gold_answer": "lotion", + "os_answer": "lotion", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "I wore the pants and the shirt together, but got more compliments on the _ because the shirt was uglier.", + "gold_answer": "pants", + "os_answer": "pants", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "John cannot listen to his music with the volume of the television his cousin is watching. The _ is quiet.", + "gold_answer": "music", + "os_answer": "volume", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The honey flows out slower from the bottle than the oil. The _ is viscous.", + "gold_answer": "honey", + "os_answer": "honey", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence volunteered to donate blood to help others, but Steven was unable to, since _ was healthy.", + "gold_answer": "Lawrence", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Reading poetry and rhymes was very entertaining for Derrick but boring for Logan, since _ was a mathematician.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Laura never feared anything like Erin because _ didn't have a very strong and very powerful mind.", + "gold_answer": "Erin", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Laura never feared anything like Erin because _ had a very strong and very powerful mind.", + "gold_answer": "Laura", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The farmer had more corn to harvest than yams because his cows liked eating the _ .", + "gold_answer": "yams", + "os_answer": "corn", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The farmer had more corn to harvest than yams because his cows hated eating the _ .", + "gold_answer": "corn", + "os_answer": "yams", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Adam asked Dennis to always remember to flush the toilet because _ doesn't flush it.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Christine knew how to make wings with better flavor than Maria, so _ waited for supper.", + "gold_answer": "Maria", + "os_answer": "everyone", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The shoddy bridge held secure for when the cars were getting passengers across the town to their destinations on time. However the _ were cautious.", + "gold_answer": "passengers", + "os_answer": "authorities", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The shoddy bridge held secure for when the cars were getting passengers across the town to their destinations on time. However the _ were racing.", + "gold_answer": "cars", + "os_answer": "trains", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Buying a swimming pool was great for Adam but not for Christopher because _ had a large back yard.", + "gold_answer": "Adam", + "os_answer": "Adam", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Ann liked using oil paint rather than acrylic on canvas because _ had a shortened working time.", + "gold_answer": "acrylic", + "os_answer": "acrylic", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Cynthia was happy to give Patricia the politics section of the newspaper, because _ had little interest in the election results.", + "gold_answer": "Cynthia", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Only the bag got melted and not the wood when they were inside the flame. The _ is soft.", + "gold_answer": "bag", + "os_answer": "plastic", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Only the bag got melted and not the wood when they were inside the flame. The _ is hard.", + "gold_answer": "wood", + "os_answer": "heat", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Carrie always arrived to work after Cynthia, as _ had a shorter driving commute in the mornings.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Amy left smears all over the surface after cleaning Kayla's sink, because _ didn't supervise very much.", + "gold_answer": "Kayla", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian could learn to swim with the right instruction, but it was hard to tell whether lifeguard Matthew was qualified to provide it, since _ had never swum before.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "I slowly poured the milk over my bowl of cereal until the _ was gone.", + "gold_answer": "milk", + "os_answer": "carton", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "They disagreed over what dog to adopt as Mary wanted a yorkie while Maria wanted a labrador. _ loved small dogs.", + "gold_answer": "Mary", + "os_answer": "Mary", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Devin got sick after eating the sausage, so he laid on the couch and later moved to the bed because the _ was more comfortable.", + "gold_answer": "bed", + "os_answer": "bed", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jennifer has more money than Amy, so _ became a homeowner at a young age.", + "gold_answer": "Jennifer", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Michael had a unhappy relationship and was jealous because Lawrence had a great one only to find out the reason was _ slacked in adhering to standard marriage advice.", + "gold_answer": "Michael", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The salesman would only feature nice things in the house like the pool but not the wiring because the _ was fine.", + "gold_answer": "pool", + "os_answer": "plumbing", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "The boxes were too heavy for Benjamin to carry alone, so he asked Matthew for help. After he said yes, _ felt regret.", + "gold_answer": "Matthew", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jasmine wanted to put the emerald on the ring but it would not fit. The _ was minuscule.", + "gold_answer": "ring", + "os_answer": "setting", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jasmine wanted to put the emerald on the ring and it would not fit. The _ was colossal.", + "gold_answer": "emerald", + "os_answer": "emerald", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "John was glad the file was kept in the box before the fire outbreak started because the _ is inflammable.", + "gold_answer": "box", + "os_answer": "paper", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Sandra tried out a new conditioner for her hair that makes it curly, but was upset with the results because the _ was too straight.", + "gold_answer": "hair", + "os_answer": "texture", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Sandra tried out a new conditioner for her hair that makes it curly, but was upset with the results because the _ was too mild.", + "gold_answer": "conditioner", + "os_answer": "effect", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia had to pay less tax than Cynthia because _ made more money in the year.", + "gold_answer": "Cynthia", + "os_answer": "Cynthia", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Patricia had to pay less tax than Cynthia because _ made less money in the year.", + "gold_answer": "Patricia", + "os_answer": "she", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Brian's plants are showing a lot more growth than Logan's, because _ used better fertilizer.", + "gold_answer": "Brian", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James always feel weak whenever he walked the length of his street so he decided walking just the length of the lawn. The _ is long.", + "gold_answer": "street", + "os_answer": "street", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "James always feel weak whenever he walked the length of his street so he decided walking just the length of the lawn. The _ is short.", + "gold_answer": "lawn", + "os_answer": "distance", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The living room was cleaner than the kitchen, because we spend leess time in in the _ .", + "gold_answer": "living room", + "os_answer": "living room", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The living room was cleaner than the kitchen, because we spend more time in the the _ .", + "gold_answer": "kitchen", + "os_answer": "kitchen", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The girl broke Leslie's heart but not Kenneth's because _ was never in love with her.", + "gold_answer": "Kenneth", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The girl broke Leslie's heart but not Kenneth's because _ used to be in love with her.", + "gold_answer": "Leslie", + "os_answer": "he", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Monica suspected that Rebecca had become an alcoholic, but _ predicted an intervention to address the problem.", + "gold_answer": "Rebecca", + "os_answer": "neither", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The skateboard got broken under the weight of the fat boy and his luggage. The _ is light.", + "gold_answer": "skateboard", + "os_answer": "skateboard", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Lawrence was always gaining weight while Dennis was losing it as _ liked to eat too little.", + "gold_answer": "Dennis", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The stone still thudded on the floor even though it was dropped on the pillow. The _ is too light.", + "gold_answer": "pillow", + "os_answer": "pillow", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel touches the cool looking bulletproof vest of Kayla due to _ being on an investigation.", + "gold_answer": "Kayla", + "os_answer": "them", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Rachel touches the cool looking bulletproof vest of Kayla due to _ being on a ride along.", + "gold_answer": "Rachel", + "os_answer": "her", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Remodeling the kitchen came naturally to Michael but not William because _ had experience being a carpenter's apprentice.", + "gold_answer": "Michael", + "os_answer": "Michael", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Selena wanted the hairdresser to cut her hair with a razor instead of a clipper, because the _ always gave an edgier look.", + "gold_answer": "razor", + "os_answer": "razor", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil cut trees down into lumber every year unlike Logan because _ lives in the city.", + "gold_answer": "Logan", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Neil cut trees down into lumber every year unlike Logan because _ lives out in the countryside.", + "gold_answer": "Neil", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "We couldn't extract the blood but got the plasma out, since the _ was reachable by the needle.", + "gold_answer": "plasma", + "os_answer": "serum", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Happiness was most important to Nick but money was most important to William. _ valued a good life.", + "gold_answer": "Nick", + "os_answer": "Both", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The sound of the foot was clearly audible from the street because the _ is quiet.", + "gold_answer": "street", + "os_answer": "neighborhood", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "To remove the stain he reached for soap first, then got up and got a bowl. The _ was close by.", + "gold_answer": "soap", + "os_answer": "faucet", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "To remove the stain he reached for soap first, then got up and got a bowl. The _ was far away.", + "gold_answer": "bowl", + "os_answer": "sink", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kyle asked Brett for some tips on healthy eating because _ has recently lost weight.", + "gold_answer": "Brett", + "os_answer": "Brett", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The architect tried to build the room inside the house but the _ was too large.", + "gold_answer": "room", + "os_answer": "dimensions", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The architect tried to build the room inside the house but the _ was too small.", + "gold_answer": "house", + "os_answer": "space", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "William was a huge animal rights activist but Randy couldn't care less so _ hated leather.", + "gold_answer": "William", + "os_answer": "William", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "William was a huge animal rights activist but Randy couldn't care less so _ loved leather.", + "gold_answer": "Randy", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The school needed a new auditorium and a new teacher's lounge. They built the _ first because it benefited the faculty more.", + "gold_answer": "teacher's lounge", + "os_answer": "lounge", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The cashier was trained that real $100 bills had sharp lines and counterfeit ones might be blurry, so she accepted the _ bill.", + "gold_answer": "sharp", + "os_answer": "crisp", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "The pressure of finding new jobs is harder than finding new apartments. The _ are high in numbers.", + "gold_answer": "apartments", + "os_answer": "applicants", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She couldn't wear the bra, unlike the shirt, because the _ was the right size.", + "gold_answer": "shirt", + "os_answer": "latter", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Maria wanted to play poker with Jennifer because _ was a better player and she won a lot of money.", + "gold_answer": "Maria", + "os_answer": "she", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": false, + "dataset": "Winogrande" + }, + { + "question": "Angela was a homebody while Amy loved to travel the world whenever they could. _ took a vacation to the beach over the summer.", + "gold_answer": "Amy", + "os_answer": "Amy", + "os_eval": "Correct", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Angela was a homebody while Amy loved to travel the world whenever they could. _ took a staycation at home over the summer.", + "gold_answer": "Angela", + "os_answer": "Angela", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Kenneth was really scared to have surgery but Neil was very brave about it. _ was under a lot of stress.", + "gold_answer": "Kenneth", + "os_answer": "Kenneth", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Joel went to Michael 's house and consumed a lot of alcohol, so _ had to ride back home as a passenger.", + "gold_answer": "Joel", + "os_answer": "he", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "At the new restaurant, Betty convinced Lindsey to try fried brussel sprouts. _ was relieved when she tried new things.", + "gold_answer": "Betty", + "os_answer": "She", + "os_eval": "Incorrect", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "Jane received a pet tortoise and an aquarium as a birthday gift, but the _ was too small.", + "gold_answer": "aquarium", + "os_answer": "aquarium", + "os_eval": "Correct", + "mcq_answer": "A", + "mcq_eval": true, + "dataset": "Winogrande" + }, + { + "question": "She chose the black car over the green car, because the _ has more brighter color.", + "gold_answer": "green car", + "os_answer": "former", + "os_eval": "Incorrect", + "mcq_answer": "B", + "mcq_eval": true, + "dataset": "Winogrande" + } +] \ No newline at end of file