Spaces:
Sleeping
Sleeping
File size: 6,269 Bytes
b222ec5 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 |
import torch, torchvision, clip, time, math
import matplotlib.pyplot as plt
from model import encoder_image
from sentence import *
##### Get infos & cool facts to display during loadings
with open("infos.txt") as file:
infos = file.readlines()
##### Get css
with open("style.css") as style:
css = "<style>"+ ''.join(style.readlines())+"</style>"
##### 'DIFFICULTY SWITCH' EVENT
def switch_difficulty(var_dict, html_loading):
var_dict["difficulty"] = 1 - var_dict["difficulty"]
title, infos, new_value = loading(html_loading)
return var_dict, title, infos, new_value
##### 'LOADING' EVENT
def loading(html_loading=None):
### This is just to make sure the content changes, which triggers the .change event which, itself, will launch a new game
if html_loading == "<div style=\"display:none;\">0</div>": new_value = "<div style=\"display:none;\">1</div>"
else: new_value = "<div style=\"display:none;\">0</div>"
### Get a random tip
info = np.random.choice(infos)
### Return TITLE, TIP TEXT, NEW HTML CONTENT, CANVAS IMG
return "<h1 id=\"loading\">⌛Loading...</h1>",css+"<div id=\"prediction\"><p id=\"infos\">"+info+"</p></div>",new_value
##### 'NEW GAME' EVENT
def new_game(var_dict,img=None,first_game=False):
print("\n----------Launching new game!")
if None is not var_dict: difficulty = var_dict["difficulty"]
else: difficulty = 1
var_dict = {
"start_time": time.time(),
"total_time": 0,
"found_words": [],
"target_sentence": "",
"guessed_sentence": "",
"parts": [],
"win": 0,
"step": 0,
"prev_steps": [],
"prev_norm": float("inf"),
"tip": "",
"loading": False,
"revertedState": False,
"difficulty": difficulty
}
target = iniSentence(var_dict,first_game=first_game)
### Return TITLE, PREDICTION TEXT, CANVAS IMG, VAR DICT
return "<h1>"+target+"</h1>", getHTML(var_dict,""), None, var_dict
##### PREDICTION TEXT HTML
def getHTML(var_dict,text,win=0):
### Which parts of the sentence have been guessed?
guessed, not_guessed = "", ""
text_words = text.split(" ")
target_words = var_dict["target_sentence"].split(" ")
for i,word in enumerate(text_words):
if i < len(target_words) and word == target_words[i]: guessed += word + " "
else: not_guessed += word + " "
### Display prediction
if win!=1:
html = "<p><span>"+guessed+"</span>"+not_guessed+"</p>"
else:
minutes, seconds = math.floor(var_dict["total_time"]/60), var_dict["total_time"]%60
if minutes < 1 and seconds <= 30: emoji = "🏆😍"
elif minutes < 1: emoji = "😄"
elif minutes < 2: emoji = "😐"
elif minutes < 3: emoji = "😓"
else: emoji = "😱"
time_str = "Total time: "+ ((str(minutes)+"m") if minutes>0 else "") + str(seconds)+"s "+emoji
html = "<p id=\"win\"><span>"+guessed+"</span><br>"+time_str+"</p>"
return css+"<div id=\"prediction\">"+html+"</div>"
##### DRAWING PROCESSING & GAME STATE UPDATE
def process_img(var_dict,img,title):
# Makes sure that start_time is updates for the first game
if var_dict["start_time"] == -1:
var_dict["start_time"] = time.time()
if (None is img):
return getHTML(var_dict,"",win=0),"<h1>"+var_dict["target_sentence"]+"</h1>",var_dict
elif (None is not img) and (var_dict["win"] != 1):
print("-----Processing...")
part = var_dict["parts"][var_dict["step"]]
image = torch.tensor(img).float() / 255
### Detect Cancel event
norm = torch.norm(image)
if norm > var_dict["prev_norm"]:
print("---Cancel Event")
prevState(var_dict)
var_dict["prev_norm"] = norm
### Image preprocessing --> shape (224,224)
max_edge = max(image.shape[0],image.shape[1])
min_edge = min(image.shape[0],image.shape[1])
square_image = torch.ones(max_edge,max_edge)
pad = math.floor((max_edge - min_edge)/2)
if max_edge == image.shape[1]: square_image[pad:pad+min_edge,:] = image
else: square_image[:,pad:pad+min_edge] = image
image = torchvision.transforms.Resize((224,224))(square_image.unsqueeze(0)).repeat(1,3,1,1)
### Computing cosine similarities (drawing<->text embeddings)
with torch.no_grad():
image_features = encoder_image(image)[0]
text_features = torch.tensor(part["embeddings"])
image_features /= image_features.norm()
similarities = torch.matmul(text_features,image_features)
probs = torch.nn.Softmax(dim=-1)(similarities)
### Sort indexes by similarity
idxs = np.argsort(similarities)
### Use top-3 preditions
top3_idxs = idxs[-3:]
classes = part["classes"]
preds = [classes[idx] for idx in top3_idxs]
print(f"Top-3 Predictions: {preds}")
print(f"Top-3 Probabilities: {probs[top3_idxs]}")
### Check if win (-1: bad guess, 0:progress=guessed sentence part, 1:win=guessed whole sentence)
win = updateState(var_dict, preds)
if win == -1:
text = preds[-1]
elif win == 0:
part = var_dict["parts"][var_dict["step"]]
text = var_dict["guessed_sentence"] + link_text(part,"something") + " something"
elif win == 1:
text = var_dict["guessed_sentence"]
if var_dict["total_time"] == 0: var_dict["total_time"] = round(time.time() - var_dict["start_time"])
return getHTML(var_dict,text,var_dict["win"]),"<h1>"+var_dict["target_sentence"]+"</h1>",var_dict
else:
return getHTML(var_dict,var_dict["target_sentence"],win=1),"<h1>"+var_dict["target_sentence"]+"</h1>",var_dict
|