Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -300,26 +300,28 @@ def generate_beams(start_sentence, scores, length_penalty, decoded_sequences, be
|
|
300 |
token_scores,
|
301 |
) = ([], [], [], [], [], [])
|
302 |
|
303 |
-
|
|
|
304 |
current_beam = beam_trees[beam_ix]
|
305 |
|
306 |
# skip if the beam is already final
|
307 |
if current_beam.is_final:
|
308 |
continue
|
309 |
-
|
310 |
# Get top cumulative scores for the current beam
|
311 |
current_top_token_indexes = list(
|
312 |
-
np.array(scores[step][
|
313 |
)
|
314 |
top_token_indexes += current_top_token_indexes
|
315 |
-
token_scores += list(np.array(scores[step][
|
316 |
top_cumulative_scores += list(
|
317 |
-
np.array(scores[step][
|
318 |
+ current_beam.cumulative_score
|
319 |
)
|
320 |
beam_indexes += [beam_ix] * n_beams
|
321 |
current_sequence += [beam_trees[beam_ix].current_sequence] * n_beams
|
322 |
top_tokens += [tokenizer.decode([el]) for el in current_top_token_indexes]
|
|
|
323 |
|
324 |
top_df = pd.DataFrame.from_dict(
|
325 |
{
|
|
|
300 |
token_scores,
|
301 |
) = ([], [], [], [], [], [])
|
302 |
|
303 |
+
score_idx = 0
|
304 |
+
for beam_ix in range(len(beam_trees)):
|
305 |
current_beam = beam_trees[beam_ix]
|
306 |
|
307 |
# skip if the beam is already final
|
308 |
if current_beam.is_final:
|
309 |
continue
|
310 |
+
|
311 |
# Get top cumulative scores for the current beam
|
312 |
current_top_token_indexes = list(
|
313 |
+
np.array(scores[step][score_idx].argsort()[-n_beams:])[::-1]
|
314 |
)
|
315 |
top_token_indexes += current_top_token_indexes
|
316 |
+
token_scores += list(np.array(scores[step][score_idx][current_top_token_indexes]))
|
317 |
top_cumulative_scores += list(
|
318 |
+
np.array(scores[step][score_idx][current_top_token_indexes])
|
319 |
+ current_beam.cumulative_score
|
320 |
)
|
321 |
beam_indexes += [beam_ix] * n_beams
|
322 |
current_sequence += [beam_trees[beam_ix].current_sequence] * n_beams
|
323 |
top_tokens += [tokenizer.decode([el]) for el in current_top_token_indexes]
|
324 |
+
score_idx += 1
|
325 |
|
326 |
top_df = pd.DataFrame.from_dict(
|
327 |
{
|