Spaces: Running on Zero
test
Browse files
- generate.py +10 -5
- gradio_app.py +2 -2
generate.py
CHANGED
@@ -38,11 +38,11 @@ sampler.set_max_repeats(empty_tokens, 1)
|
|
38 |
|
39 |
class Sample(BaseModel):
|
40 |
# We use get_samples_generator() to replace the placeholder with the requested fields
|
41 |
-
|
42 |
-
|
43 |
-
|
44 |
-
|
45 |
-
|
46 |
# PS: don't use StringConstraints with max_length here since it creates a fsm that is too big
|
47 |
|
48 |
|
@@ -110,6 +110,11 @@ def stream_file(filename: str, prompt: str, columns: list[str], seed: int, size:
|
|
110 |
columns.append(column)
|
111 |
logger.warning(f"stream_response({filename=}, {prompt=}, {columns=}) Generating columns... DONE (total={time.time() - _start:.02f}s)")
|
112 |
|
|
|
|
|
|
|
|
|
|
|
113 |
logger.warning(f"stream_response({filename=}, {prompt=}, {columns=}) - Generating JSON regex guide...")
|
114 |
samples_generator = get_samples_generator(new_fields=columns)
|
115 |
logger.warning(f"stream_response({filename=}, {prompt=}, {columns=}) - Generating JSON regex guide... DONE (total={time.time() - _start:.02f}s)")
|
|
|
38 |
|
39 |
class Sample(BaseModel):
|
40 |
# We use get_samples_generator() to replace the placeholder with the requested fields
|
41 |
+
ABCDabcd12: str
|
42 |
+
EFGHefgh34: str
|
43 |
+
IJKLijkl56: str
|
44 |
+
MNOPmnop78: str
|
45 |
+
QRSTqrst90: str
|
46 |
# PS: don't use StringConstraints with max_length here since it creates a fsm that is too big
|
47 |
|
48 |
|
|
|
110 |
columns.append(column)
|
111 |
logger.warning(f"stream_response({filename=}, {prompt=}, {columns=}) Generating columns... DONE (total={time.time() - _start:.02f}s)")
|
112 |
|
113 |
+
columns = [
|
114 |
+
tokenizer.decode(tokenizer.encode(column, add_special_tokens=False)[:len(orig_field)], skip_special_tokens=True)
|
115 |
+
for column, orig_field in zip(columns, Sample.model_fields)
|
116 |
+
]
|
117 |
+
|
118 |
logger.warning(f"stream_response({filename=}, {prompt=}, {columns=}) - Generating JSON regex guide...")
|
119 |
samples_generator = get_samples_generator(new_fields=columns)
|
120 |
logger.warning(f"stream_response({filename=}, {prompt=}, {columns=}) - Generating JSON regex guide... DONE (total={time.time() - _start:.02f}s)")
|
gradio_app.py
CHANGED
@@ -27,7 +27,7 @@ def stream_output(filename: str):
|
|
27 |
state_msg = (
|
28 |
f"✅ Done generating {size} samples in {time.time() - start_time:.2f}s"
|
29 |
if i + 1 == size else
|
30 |
-
f"⚙️ Generating... [{i}/{size}]"
|
31 |
)
|
32 |
yield df, "```json\n" + content + "\n```", state_msg
|
33 |
|
@@ -45,7 +45,7 @@ def test(filename: str):
|
|
45 |
state_msg = (
|
46 |
f"✅ Done generating {size} samples in {time.time() - start_time:.2f}s"
|
47 |
if i + 1 == size else
|
48 |
-
f"⚙️ Generating... [{i}/{size}]"
|
49 |
)
|
50 |
yield df, "```json\n" + content + "\n```", state_msg
|
51 |
time.sleep(0.1)
|
|
|
27 |
state_msg = (
|
28 |
f"✅ Done generating {size} samples in {time.time() - start_time:.2f}s"
|
29 |
if i + 1 == size else
|
30 |
+
f"⚙️ Generating... [{i + 1}/{size}]"
|
31 |
)
|
32 |
yield df, "```json\n" + content + "\n```", state_msg
|
33 |
|
|
|
45 |
state_msg = (
|
46 |
f"✅ Done generating {size} samples in {time.time() - start_time:.2f}s"
|
47 |
if i + 1 == size else
|
48 |
+
f"⚙️ Generating... [{i + 1}/{size}]"
|
49 |
)
|
50 |
yield df, "```json\n" + content + "\n```", state_msg
|
51 |
time.sleep(0.1)
|