Spaces:
Running
on
A100
Running
on
A100
citation section
Browse files
app.py
CHANGED
@@ -41,10 +41,6 @@ cli = "mergekit-yaml config.yaml merge --copy-tokenizer" + (
|
|
41 |
" --cuda --low-cpu-memory" if has_gpu else " --allow-crimes --out-shard-size 1B --lazy-unpickle"
|
42 |
)
|
43 |
|
44 |
-
## This Space is heavily inspired by LazyMergeKit by Maxime Labonne
|
45 |
-
## https://colab.research.google.com/drive/1obulZ1ROXHjYLn6PPZJwRR6GzgQogxxb
|
46 |
-
|
47 |
-
|
48 |
MARKDOWN_DESCRIPTION = """
|
49 |
# mergekit-gui
|
50 |
|
@@ -84,6 +80,22 @@ A quick overview of the currently supported merge methods:
|
|
84 |
| Passthrough | `passthrough` | ❌ | ❌ |
|
85 |
| [Model Stock](https://arxiv.org/abs/2403.19522) | `model_stock` | ✅ | ✅ |
|
86 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
87 |
"""
|
88 |
|
89 |
examples = [[str(f)] for f in pathlib.Path("examples").glob("*.yml")]
|
|
|
41 |
" --cuda --low-cpu-memory" if has_gpu else " --allow-crimes --out-shard-size 1B --lazy-unpickle"
|
42 |
)
|
43 |
|
|
|
|
|
|
|
|
|
44 |
MARKDOWN_DESCRIPTION = """
|
45 |
# mergekit-gui
|
46 |
|
|
|
80 |
| Passthrough | `passthrough` | ❌ | ❌ |
|
81 |
| [Model Stock](https://arxiv.org/abs/2403.19522) | `model_stock` | ✅ | ✅ |
|
82 |
|
83 |
+
|
84 |
+
## Citation
|
85 |
+
|
86 |
+
This GUI is powered by [Arcee's MergeKit](https://arxiv.org/abs/2403.13257).
|
87 |
+
If you use it in your research, please cite the following paper:
|
88 |
+
|
89 |
+
```
|
90 |
+
@article{goddard2024arcee,
|
91 |
+
title={Arcee's MergeKit: A Toolkit for Merging Large Language Models},
|
92 |
+
author={Goddard, Charles and Siriwardhana, Shamane and Ehghaghi, Malikeh and Meyers, Luke and Karpukhin, Vlad and Benedict, Brian and McQuade, Mark and Solawetz, Jacob},
|
93 |
+
journal={arXiv preprint arXiv:2403.13257},
|
94 |
+
year={2024}
|
95 |
+
}
|
96 |
+
```
|
97 |
+
|
98 |
+
This Space is heavily inspired by LazyMergeKit by Maxime Labonne (see [Colab](https://colab.research.google.com/drive/1obulZ1ROXHjYLn6PPZJwRR6GzgQogxxb)).
|
99 |
"""
|
100 |
|
101 |
examples = [[str(f)] for f in pathlib.Path("examples").glob("*.yml")]
|