Spaces:
Running
on
Zero
Running
on
Zero
File size: 3,893 Bytes
ab96ee1 17b23e6 f9b65c3 17b23e6 fb0e46a 8f48aeb 17b23e6 ab96ee1 17b23e6 8f48aeb 8f262ce 17b23e6 8f48aeb 17b23e6 8f48aeb 17b23e6 8f48aeb 17b23e6 8f48aeb f9b65c3 8f48aeb f9b65c3 17b23e6 8f48aeb |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 |
# 配置环境
import subprocess
# 克隆GitHub仓库
subprocess.run(["git", "clone", "https://github.com/hiyouga/LLaMA-Factory.git"], check=True)
# 切换到仓库目录
import os
os.chdir("LLaMA-Factory")
# 列出目录内容
subprocess.run(["ls"], check=True)
# 安装unsloth
subprocess.run(["pip", "install", "unsloth[colab-new]@git+https://github.com/unslothai/unsloth.git"], check=True)
# 安装xformers
subprocess.run(["pip", "install", "-U", "xformers==0.0.25"], check=True)
# 安装当前目录下的依赖
subprocess.run(["pip", "install", ".[torch,bitsandbytes]"], check=True)
import gradio as gr
from llamafactory.chat import ChatModel
from llamafactory.extras.misc import torch_gc
import re
import spaces
from threading import Thread
def split_into_sentences(text):
sentence_endings = re.compile(r'(?<!\w\.\w.)(?<![A-Z][a-z]\.)(?<=\.|\?|\!)\s')
sentences = sentence_endings.split(text)
return [sentence.strip() for sentence in sentences if sentence]
@spaces.GPU(duration=120)
def process_sentence(sentence, index, results, messages, progress, total_sentences):
messages.append({"role": "user", "content": sentence})
sentence_response = ""
for new_text in chat_model.stream_chat(messages, temperature=0.7, top_p=0.9, top_k=50, max_new_tokens=300):
sentence_response += new_text.strip()
category = sentence_response.strip().lower().replace(' ', '_')
if category != "fair":
results[index] = (sentence, category)
else:
results[index] = (sentence, "fair")
messages.append({"role": "assistant", "content": sentence_response})
torch_gc()
progress((index + 1) / total_sentences)
@spaces.GPU(duration=120)
def process_paragraph(paragraph, progress=gr.Progress()):
sentences = split_into_sentences(paragraph)
results = [None] * len(sentences)
total_sentences = len(sentences)
threads = []
for i, sentence in enumerate(sentences):
thread = Thread(target=process_sentence, args=(sentence, i, results, messages.copy(), progress, total_sentences))
threads.append(thread)
thread.start()
for thread in threads:
thread.join()
return results
args = dict(
model_name_or_path="princeton-nlp/Llama-3-Instruct-8B-SimPO", # 使用量化的 Llama-3-8B-Instruct 模型
# model_name_or_path="StevenChen16/llama3-8b-compliance-review",
# adapter_name_or_path="StevenChen16/llama3-8b-compliance-review-adapter", # 加载保存的 LoRA 适配器
template="llama3", # 与训练时使用的模板相同
finetuning_type="lora", # 与训练时使用的微调类型相同
quantization_bit=8, # 加载 8-bit 量化模型
use_unsloth=True, # 使用 UnslothAI 的 LoRA 优化以加速生成
)
chat_model = ChatModel(args)
messages = []
# 定义类型到颜色的映射
label_to_color = {
"fair": "green",
"limitation_of_liability": "red",
"unilateral_termination": "orange",
"unilateral_change": "yellow",
"content_removal": "purple",
"contract_by_using": "blue",
"choice_of_law": "cyan",
"jurisdiction": "magenta",
"arbitration": "brown",
}
with gr.Blocks() as demo:
with gr.Row(equal_height=True):
with gr.Column():
input_text = gr.Textbox(label="Input Paragraph", lines=10, placeholder="Enter the paragraph here...")
btn = gr.Button("Process")
with gr.Column():
output = gr.HighlightedText(label="Processed Paragraph", color_map=label_to_color)
progress = gr.Progress()
def on_click(paragraph):
results = process_paragraph(paragraph, progress=progress)
return results
btn.click(on_click, inputs=input_text, outputs=[output])
demo.launch(share=True)
|