pipeline-parallelism-with-controllable-memory

Running

pipeline-parallelism-with-controllable-memory / app.py

Wan Xinyi

Add 1f1b

be3048f 11 months ago

6.53 kB

	import gradio as gr
	import auto_schedule
	import v_schedule
	import hand_schedule
	from PIL import Image
	from svg_event import render_manual_graph
	import pathlib
	def greet(name, is_morning, temperature):
	salutation = "Good morning" if is_morning else "Good evening"
	greeting = f"{salutation} {name}. It is {temperature} degrees today"
	celsius = (temperature - 32) * 5 / 9
	return greeting, round(celsius, 2)

	def percentage(x):
	return f"{x*100:.2f}%"

	def get_schedule_time(result):
	result = [
	list(filter(lambda x: x.type in {'F', 'B', 'W'}, r)) for r in result
	]
	time = max(
	[
	max([x.completion_time for x in stage]) - min([x.start_time for x in stage]) for stage in result
	]
	)
	return time

	img_queue = []
	def get_schedule_image(result, max_time):
	result = [
	list(filter(lambda x: x.type in {'F', 'B', 'W'}, r)) for r in result
	]
	svg = render_manual_graph(result, max_time, len(result[0]) <= 72)
	img_queue.append(svg)
	if len(img_queue) > 32:
	poped = img_queue.pop(0)
	pathlib.Path(poped).unlink()

	return pathlib.Path(svg)



	def calculate(p, m, f, b, w, c, mem):
	if mem < p:
	baseline_time=None
	baseline_bubble=None
	baseline_acceleration=None
	baseline_image=None
	else:
	baseline_result = hand_schedule.get_hand_schedule(p, m, f, b + w, 0, c)
	baseline_result = [
	list(filter(lambda x: x.type in {'F', 'B'}, r)) for r in baseline_result
	]
	baseline_time = get_schedule_time(baseline_result)
	baseline_bubble=percentage(baseline_time/(f+b+w)/m - 1)
	baseline_acceleration=percentage(0)


	zb_result = auto_schedule.auto_schedule(p, m, auto_schedule.GraphConfig(
	cost_f=f,
	cost_b=b,
	cost_w=w,
	cost_comm=c,
	max_mem=mem * 2,
	print_scaling=1000
	))

	zb_time=get_schedule_time(zb_result)

	zb_bubble=percentage(zb_time/(f+b+w)/m - 1)
	zb_acceleration=percentage(baseline_time/zb_time - 1) if baseline_time is not None else None

	if mem < p:
	zbv_time=None
	zbv_bubble=None
	zbv_acceleration=None
	zbv_image=None
	else:
	zbv_graph = v_schedule.PipelineGraph(
	n_stage=p,
	n_micro=m,
	f_cost=f/2,
	b_cost=b/2,
	w_cost=w/2,
	c_cost=c,
	f_mem=2,
	b_mem=-1,
	w_mem=-1,
	max_mem=mem * 4,
	)
	zbv_result = zbv_graph.get_v_schedule()

	zbv_time = get_schedule_time(zbv_result)
	zbv_bubble=percentage(zbv_time/(f+b+w)/m - 1)
	zbv_acceleration=percentage(baseline_time/zbv_time - 1) if baseline_time is not None else None

	max_time = max([baseline_time, zb_time, zbv_time])
	print(max_time)
	baseline_image = get_schedule_image(baseline_result, max_time)
	zb_image = get_schedule_image(zb_result, max_time)
	zbv_image = get_schedule_image(zbv_result, max_time)

	return [baseline_time, baseline_bubble, baseline_acceleration, baseline_image, zb_time, zb_bubble, zb_acceleration, zb_image, zbv_time, zbv_bubble, zbv_acceleration, zbv_image]

	with gr.Blocks() as demo:
	gr.Markdown(open("description1.md").read())
	gr.Markdown("# Pipeline Scheduler Playground")
	with gr.Row():
	with gr.Column(scale=1):
	with gr.Group():
	gr.Markdown("Basic Parameters")
	with gr.Row():
	p=gr.Number(label="Number of stages (p)", value=4, interactive=True, precision=0)
	m=gr.Number(label="Number of microbatches (m)", value=12, interactive=True, precision=0)
	with gr.Column(scale=2):
	with gr.Group():
	gr.Markdown("Costs. All costs are used as integers. For ZBV schedules, this is the time of two virtual stages on a stage combined.")
	with gr.Row():
	f=gr.Number(label="Time of F", value=100, interactive=True, precision=0)
	b=gr.Number(label="Time of B", value=110, interactive=True, precision=0)
	w=gr.Number(label="Time of W", value=90, interactive=True, precision=0)
	c=gr.Number(label="Time of one P2P communication", value=5, interactive=True, precision=0)
	with gr.Group():
	gr.Markdown("Activation memory limit.")
	def update_mem(p, s, mem):
	print("update")
	if s=="custom":
	return mem
	return int(p*float(s.split('p')[0]) + 0.5)
	memsel=gr.Radio(choices=["1p (Same as 1F1B)", "1.5p", "2p", "3p", "custom"], value="1p (Same as 1F1B)")
	mem=gr.Number(label="Custom memory limit in terms of pending F on a stage. For ZBV schedules, this is relative to two virtual stages on a stage combined.", value=p.value, interactive=True, precision=0)
	memsel.change(update_mem, inputs=[p, memsel, mem], outputs=mem)
	p.change(update_mem, inputs=[p, memsel, mem], outputs=mem)

	button=gr.Button("Calculate", variant="primary")

	with gr.Group():
	gr.Markdown("1F1B")
	with gr.Row():
	with gr.Column(scale=1):
	baseline_time=gr.Textbox("", label="Longest Stage Time")
	baseline_bubble=gr.Textbox("", label="Bubble Rate. Calculated as (1 - longest stage time/(F+B+W)/m).")
	baseline_acceleration=gr.Textbox("", label="Acceleration compared to 1F1B")
	with gr.Column(scale=4):
	baseline_image=gr.Image(None, interactive=False, label="Schedule Image")

	with gr.Group():
	gr.Markdown("Zero Bubble Schedule")
	with gr.Row():
	with gr.Column(scale=1):
	zb_time=gr.Textbox("", label="Longest Stage Time")
	zb_bubble=gr.Textbox("", label="Bubble Rate. Calculated as (1 - longest stage time/(F+B+W)/m).")
	zb_acceleration=gr.Textbox("", label="Acceleration compared to 1F1B")
	with gr.Column(scale=4):
	zb_image=gr.Image(None, interactive=False, label="Schedule Image")
	with gr.Group():
	gr.Markdown("Zero Bubble V Schedule (ZBV)")
	with gr.Row():
	with gr.Column(scale=1):
	zbv_time=gr.Textbox("", label="Longest Stage Time")
	zbv_bubble=gr.Textbox("", label="Bubble Rate. Calculated as (1 - longest stage time/(F+B+W)/m).")
	zbv_acceleration=gr.Textbox("", label="Acceleration compared to 1F1B")
	with gr.Column(scale=4):
	zbv_image=gr.Image(None, interactive=False, label="Schedule Image")
	button.click(calculate, inputs=[p, m, f, b, w, c, mem], outputs=[baseline_time, baseline_bubble, baseline_acceleration, baseline_image, zb_time, zb_bubble, zb_acceleration, zb_image, zbv_time, zbv_bubble, zbv_acceleration, zbv_image])
	gr.Markdown(open("description2.md").read())
	demo.launch()