| import os, tempfile, time |
| import gradio as gr |
| from tool.test import run_autotune_pipeline, DATA_DIR |
|
|
| |
|
|
def get_test_text(test_file, test_data_input):
    """Extract test-data text from an uploaded file, falling back to the textbox.

    Handles the several shapes a Gradio upload object may take: a file-like
    object exposing ``read()``, an object carrying a raw ``data`` payload
    (str or bytes), or an object whose ``name`` points at a real path on disk.
    If no file was uploaded (or none of the shapes match), the textbox value
    is returned, with ``None`` normalized to an empty string.
    """
    if test_file is None:
        return test_data_input or ""

    if hasattr(test_file, "read"):
        # File-like upload: bytes in, UTF-8 text out.
        return test_file.read().decode("utf-8")

    if hasattr(test_file, "data"):
        payload = test_file.data
        return payload if isinstance(payload, str) else payload.decode("utf-8")

    if hasattr(test_file, "name") and os.path.exists(test_file.name):
        # Upload persisted to a temp path on disk.
        with open(test_file.name, "r", encoding="utf-8") as fh:
            return fh.read()

    return test_data_input or ""
|
|
def generate_kernel(text_input, test_data_input, test_file, n_iters, progress=gr.Progress()):
    """Run the autotune pipeline and return the best kernel found so far.

    Args:
        text_input: NL description or baseline CUDA code from the textbox.
        test_data_input: test data typed into the textbox (variable names + data).
        test_file: Gradio file-upload object (or None); takes precedence over
            the textbox when both are provided.
        n_iters: maximum number of optimization iterations for the pipeline.
        progress: Gradio progress tracker (injected by Gradio per request).

    Returns:
        The best kernel source code as a string, or a warning message string
        when the required inputs are missing.
    """
    progress((0, n_iters), desc="Initializing...")

    # Gradio hands us None for an empty textbox; normalize before stripping
    # so we don't crash with AttributeError.
    if not (text_input or "").strip():
        return "⚠️ Please paste a description or baseline CUDA code."

    test_text = get_test_text(test_file, test_data_input)
    if not test_text.strip():
        return "⚠️ Test data required."

    best_code = ""
    for info in run_autotune_pipeline(
        input_code=text_input,
        test_data_input=test_text,
        test_file=None,  # file content is already folded into test_text
        bin_dir=DATA_DIR,
        max_iterations=int(n_iters),
    ):
        # The pipeline yields status dicts; "iteration" may be None for
        # status-only events that shouldn't advance the progress bar.
        if info["iteration"] is not None:
            progress((info["iteration"], n_iters), desc=info["message"])

        # Keep the most recent non-empty kernel as the best candidate.
        if info["code"]:
            best_code = info["code"]

    return best_code
|
|
|
|
| |
# ---------------------------------------------------------------------------
# Gradio UI layout and wiring.
# ---------------------------------------------------------------------------
with gr.Blocks(
    title="KernelPilot",
    theme=gr.themes.Soft(
        text_size="lg",
        font=[
            "system-ui",
            "-apple-system",
            "BlinkMacSystemFont",
            "Segoe UI",
            "Roboto",
            "Helvetica Neue",
            "Arial",
            "Noto Sans",
            "sans-serif"
        ])) as demo:
    gr.Markdown(
        """# 🚀 KernelPilot Optimizer
Enter a code, test data, then click **Generate** to obtain the optimized kernel function."""
    )

    with gr.Row():
        txt_input = gr.Textbox(
            label="📝 Input",
            lines=10,
            placeholder="Enter the code",
            scale=3
        )
        # NOTE(review): this value is passed to generate_kernel as n_iters /
        # max_iterations, so the "level" is really an iteration budget —
        # consider renaming for clarity.
        level = gr.Number(
            label="Optimization Level",  # fixed typo: was "Optimazation Level"
            minimum=1,
            maximum=5,
            value=5,
            step=1,
            scale=1
        )

    with gr.Row():
        test_data_input = gr.Textbox(
            label="Test Data Input",
            lines=10,
            placeholder="<number_of_test_cases>\n<number_of_variables>\n\n<variable_1_name>\n<variable_1_testcase_1_data>\n<variable_1_testcase_2_data>\n...\n<variable_1_testcase_N_data>\n\n<variable_2_name>\n<variable_2_testcase_1_data>\n...\n<variable_2_testcase_N_data>\n\n...",
            scale=2
        )
        test_file = gr.File(
            label="Upload Test Data (.txt)",
            file_types=["text"],
            scale=1
        )

    gen_btn = gr.Button("⚡ Generate")

    # Tuned kernels are CUDA C++, so use cpp syntax highlighting.
    kernel_output = gr.Code(
        label="🎯 Tuned CUDA Kernel",
        language="cpp"
    )

    gen_btn.click(
        fn=generate_kernel,
        inputs=[txt_input, test_data_input, test_file, level],
        outputs=[kernel_output],
        queue=True,
        show_progress=True,
        show_progress_on=kernel_output
    )
|
|
if __name__ == "__main__":
    # Serialize tuning jobs: one runs at a time, with up to 50 queued requests.
    demo.queue(default_concurrency_limit=1, max_size=50)
    # Bind to all interfaces so the app is reachable from outside a container.
    demo.launch(server_name="0.0.0.0", server_port=7860)