Spaces:

marianvd-01
/

transformer-visualizer

Sleeping

App Files Files Community

transformer-visualizer / app.py

marianvd-01

Update app.py

9d0184c verified 8 months ago

raw

history blame contribute delete

3.1 kB

	# 🧠 Summary of Features:
	# 🔽 Dropdown to choose from 7 prebuilt models
	# 🔄 Updates attention layer & head slider limits based on the model
	# 📊 Visualizes attention maps for selected head/layer
	# 🧩 Tokenized words preview
	# 📉 Embeddings reduced to 2D using PCA
	# 📦 Model size bar chart across models
	# 📋 Full model config info in JSON viewer

	import gradio as gr
	from model_utils import MODEL_OPTIONS, load_model, get_model_info
	from visualize import (
	visualize_attention,
	show_tokenization,
	show_embeddings,
	compare_model_sizes,
	)

	# Initial load
	DEFAULT_MODEL_NAME = list(MODEL_OPTIONS.values())[0]
	tokenizer, model = load_model(DEFAULT_MODEL_NAME)

	# Shared state
	current_tokenizer = tokenizer
	current_model = model


	def update_model(selected_model_name):
	global current_tokenizer, current_model
	model_id = MODEL_OPTIONS[selected_model_name]
	current_tokenizer, current_model = load_model(model_id)
	info = get_model_info(current_model)

	# Update layer/head sliders based on model
	num_layers = info.get("Number of Layers", 1)
	num_heads = info.get("Number of Attention Heads", 1)

	return (
	info,
	gr.update(maximum=num_layers - 1, value=0),
	gr.update(maximum=num_heads - 1, value=0),
	)


	def run_all_visualizations(text, layer, head):
	attention_fig = visualize_attention(current_tokenizer, current_model, text, layer, head)
	token_fig = show_tokenization(current_tokenizer, text)
	embedding_fig = show_embeddings(current_tokenizer, current_model, text)
	return attention_fig, token_fig, embedding_fig


	# UI
	with gr.Blocks() as demo:
	gr.Markdown("## 🔍 Transformer Explorer")
	gr.Markdown("Explore attention, tokenization, and embedding visualizations for various transformer models.")

	with gr.Row():
	model_dropdown = gr.Dropdown(
	label="Choose a model",
	choices=list(MODEL_OPTIONS.keys()),
	value=list(MODEL_OPTIONS.keys())[0],
	)
	model_info = gr.JSON(label="Model Info")

	with gr.Row():
	text_input = gr.Textbox(label="Enter text", value="The quick brown fox jumps over the lazy dog.")
	layer_slider = gr.Slider(label="Layer", minimum=0, maximum=11, step=1, value=0)
	head_slider = gr.Slider(label="Head", minimum=0, maximum=11, step=1, value=0)

	run_button = gr.Button("Run Visualizations")

	with gr.Tab("📊 Attention"):
	attention_plot = gr.Plot()

	with gr.Tab("🧩 Tokenization"):
	token_plot = gr.Plot()

	with gr.Tab("📉 Embeddings"):
	embedding_plot = gr.Plot()

	with gr.Tab("📦 Model Size Comparison"):
	model_compare_plot = gr.Plot(value=compare_model_sizes())

	# Event binding
	model_dropdown.change(fn=update_model, inputs=[model_dropdown], outputs=[model_info, layer_slider, head_slider])
	run_button.click(
	fn=run_all_visualizations,
	inputs=[text_input, layer_slider, head_slider],
	outputs=[attention_plot, token_plot, embedding_plot],
	)


	if __name__ == "__main__":
	demo.launch()