import gradio as gr
from train import TrainingLoop
from scipy.special import softmax
import numpy as np
# Global variables for training and data storage
train = None
frames, attributions = None, None
# Lunar Lander environment state feature mapping
LUNAR_LANDER_FEATURES = {
0: "X-coordinate",
1: "Y-coordinate",
2: "Linear velocity in the X-axis",
3: "Linear velocity in the Y-axis",
4: "Angle",
5: "Angular velocity",
6: "Left leg touched the floor",
7: "Right leg touched the floor"
}
def create_training_loop(env_spec):
"""Initialize the training loop with the specified environment."""
global train
train = TrainingLoop(env_spec=env_spec)
train.create_agent()
return train.env.spec
def display_softmax(inputs):
"""Convert raw attribution values to softmax probabilities for visualization."""
inputs = np.array(inputs)
probabilities = softmax(inputs)
softmax_dict = {
name: float(prob)
for name, prob in zip(LUNAR_LANDER_FEATURES.values(), probabilities)
}
return softmax_dict
def generate_output(num_iterations, option):
    """Generate attribution explanations for the trained agent."""
    global frames, attributions
    frames, attributions = train.explain_trained(
        num_iterations=num_iterations,
        option=option
    )
    # Assigning slider.maximum directly never reaches the frontend; return a
    # component update instead (the click handler below wires this function's
    # output to the slider).
    return gr.update(maximum=len(frames) - 1, value=0)
def get_frame_and_attribution(slider_value):
    """Get frame and attribution data for the selected timestep."""
    global frames, attributions
    if frames is None:
        # Nothing generated yet: the live interface fires before the first
        # "GENERATE ATTRIBUTIONS" click, so return an empty placeholder.
        return np.zeros((400, 600, 3), dtype=np.uint8), {}
    slider_value = min(slider_value, len(frames) - 1)
    frame = frames[slider_value]
    attribution = display_softmax(attributions[slider_value])
    return frame, attribution
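
# Illustrative only: a minimal sketch of how per-state attributions could be
# computed with Captum's IntegratedGradients. The app's real logic lives in
# train.explain_trained (train.py); `actor` here is a hypothetical policy
# network mapping an 8-feature state to a continuous action vector.
def _integrated_gradients_sketch(actor, state):
    import torch
    from captum.attr import IntegratedGradients

    ig = IntegratedGradients(actor)
    inputs = torch.as_tensor(state, dtype=torch.float32).unsqueeze(0)
    # The "Torch Tensor of 0's" baseline option; the "Running Average" option
    # would instead average states observed over the baseline iterations.
    baseline = torch.zeros_like(inputs)
    # Attribute the first action dimension to each of the 8 state features.
    attrs = ig.attribute(inputs, baselines=baseline, target=0)
    return attrs.squeeze(0).detach().numpy()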
with gr.Blocks(
title="Deep RL Explainability",
theme=gr.themes.Soft(),
css="""
.gradio-container {
max-width: 1200px !important;
}
.tab-nav {
background: linear-gradient(90deg, #667eea 0%, #764ba2 100%);
}
"""
) as demo:
# Header section
gr.Markdown("""
    # 🚀 Deep Reinforcement Learning Explainability
**Exploring AI decision-making through Integrated Gradients in RL environments**
---
""")
# Introduction section
gr.Markdown("""
    ## 📖 How This Works
    This application demonstrates **[Integrated Gradients](https://captum.ai/docs/extension/integrated_gradients)**
    applied to Deep Reinforcement Learning. It uses PyTorch's Captum library for interpretability
    and Gymnasium for the continuous Lunar Lander environment.
    ### 🧠 Training Algorithm: [DDPG](https://arxiv.org/abs/1509.02971)
The agent is trained using **Deep Deterministic Policy Gradients** and achieves an average reward
of **260.8** per episode (successful landings).
    ### 🎯 How to Use This Space
1. **Select Environment**: Choose the Lunar Lander environment
2. **Choose Baseline**: Select between zero tensor or running average baseline
3. **Generate Attributions**: Click "ATTRIBUTE" and wait ~20-25 seconds
4. **Explore Results**: Use the slider to examine attributions at different timesteps
The attributions are normalized using Softmax to provide interpretable probability distributions.
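    For example, the raw attribution vector is passed through `scipy.special.softmax`
    (hypothetical values shown):
    ```python
    from scipy.special import softmax
    softmax([2.0, 1.0, 0.5, 0.1, 0.0, -0.5, -1.0, -2.0])
    # ≈ [0.49, 0.18, 0.11, 0.07, 0.07, 0.04, 0.02, 0.01]  -- sums to 1
    ```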
""")
# Main interface tab
with gr.Tab("๐Ÿ” Attribution Analysis", elem_id="attribution-tab"):
# Environment setup
gr.Markdown("### ๐ŸŒ™ Environment Setup")
env_spec = gr.Dropdown(
choices=["LunarLander-v2"],
type="value",
multiselect=False,
label="Environment Specification",
value="LunarLander-v2",
info="Select the RL environment to analyze"
)
env_interface = gr.Interface(
title="Initialize Environment",
allow_flagging="never",
inputs=env_spec,
fn=create_training_loop,
outputs=gr.JSON(label="Environment Spec"),
description="Click to initialize the training environment"
)
# Attribution controls
gr.Markdown("### โš™๏ธ Attribution Configuration")
with gr.Row():
with gr.Column(scale=1):
                option = gr.Dropdown(
                    choices=["Torch Tensor of 0's", "Running Average"],
                    type="index",
                    value="Torch Tensor of 0's",
                    label="Baseline Method",
                    info="Choose the baseline for Integrated Gradients"
                )
with gr.Column(scale=1):
baselines = gr.Slider(
label="Number of Baseline Iterations",
interactive=True,
minimum=0,
maximum=100,
value=10,
step=5,
info="Number of baseline inputs to collect for averaging"
)
# Generate button
generate_btn = gr.Button(
"๐Ÿš€ GENERATE ATTRIBUTIONS",
variant="primary",
size="lg"
)
# Results section
gr.Markdown("### ๐Ÿ“Š Results Visualization")
slider = gr.Slider(
label="๐ŸŽฌ Key Frame Selector",
minimum=0,
maximum=1000,
step=1,
value=0,
info="Navigate through different timesteps to see attributions"
)
        # Wire the button after the slider exists so the callback's gr.update
        # can resize the slider's range to match the generated frames.
        generate_btn.click(
            fn=generate_output,
            inputs=[baselines, option],
            outputs=[slider]
        )
results_interface = gr.Interface(
fn=get_frame_and_attribution,
inputs=slider,
live=True,
outputs=[
gr.Image(label="๐ŸŽฎ Environment State", type="numpy"),
gr.Label(label="๐Ÿ“ˆ Feature Attributions", num_top_classes=8)
],
title="Real-time Attribution Analysis"
)
gr.Markdown("""
---
## ๐Ÿ› ๏ธ Local Usage & Installation
### Required Packages
```bash
    pip install torch captum gradio scipy numpy 'gymnasium[box2d]'
```
### Box2D Installation (macOS)
```bash
brew install swig
pip install box2d
```
    ## 🎯 Lunar Lander Environment Details
### Reward Structure
    - **Position**: reward increases as the lander moves closer to the landing pad and decreases as it drifts away
    - **Velocity**: reward increases as the lander slows down and decreases as it speeds up
    - **Angle**: reward decreases the more the lander tilts (horizontal is ideal)
    - **Landing**: +10 points for each leg in contact with the ground
    - **Fuel**: -0.03 points per frame for firing a side engine, -0.3 for the main engine
    - **Episode End**: -100 for crashing, +100 for landing safely
**Success Threshold**: 200+ points per episode
### Training Functions
- `load_trained()`: Loads pre-trained model (1000 episodes)
- `train()`: Trains from scratch
- Set `render_mode=False` for faster training
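    For local experimentation, a minimal sketch (assuming the same `TrainingLoop`
    API this Space imports from `train.py`):
    ```python
    from train import TrainingLoop

    loop = TrainingLoop(env_spec="LunarLander-v2")
    loop.create_agent()
    loop.load_trained()  # pre-trained checkpoint (1000 episodes)
    # option=0 selects the zero-tensor baseline (per the dropdown above)
    frames, attributions = loop.explain_trained(num_iterations=10, option=0)
    ```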
---
    *Built with ❤️ using Gradio, PyTorch, and Captum*
""")
if __name__ == "__main__":
demo.launch()