Create app.py

500985a verified 26 days ago

4.57 kB

	import gradio as gr
	import gymnasium as gym
	from gymnasium import spaces
	import numpy as np
	import matplotlib.pyplot as plt
	from stable_baselines3 import PPO

	# --- 1. DEFINIMOS EL ENTORNO (Igual que en Colab) ---
	class DataCenterEnv(gym.Env):
	    """Single-variable cooling environment driven by a random CPU heat load.

	    Observation: a one-element float32 array holding the current temperature
	    (kept inside [10, 100] by ``step``).
	    Actions: ``Discrete(5)``; action ``a`` removes ``2.5 * a`` from the
	    temperature and costs ``a ** 2`` energy units.

	    The heat added on every step is drawn uniformly between the module-level
	    ``USER_CPU_LOAD_MIN`` and ``USER_CPU_LOAD_MAX``, which are read at call
	    time so they can be changed between episodes.

	    All randomness goes through ``self.np_random`` so that
	    ``reset(seed=...)`` actually makes an episode reproducible.
	    """

	    def __init__(self):
	        super().__init__()
	        self.action_space = spaces.Discrete(5)
	        self.observation_space = spaces.Box(low=0, high=100, shape=(1,), dtype=np.float32)
	        self.state = 20.0
	        self.max_steps = 100
	        self.current_step = 0
	        # Per-episode history, read by the caller after the episode for plotting.
	        self.temps = []
	        self.energies = []

	    def _observation(self):
	        """Return the current state in the shape/dtype of ``observation_space``."""
	        return np.array([self.state], dtype=np.float32)

	    def reset(self, seed=None, options=None):
	        """Start a new episode and return ``(observation, info)``.

	        The initial temperature is 20 plus a random fraction in [0, 1).
	        ``options`` is accepted for API compatibility and is not used.
	        """
	        # Seeds self.np_random when a seed is supplied.
	        super().reset(seed=seed)
	        self.state = 20.0 + float(self.np_random.random())
	        self.current_step = 0
	        self.temps = [self.state]
	        self.energies = []
	        return self._observation(), {}

	    def step(self, action):
	        """Advance one step.

	        Returns ``(observation, reward, terminated, truncated, info)``.
	        ``terminated`` becomes True once ``max_steps`` steps have been taken;
	        ``truncated`` is always False and ``info`` is always empty.
	        """
	        # Policies may hand back NumPy scalars or 0-d/size-1 arrays; work with
	        # a plain int so the recorded energy values are plain numbers too.
	        action = int(np.asarray(action).item())

	        # Order the bounds so a reversed range still yields a valid draw.
	        low, high = sorted((USER_CPU_LOAD_MIN, USER_CPU_LOAD_MAX))
	        cpu_load = float(self.np_random.uniform(low, high))

	        cooling_effect = action * 2.5  # Industrial-grade cooling power
	        energy_cost = action ** 2

	        self.state = float(np.clip(self.state + cpu_load - cooling_effect, 10, 100))
	        self.current_step += 1

	        # +5 inside the 37..60 band, -2 outside it, an extra -50 above 80,
	        # minus a tenth of the energy spent on this step.
	        reward = 5 if 37 <= self.state <= 60 else -2
	        if self.state > 80:
	            reward -= 50
	        reward -= energy_cost * 0.1

	        terminated = self.current_step >= self.max_steps

	        self.temps.append(self.state)
	        self.energies.append(energy_cost)

	        return self._observation(), reward, terminated, False, {}

	# Module-level bounds of the simulated CPU heat load; overwritten from the
	# web UI before each run and read by the environment on every step.
	USER_CPU_LOAD_MIN, USER_CPU_LOAD_MAX = 1, 4

	# --- 2. FUNCIÓN DE SIMULACIÓN (Lo que hace la web) ---
	def run_simulation(load_min, load_max):
	    """Run one episode of ``DataCenterEnv`` and plot the outcome.

	    Args:
	        load_min: Lower bound of the simulated CPU load chosen in the UI.
	        load_max: Upper bound of the simulated CPU load chosen in the UI.

	    Returns:
	        ``(fig, msg)``: a Matplotlib figure with the temperature and energy
	        traces of the episode, and a status string saying whether the trained
	        agent was loaded or random actions were used instead.
	    """
	    # The environment reads these module-level bounds on every step.
	    # NOTE: they are shared by every caller of this function.
	    global USER_CPU_LOAD_MIN, USER_CPU_LOAD_MAX
	    # The two sliders are independent, so min may exceed max; put them in order.
	    USER_CPU_LOAD_MIN, USER_CPU_LOAD_MAX = sorted((load_min, load_max))

	    # 1. Create the environment and load the model
	    env = DataCenterEnv()

	    # Best effort: fall back to random actions so the demo keeps working, but
	    # only claim "not found" when the file is really missing.
	    try:
	        model = PPO.load("agente_aire_acondicionado.zip", env=env)
	        msg = "✅ Modelo Inteligente Cargado Correctamente."
	    except FileNotFoundError:
	        model = None
	        msg = "⚠️ ADVERTENCIA: No se encontró 'agente_aire_acondicionado.zip'. Usando acciones aleatorias."
	    except Exception as exc:
	        model = None
	        msg = (
	            "⚠️ ADVERTENCIA: No se pudo cargar 'agente_aire_acondicionado.zip' "
	            f"({type(exc).__name__}: {exc}). Usando acciones aleatorias."
	        )

	    # 2. Run the episode
	    obs, _ = env.reset()
	    done = False

	    while not done:
	        if model is not None:
	            action, _ = model.predict(obs)
	        else:
	            action = env.action_space.sample()  # Random fallback

	        obs, _reward, terminated, truncated, _info = env.step(action)
	        # Stop on either end-of-episode signal.
	        done = terminated or truncated

	    # 3. Build the charts
	    fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(12, 5))

	    # Temperature chart
	    ax1.plot(env.temps, color="red", label="Temperatura")
	    ax1.axhline(y=37, color='green', linestyle='--', label="Mínimo (37°C)")
	    ax1.axhline(y=60, color='green', linestyle='--', label="Máximo (60°C)")
	    ax1.set_title("Control de Temperatura")
	    ax1.set_ylabel("°C")
	    ax1.set_ylim(10, 90)
	    ax1.legend()
	    ax1.grid(True)

	    # Energy chart
	    ax2.plot(env.energies, color="blue", label="Energía")
	    ax2.set_title("Consumo de Energía")
	    ax2.set_ylabel("Watts")
	    ax2.grid(True)

	    # Lay out this figure explicitly instead of pyplot's "current" figure,
	    # which may belong to another request running at the same time.
	    fig.tight_layout()
	    # Unregister the figure from pyplot so repeated runs do not accumulate
	    # open figures; the Figure object itself stays usable for rendering.
	    plt.close(fig)
	    return fig, msg

	# --- 3. INTERFAZ GRÁFICA (Gradio) ---
	# Page layout: load sliders, run button and status box in the left column,
	# result plot in the right column.
	with gr.Blocks() as demo:
	    gr.Markdown("# ❄️ AI Cooling System Optimization Agent")
	    gr.Markdown("Este agente de Aprendizaje por Refuerzo (RL) controla el aire acondicionado de un servidor para ahorrar energía sin que se sobrecaliente.")

	    with gr.Row():
	        with gr.Column():
	            gr.Markdown("### Configuración de Carga")
	            s_min = gr.Slider(1, 10, value=1, label="Carga Mínima de CPU (Calor)")
	            s_max = gr.Slider(1, 10, value=4, label="Carga Máxima de CPU (Calor)")
	            btn = gr.Button("🚀 Ejecutar Simulación")
	            status = gr.Textbox(label="Estado del Agente")

	        with gr.Column():
	            plot = gr.Plot(label="Resultados en Tiempo Real")

	    # Each click runs one simulation and fills in the plot and the status box.
	    btn.click(fn=run_simulation, inputs=[s_min, s_max], outputs=[plot, status])

	# Launch the app only when executed as a script, so importing this module
	# (e.g. to reuse the environment or `demo`) does not start a web server.
	if __name__ == "__main__":
	    demo.launch()