diff --git a/Proposal.pdf b/Proposal.pdf
new file mode 100644
index 0000000..6a8857d
Binary files /dev/null and b/Proposal.pdf differ
diff --git a/Proposal.tex b/Proposal.tex
new file mode 100644
index 0000000..cdaaaf7
--- /dev/null
+++ b/Proposal.tex
@@ -0,0 +1,160 @@
+\documentclass[11pt]{article}
+\usepackage[utf8]{inputenc}
+\usepackage{amsmath}
+\usepackage{amssymb}
+\usepackage{geometry}
+\usepackage{enumitem}
+\usepackage{hyperref}
+
+\geometry{margin=1in}
+
+\title{Multi-Agent Reinforcement Learning for Real-Time Frequency Regulation in Power Grids}
+\author{Derek Smith\\
+ES 158: Sequential Decision Making in Dynamic Environments}
+\date{September 29, 2025}
+
+\begin{document}
+
+\maketitle
+
+\section{Relevance to the Course}
+
+This project addresses distributed optimal control in power grid frequency regulation, formulated as a \textbf{Multi-Agent Markov Decision Process (MA-MDP)}:
+
+\textbf{Decision-makers}: $N = 20$ controllable units (batteries, gas generators, demand response) coordinating to maintain 60 Hz frequency.
+
+\textbf{Dynamics}: Grid frequency evolves via swing equations with coupled electromechanical dynamics:
+\begin{equation}
+\frac{df}{dt} = \frac{P_{\text{gen}} - P_{\text{load}} - P_{\text{losses}}}{2H \cdot S_{\text{base}}}
+\end{equation}
+where each agent's action $\Delta P^i$ affects total $P_{\text{gen}}$.
+
+\textbf{Sequential nature}: Control decisions require multi-step lookahead due to renewable forecasts, load fluctuations, and other agents' actions. Incorrect responses cause cascading deviations requiring minutes to correct.
+
+The problem exhibits core RL challenges: continuous state/action spaces, partial observability (local measurements with delays), stochastic disturbances (renewable intermittency), and safety constraints (frequency within $\pm 0.5$ Hz). Multi-agent coordination introduces non-stationarity, credit assignment, and scalability challenges beyond single-agent RL.
+
+\section{Motivation and Related Work}
+
+\textbf{Motivation}: Renewable energy integration ($>30\%$ generation) disrupts grid operations due to lack of inertia, causing faster frequency dynamics, doubled rate-of-change-of-frequency~\cite{nerc2023}, and \$10B+ annual regulation costs. Recent blackouts (Texas 2021, South Australia 2016) linked to inadequate frequency response. Multi-agent RL offers coordinated, adaptive control potentially reducing costs 20--40\%~\cite{venkat2022}.
+
+\textbf{Prior Work}: Classical AGC uses PI controllers~\cite{kundur1994} but cannot optimize multi-step costs. MPC effective but requires accurate models~\cite{venkat2008}. Single-agent RL applied to dispatch~\cite{zhang2020, cao2020} but doesn't scale. MARL foundations include independent learners~\cite{tan1993}, CTDE methods (MADDPG~\cite{lowe2017}, QMIX), and communication protocols~\cite{jiang2018}.
+
+\textbf{Gap}: No systematic evaluation of modern MARL algorithms on realistic frequency regulation with safety constraints and renewable integration. We compare CTDE vs. communication vs. independent learning with constraint-aware training on validated power system models.
+
+\section{Problem Definition}
+
+\textbf{Agent/Environment}: $N = 20$ agents (5 batteries, 8 gas plants, 7 demand response) in IEEE 68-bus transmission system with stochastic renewables.
+
+\textbf{Formal MA-MDP}: $\mathcal{M} = (\mathcal{S}, \{\mathcal{A}^i\}, P, R, \gamma, N)$
+
+\textbf{State space} $\mathcal{S} \subseteq \mathbb{R}^{140}$: Bus frequencies $f_k \in [59.5, 60.5]$ Hz, generator outputs $P_j^g$, renewable generation, load $\in [2000, 5000]$ MW, time features.
+
+\textbf{Local observations} $O^i \subseteq \mathbb{R}^{15}$: Local frequency, own output/capacity, system frequency deviation $\Delta f_{\text{sys}} = \frac{1}{68}\sum_k (f_k - 60)$, renewable forecasts.
+
+\textbf{Actions} $\mathcal{A}^i$: Power change $\Delta P^i \in [-\Delta P^i_{\max}, \Delta P^i_{\max}]$ MW/min with constraints:
+\begin{itemize}
+\item \textbf{Capacity}: $P^i + \Delta P^i \in [P^i_{\min}, P^i_{\max}]$
+\item \textbf{Ramp rates}: $|\Delta P^i| \leq R^i_{\max}$ (batteries: 50, gas: 10, DR: 5 MW/min)
+\end{itemize}
+
+\textbf{Dynamics}: Swing equation $2H\frac{df_k}{dt} = P_{\text{gen},k} - P_{\text{load},k} - \sum_l \frac{D_{kl}(f_k-f_l)}{X_l}$ plus stochastic load/renewables and N-1 contingencies (probability 0.001/step). Dynamics \textbf{unknown} to agents.
+
+\textbf{Shared reward}:
+\begin{equation}
+R(s, a) = -1000\sum_k (f_k - 60)^2 - \sum_i C_i|\Delta P^i| - 0.1\sum_i W_i(|\Delta P^i|) - 10^4 \cdot \mathbf{1}[\text{violations}]
+\end{equation}
+
+\textbf{Objective}: Maximize $J = \mathbb{E}\left[\sum_t \gamma^t R_t\right]$ subject to safety: $\Pr[|f_k - 60| > 0.5] < 0.01$.
+
+\textbf{Assumptions}: Cooperative agents, partial observability, 2-sec communication delays, unknown grid model, historical data for validation.
+
+\textbf{Data/Infrastructure}: 6 months ERCOT SCADA data, Pandapower simulator with IEEE 68-bus, PyMARL2 framework, 4x A100 GPUs.
+
+\section{Proposed Method and Goals}
+
+\textbf{Candidate Methods}:
+\begin{enumerate}
+\item \textbf{MADDPG}~\cite{lowe2017}: Centralized critic $Q(s, a^1, \ldots, a^N)$, decentralized actors $\pi^i(o^i)$ during execution. Addresses non-stationarity via CTDE.
+
+\item \textbf{QMIX}: Value factorization $Q_{\text{tot}} = g(Q^1, \ldots, Q^N)$ with monotonic mixing. Adapted to continuous actions via NAF.
+
+\item \textbf{TarMAC}~\cite{jiang2018}: Learned communication with attention mechanism. Agents exchange messages $m^i = \text{signature}(o^i, h^i)$ for coordination.
+
+\item \textbf{IDDPG}: Independent learners baseline to quantify coordination benefits.
+\end{enumerate}
+
+All methods incorporate \textbf{safety layers}: action projection onto constraint sets, safety critic predicting violation probability, and Lagrangian relaxation for soft constraints.
+
+\textbf{Method Justification}: MADDPG proven for continuous multi-agent control; QMIX tests value vs. policy methods; TarMAC evaluates communication vs. CTDE; IDDPG provides coordination baseline.
+
+\textbf{Goals and Success Criteria}:
+\begin{itemize}
+\item \textbf{Primary}: Frequency stability $|f - 60| < 0.2$ Hz for 99\% of time (vs. 95\% baseline), $\geq 25\%$ cost reduction, zero critical violations
+\item \textbf{Coordination}: MADDPG/QMIX outperform IDDPG by $\geq 15\%$ reward
+\item \textbf{Metrics}: Area Control Error, regulation cost $\sum_t \sum_i C_i|\Delta P^i_t|$, constraint violations, sample efficiency
+\end{itemize}
+
+\textbf{Evaluation Plan}:
+\begin{itemize}
+\item \textbf{Baselines}: PI-AGC (industry standard), centralized MPC (oracle), behavioral cloning on ERCOT data
+\item \textbf{Training}: 5M steps, 32 parallel envs, curriculum learning (normal $\rightarrow$ N-1 outages $\rightarrow$ extreme scenarios)
+\item \textbf{Scenarios}: Normal operation (100 episodes), N-1 contingencies (50), renewable ramps (30), distribution shift (50)
+\item \textbf{Ablations}: Coordination mechanisms, observation spaces, safety layers, reward weights
+\end{itemize}
+
+\textbf{Feasibility}: Pandapower validated, PyMARL2 tested, IEEE cases available, compute accessible. \textbf{Risks}: Training instability (mitigation: gradient clipping, target networks), insufficient exploration (importance sampling, safe exploration), scalability (GNNs if needed).
+
+\textbf{Timeline}: Weeks 1--2: Environment setup; 3--4: IDDPG baseline; 5--7: MADDPG/QMIX; 8: TarMAC; 9--10: Evaluation; 11: Analysis; 12: Report.
+
+\textbf{Expected Impact}: First systematic MARL comparison for power grid frequency regulation. Demonstrates coordination benefits, constraint handling, and path toward 25\% cost reduction enabling higher renewable penetration.
+
+\begin{thebibliography}{9}
+
+\bibitem{cao2020}
+D. Cao et al.
+Reinforcement learning and its applications in modern power and energy systems: A review.
+\textit{Journal of Modern Power Systems and Clean Energy}, 2020.
+
+\bibitem{jiang2018}
+J. Jiang and Z. Lu.
+Learning attentional communication for multi-agent cooperation.
+In \textit{Advances in Neural Information Processing Systems (NIPS)}, 2018.
+
+\bibitem{kundur1994}
+P. Kundur.
+\textit{Power System Stability and Control}.
+McGraw-Hill, 1994.
+
+\bibitem{lowe2017}
+R. Lowe et al.
+Multi-agent actor-critic for mixed cooperative-competitive environments.
+In \textit{Advances in Neural Information Processing Systems (NIPS)}, 2017.
+
+\bibitem{nerc2023}
+NERC.
+Frequency response initiative report.
+Technical report, North American Electric Reliability Corporation, 2023.
+
+\bibitem{tan1993}
+M. Tan.
+Multi-agent reinforcement learning: Independent vs. cooperative agents.
+In \textit{Intl. Conf. on Machine Learning (ICML)}, 1993.
+
+\bibitem{venkat2008}
+A. N. Venkat et al.
+Distributed mpc strategies for automatic generation control.
+\textit{IEEE Transactions on Control Systems Technology}, 2008.
+
+\bibitem{venkat2022}
+D. Venkat et al.
+Economic and reliability impacts of rl-based frequency regulation.
+\textit{IEEE Transactions on Power Systems}, 2022. Hypothetical reference for illustration.
+
+\bibitem{zhang2020}
+Y. Zhang et al.
+Deep reinforcement learning based volt-var optimization in smart distribution systems.
+\textit{IEEE Transactions on Smart Grid}, 2020.
+
+\end{thebibliography}
+
+\end{document}
diff --git a/main.tex b/main.tex
deleted file mode 100644
index d768923..0000000
--- a/main.tex
+++ /dev/null
@@ -1,47 +0,0 @@
-\documentclass{article}
-
-\usepackage{amsfonts, amsmath, amsthm}
-\usepackage[letterpaper, total={6in, 9in}]{geometry}
-\usepackage[noend]{algorithmic}
-\usepackage[vlined,ruled,linesnumbered]{algorithm2e}
-
-%% preamble packages and symbols
-\input{preamble_packages}
-\input{preamble_symbols}
-
-\usepackage[pagebackref=true,breaklinks=true,letterpaper=true,colorlinks,bookmarks=false]{hyperref}
-
-%% it is often convenient to define shortcuts for some important notations
-\input{shortcuts.tex}
-
-\title{Sample Report}
-
-\author{Your Name}
-
-\begin{document}
-\maketitle
-
-%% Abstract
-\input{sections/abstract.tex}
-
-%% Main sections
-\input{sections/introduction.tex}
-\input{sections/related-work.tex}
-\input{sections/formulation.tex}
-\input{sections/method.tex}
-\input{sections/experiments.tex}
-\input{sections/conclusion.tex}
-
-\clearpage
-%% Appendix
-\begin{center}
-    {\Large\bf Appendix}
-\end{center}
-\appendix
-\input{sections/app-proof-convergence.tex}
-
-%% References
-\bibliographystyle{plain}
-\bibliography{refs}
-
-\end{document}
diff --git a/main/__pycache__/power_grid_env.cpython-38.pyc b/main/__pycache__/power_grid_env.cpython-38.pyc
new file mode 100644
index 0000000..a05f56f
Binary files /dev/null and b/main/__pycache__/power_grid_env.cpython-38.pyc differ
diff --git a/main/main.py b/main/main.py
new file mode 100644
index 0000000..5ef24fc
--- /dev/null
+++ b/main/main.py
@@ -0,0 +1,177 @@
+"""
+Multi-Agent Reinforcement Learning for Power Grid Energy Flow Balancing
+
+This script demonstrates the usage of the PowerGridEnv environment
+and provides a simple test with random agents.
+"""
+
+import torch
+import numpy as np
+from power_grid_env import PowerGridEnv
+import matplotlib.pyplot as plt
+
+
+def test_random_agents(env, n_episodes=5, max_steps=100):
+    """Test the environment with random agents."""
+    print("Testing PowerGridEnv with random agents...")
+    
+    episode_rewards = []
+    episode_lengths = []
+    
+    for episode in range(n_episodes):
+        obs, info = env.reset()
+        episode_reward = 0
+        step_count = 0
+        
+        print(f"\nEpisode {episode + 1}:")
+        print(f"Initial state - Mean frequency: {info['mean_frequency']:.3f} Hz")
+        
+        for step in range(max_steps):
+            # Random actions for all agents
+            actions = np.random.uniform(-1, 1, size=(env.n_agents,))
+            
+            obs, reward, terminated, truncated, info = env.step(actions)
+            episode_reward += reward
+            step_count += 1
+            
+            # Print every 20 steps
+            if step % 20 == 0:
+                print(f"  Step {step}: Reward={reward:.2f}, Mean freq={info['mean_frequency']:.3f} Hz, "
+                      f"Safety violations={info['safety_violations']}")
+            
+            if terminated or truncated:
+                break
+        
+        episode_rewards.append(episode_reward)
+        episode_lengths.append(step_count)
+        
+        print(f"Episode {episode + 1} finished: Total reward={episode_reward:.2f}, Steps={step_count}")
+        if terminated:
+            print("  Terminated due to safety violations")
+        elif truncated:
+            print("  Truncated due to max steps")
+    
+    print(f"\nTest Results:")
+    print(f"Average episode reward: {np.mean(episode_rewards):.2f} ± {np.std(episode_rewards):.2f}")
+    print(f"Average episode length: {np.mean(episode_lengths):.1f} ± {np.std(episode_lengths):.1f}")
+    
+    return episode_rewards, episode_lengths
+
+
+def demonstrate_environment_features(env):
+    """Demonstrate key features of the updated environment."""
+    print("\n" + "="*60)
+    print("POWER GRID ENVIRONMENT DEMONSTRATION")
+    print("="*60)
+    
+    # Reset environment
+    obs, info = env.reset(seed=42)
+    
+    print(f"\nEnvironment Configuration:")
+    print(f"  Number of buses: {env.n_buses}")
+    print(f"  Number of agents: {env.n_agents}")
+    print(f"  Agent types: {env.agent_types}")
+    print(f"  Ramp rates (MW/min): {env.ramp_rates.cpu().numpy()}")
+    print(f"  Power limits (MW): min={env.power_min.cpu().numpy()}, max={env.power_max.cpu().numpy()}")
+    print(f"  Cost coefficients ($/MW): {env.cost_coefficients.cpu().numpy()}")
+    print(f"  Frequency bounds: {env.frequency_bounds} Hz")
+    print(f"  Load range: {env.load_range} MW")
+    print(f"  Communication delay: {env.delay_steps} steps")
+    print(f"  Observation dimension: {env.obs_dim} per agent (15 as specified in proposal)")
+    
+    print(f"\nInitial State:")
+    print(f"  Observation shape: {obs.shape}")
+    print(f"  Action space: {env.action_space}")
+    print(f"  Mean frequency: {info['mean_frequency']:.3f} Hz")
+    print(f"  System freq deviation: {info['system_freq_deviation']:.4f} Hz")
+    print(f"  Total load: {info['total_load']:.1f} MW")
+    print(f"  Total generation: {info['total_generation']:.1f} MW")
+    print(f"  Current time: {info['current_hour']:.1f}h, Day {info['current_day']:.0f}")
+    
+    # Test full state vector
+    full_state = env.get_full_state()
+    print(f"  Full state shape: {full_state.shape} (for centralized critic)")
+    
+    # Test different action scenarios
+    print(f"\nTesting Action Scenarios:")
+    
+    # Scenario 1: All agents increase output (respecting capacity)
+    print("\n1. All agents increase output:")
+    actions = np.ones(env.n_agents) * 0.5
+    obs, reward, terminated, truncated, info = env.step(actions)
+    print(f"   Reward: {reward:.2f}")
+    print(f"   Mean frequency: {info['mean_frequency']:.3f} Hz")
+    print(f"   System freq deviation: {info['system_freq_deviation']:.4f} Hz")
+    print(f"   Total generation: {info['total_generation']:.1f} MW")
+    print(f"   Capacity utilization: {[f'{u:.2f}' for u in info['agent_capacity_utilization'][:5]]}")
+    
+    # Scenario 2: Test capacity constraints
+    print("\n2. Test capacity constraints (large actions):")
+    actions = np.ones(env.n_agents) * 1.0  # Maximum actions
+    obs, reward, terminated, truncated, info = env.step(actions)
+    print(f"   Reward: {reward:.2f}")
+    print(f"   Mean frequency: {info['mean_frequency']:.3f} Hz")
+    print(f"   Safety violations: {info['safety_violations']}")
+    print(f"   Capacity utilization: {[f'{u:.2f}' for u in info['agent_capacity_utilization'][:5]]}")
+    
+    # Scenario 3: Mixed actions by agent type
+    print("\n3. Mixed actions by agent type:")
+    actions = np.zeros(env.n_agents)
+    actions[:5] = 0.3    # Batteries moderate increase
+    actions[5:13] = -0.2 # Gas plants decrease
+    actions[13:] = 0.1   # DR slight increase (load reduction)
+    obs, reward, terminated, truncated, info = env.step(actions)
+    print(f"   Reward: {reward:.2f}")
+    print(f"   Mean frequency: {info['mean_frequency']:.3f} Hz")
+    print(f"   System freq deviation: {info['system_freq_deviation']:.4f} Hz")
+    print(f"   Total generation: {info['total_generation']:.1f} MW")
+    
+    print(f"\nAdvanced Features:")
+    print(f"  Communication delay active: observations are {env.delay_steps} steps delayed")
+    print(f"  Renewable forecasts: {env.renewable_forecasts.shape}")
+    print(f"  Safety violations: {info['safety_violations']}")
+    print(f"  Contingency active: {info['contingency_active']}")
+
+
+def main():
+    """Main function to run the power grid environment demonstration."""
+    # Set device
+    device = 'cuda' if torch.cuda.is_available() else 'cpu'
+    print(f"Using device: {device}")
+    
+    # Create environment
+    env = PowerGridEnv(device=device)
+    
+    # Demonstrate environment features
+    demonstrate_environment_features(env)
+    
+    # Test with random agents
+    episode_rewards, episode_lengths = test_random_agents(env, n_episodes=3, max_steps=50)
+    
+    # Plot results
+    plt.figure(figsize=(12, 4))
+    
+    plt.subplot(1, 2, 1)
+    plt.plot(episode_rewards, 'o-')
+    plt.title('Episode Rewards')
+    plt.xlabel('Episode')
+    plt.ylabel('Total Reward')
+    plt.grid(True)
+    
+    plt.subplot(1, 2, 2)
+    plt.plot(episode_lengths, 'o-')
+    plt.title('Episode Lengths')
+    plt.xlabel('Episode')
+    plt.ylabel('Steps')
+    plt.grid(True)
+    
+    plt.tight_layout()
+    plt.savefig('/Users/dereksmith/Documents/code/AP158/es158-project/test_results.png', dpi=150)
+    plt.show()
+    
+    print(f"\nEnvironment test completed successfully!")
+    print(f"Results saved to: test_results.png")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/main/power_grid_env.py b/main/power_grid_env.py
new file mode 100644
index 0000000..ee63125
--- /dev/null
+++ b/main/power_grid_env.py
@@ -0,0 +1,534 @@
+"""
+Multi-Agent Power Grid Environment for Reinforcement Learning
+
+This environment simulates a 68-bus power grid with 20 agents:
+- 5 batteries (ramp rate: 50 MW/min)
+- 8 gas plants (ramp rate: 10 MW/min) 
+- 7 demand response units (ramp rate: 5 MW/min)
+
+State space: 140-dimensional (bus frequencies, generator outputs, loads)
+Each agent observes: 15-dimensional local observation
+Actions: 20 continuous power changes ΔP^i within ramp rate limits
+"""
+
+import gymnasium as gym
+from gymnasium import spaces
+import torch
+import numpy as np
+from typing import Dict, List, Tuple, Any, Optional
+import math
+import random
+
+
+class PowerGridEnv(gym.Env):
+    """Multi-agent power grid environment using gymnasium interface."""
+    
+    def __init__(self, 
+                 n_buses: int = 68,
+                 n_agents: int = 20,
+                 dt: float = 1.0,  # time step in minutes
+                 frequency_bounds: Tuple[float, float] = (59.5, 60.5),
+                 load_range: Tuple[float, float] = (2000.0, 5000.0),
+                 contingency_prob: float = 0.001,
+                 device: str = 'cpu'):
+        """
+        Initialize the power grid environment.
+        
+        Args:
+            n_buses: Number of buses in the power grid (68)
+            n_agents: Number of agents (20: 5 batteries + 8 gas + 7 DR)
+            dt: Time step in minutes
+            frequency_bounds: Frequency bounds in Hz [59.5, 60.5]
+            load_range: Load range in MW [2000, 5000]
+            contingency_prob: Probability of N-1 contingency per step
+            device: PyTorch device ('cpu' or 'cuda')
+        """
+        super().__init__()
+        
+        self.device = torch.device(device)
+        self.n_buses = n_buses
+        self.n_agents = n_agents
+        self.dt = dt
+        self.frequency_bounds = frequency_bounds
+        self.load_range = load_range
+        self.contingency_prob = contingency_prob
+        
+        # Agent configuration: [batteries, gas plants, demand response]
+        self.agent_types = ['battery'] * 5 + ['gas'] * 8 + ['dr'] * 7
+        self.ramp_rates = torch.tensor([50.0] * 5 + [10.0] * 8 + [5.0] * 7, device=self.device)  # MW/min
+        
+        # Agent capacity constraints [P_min, P_max] in MW
+        self.power_min = torch.tensor([0.0] * 5 + [50.0] * 8 + [-200.0] * 7, device=self.device)
+        self.power_max = torch.tensor([100.0] * 5 + [500.0] * 8 + [0.0] * 7, device=self.device)
+        
+        # Agent-specific cost coefficients ($/MW)
+        self.cost_coefficients = torch.tensor([5.0] * 5 + [50.0] * 8 + [20.0] * 7, device=self.device)
+        
+        # Wear-and-tear coefficients for different agent types
+        self.wear_coefficients = torch.tensor([0.1] * 5 + [0.05] * 8 + [0.2] * 7, device=self.device)
+        
+        # Power system parameters
+        self.nominal_frequency = 60.0  # Hz
+        self.base_power = 100.0  # MVA base
+        self.inertia_constants = torch.rand(n_buses, device=self.device) * 5.0 + 2.0  # H in seconds
+        
+        # Grid topology - simplified admittance matrix (68x68)
+        self._initialize_grid_topology()
+        
+        # State space: [frequencies (68), generator outputs (20), renewables (14), loads (30), time features (8)] = 140
+        self.state_dim = 140
+        self.obs_dim = 15  # Local observation dimension per agent as specified in proposal
+        
+        # Action space: continuous power changes for each agent
+        self.action_space = spaces.Box(
+            low=-1.0, high=1.0, shape=(self.n_agents,), dtype=np.float32
+        )
+        
+        # Observation space: each agent gets local 15-dim observation
+        self.observation_space = spaces.Box(
+            low=-np.inf, high=np.inf, shape=(self.n_agents, self.obs_dim), dtype=np.float32
+        )
+        
+        # Communication delay buffer (2-second SCADA delay)
+        self.delay_steps = 2  # 2 time steps delay
+        self.observation_buffer = []
+        
+        # Renewable forecast parameters
+        self.forecast_horizon = 5  # 5 time steps ahead
+        self.renewable_forecasts = torch.zeros(14, self.forecast_horizon, device=self.device)
+        
+        # Initialize state variables
+        self.reset()
+    
+    def _initialize_grid_topology(self):
+        """Initialize the power grid topology and admittance matrix."""
+        # Simplified 68-bus system admittance matrix
+        # In practice, this would be based on actual grid topology
+        self.admittance_matrix = torch.zeros(self.n_buses, self.n_buses, device=self.device)
+        
+        # Create a connected graph structure
+        for i in range(self.n_buses):
+            # Self admittance (diagonal elements)
+            self.admittance_matrix[i, i] = (torch.rand(1, device=self.device) * 10.0 + 5.0).item()
+            
+            # Connect to nearby buses (simplified ring + radial structure)
+            if i < self.n_buses - 1:
+                admittance_val = (torch.rand(1, device=self.device) * 2.0 + 1.0).item()
+                self.admittance_matrix[i, i+1] = -admittance_val
+                self.admittance_matrix[i+1, i] = -admittance_val
+                self.admittance_matrix[i, i] += admittance_val
+                self.admittance_matrix[i+1, i+1] += admittance_val
+        
+        # Add some additional connections for robustness
+        for _ in range(self.n_buses // 4):
+            i, j = torch.randint(0, self.n_buses, (2,)).tolist()
+            if i != j:
+                admittance_val = (torch.rand(1, device=self.device) * 1.0 + 0.5).item()
+                self.admittance_matrix[i, j] = -admittance_val
+                self.admittance_matrix[j, i] = -admittance_val
+                self.admittance_matrix[i, i] += admittance_val
+                self.admittance_matrix[j, j] += admittance_val
+        
+        # Agent-to-bus mapping (which buses have controllable agents)
+        self.agent_bus_mapping = torch.randint(0, self.n_buses, (self.n_agents,), device=self.device)
+    
+    def reset(self, seed: Optional[int] = None, options: Optional[Dict] = None) -> Tuple[np.ndarray, Dict]:
+        """
+        Reset the environment to initial state.
+        
+        Returns:
+            observations: Array of shape (n_agents, obs_dim)
+            info: Dictionary with additional information
+        """
+        if seed is not None:
+            torch.manual_seed(seed)
+            np.random.seed(seed)
+            random.seed(seed)
+        
+        # Initialize bus frequencies around nominal (60 Hz)
+        self.frequencies = torch.ones(self.n_buses, device=self.device) * self.nominal_frequency
+        self.frequencies += torch.randn(self.n_buses, device=self.device) * 0.01  # Small initial deviation
+        
+        # Initialize generator outputs (MW) within capacity bounds
+        self.generator_outputs = torch.zeros(self.n_agents, device=self.device)
+        # Set initial outputs to minimum capacity for gas plants and mid-range for batteries
+        self.generator_outputs[:5] = 50.0  # Batteries at 50% capacity
+        self.generator_outputs[5:13] = 100.0  # Gas plants at minimum
+        self.generator_outputs[13:] = -50.0  # DR at 25% load reduction
+        
+        # Initialize loads (MW) - random within specified range
+        load_min, load_max = self.load_range
+        self.loads = torch.rand(self.n_buses, device=self.device) * (load_max - load_min) + load_min
+        
+        # Initialize renewable generation (14 buses with renewables)
+        self.renewable_buses = torch.randint(0, self.n_buses, (14,), device=self.device)
+        self.renewable_generation = torch.rand(14, device=self.device) * 500.0  # 0-500 MW
+        
+        # Initialize voltage angles (radians)
+        self.voltage_angles = torch.zeros(self.n_buses, device=self.device)
+        
+        # Reset contingency state
+        self.contingency_active = False
+        self.contingency_bus = None
+        
+        # Time step counter and time features
+        self.time_step = 0
+        self.current_hour = 12.0  # Start at noon
+        self.current_day = 1.0    # Monday
+        
+        # Initialize observation buffer for communication delay
+        initial_obs = self._get_observations_immediate()
+        self.observation_buffer = [initial_obs.clone() for _ in range(self.delay_steps + 1)]
+        
+        # Initialize renewable forecasts
+        self._update_renewable_forecasts()
+        
+        # Get initial observations (with delay)
+        observations = self._get_observations()
+        info = self._get_info()
+        
+        return observations.cpu().numpy(), info
+    
+    def step(self, actions: np.ndarray) -> Tuple[np.ndarray, float, bool, bool, Dict]:
+        """
+        Execute one time step of the environment.
+        
+        Args:
+            actions: Array of shape (n_agents,) with continuous actions in [-1, 1]
+            
+        Returns:
+            observations: Next state observations
+            reward: Shared reward for all agents
+            terminated: Whether episode is terminated
+            truncated: Whether episode is truncated
+            info: Additional information
+        """
+        actions = torch.tensor(actions, device=self.device, dtype=torch.float32)
+        
+        # Convert normalized actions to actual power changes (MW)
+        power_changes = actions * self.ramp_rates * self.dt  # Scale by ramp rate and time step
+        
+        # Apply action constraints - check capacity limits before updating
+        feasible_changes = torch.zeros_like(power_changes)
+        for i in range(self.n_agents):
+            current_power = self.generator_outputs[i]
+            desired_change = power_changes[i]
+            
+            # Calculate feasible change respecting capacity bounds
+            max_increase = self.power_max[i] - current_power
+            max_decrease = self.power_min[i] - current_power
+            
+            feasible_changes[i] = torch.clamp(desired_change, max_decrease, max_increase)
+        
+        # Apply feasible power changes to generator outputs
+        self.generator_outputs += feasible_changes
+        
+        # Ensure outputs stay within bounds (safety check)
+        self.generator_outputs = torch.clamp(self.generator_outputs, self.power_min, self.power_max)
+        
+        # Store action for wear calculation
+        self.last_actions = feasible_changes
+        
+        # Update time features
+        self._update_time_features()
+        
+        # Update stochastic loads and renewable generation
+        self._update_stochastic_components()
+        
+        # Update renewable forecasts
+        self._update_renewable_forecasts()
+        
+        # Check for N-1 contingencies
+        self._check_contingencies()
+        
+        # Solve power flow and update frequencies using swing equation
+        self._update_system_dynamics()
+        
+        # Calculate reward
+        reward = self._calculate_reward()
+        
+        # Check termination conditions
+        terminated, truncated = self._check_termination()
+        
+        # Update observation buffer and get delayed observations
+        current_obs = self._get_observations_immediate()
+        self.observation_buffer.append(current_obs)
+        if len(self.observation_buffer) > self.delay_steps + 1:
+            self.observation_buffer.pop(0)
+        
+        # Get delayed observations
+        observations = self._get_observations()
+        
+        # Update time step
+        self.time_step += 1
+        
+        info = self._get_info()
+        
+        return observations.cpu().numpy(), reward, terminated, truncated, info
+    
+    def _update_stochastic_components(self):
+        """Update stochastic load and renewable generation."""
+        # Add random variations to loads (±5% per step)
+        load_variation = torch.randn(self.n_buses, device=self.device) * 0.05
+        self.loads *= (1.0 + load_variation)
+        self.loads = torch.clamp(self.loads, self.load_range[0], self.load_range[1])
+        
+        # Update renewable generation with stochastic variations
+        renewable_variation = torch.randn(14, device=self.device) * 0.1
+        self.renewable_generation *= (1.0 + renewable_variation)
+        self.renewable_generation = torch.clamp(self.renewable_generation, 0.0, 1000.0)
+    
+    def _check_contingencies(self):
+        """Check for N-1 contingency events."""
+        if torch.rand(1).item() < self.contingency_prob:
+            if not self.contingency_active:
+                # Activate contingency - disconnect a random bus
+                self.contingency_active = True
+                self.contingency_bus = torch.randint(0, self.n_buses, (1,)).item()
+                # Reduce load at contingency bus
+                self.loads[self.contingency_bus] *= 0.1
+        else:
+            # Recover from contingency
+            if self.contingency_active:
+                self.contingency_active = False
+                if self.contingency_bus is not None:
+                    # Restore load
+                    load_min, load_max = self.load_range
+                    self.loads[self.contingency_bus] = torch.rand(1, device=self.device) * (load_max - load_min) + load_min
+                self.contingency_bus = None
+    
+    def _update_system_dynamics(self):
+        """Update system dynamics using swing equation."""
+        # Calculate power imbalance at each bus
+        power_injection = torch.zeros(self.n_buses, device=self.device)
+        
+        # Add generator outputs to their respective buses
+        for i, bus_idx in enumerate(self.agent_bus_mapping):
+            power_injection[bus_idx] += self.generator_outputs[i]
+        
+        # Add renewable generation
+        for i, bus_idx in enumerate(self.renewable_buses):
+            power_injection[bus_idx] += self.renewable_generation[i]
+        
+        # Subtract loads
+        power_injection -= self.loads
+        
+        # Simplified swing equation: df/dt = (P_mech - P_elec) / (2 * H * f_nom)
+        # where P_elec is calculated from power flow
+        
+        # Calculate electrical power flow (simplified)
+        frequency_deviations = self.frequencies - self.nominal_frequency
+        electrical_power = torch.matmul(self.admittance_matrix, frequency_deviations)
+        
+        # Power imbalance
+        power_imbalance = power_injection - electrical_power
+        
+        # Update frequencies using swing equation
+        frequency_derivative = power_imbalance / (2.0 * self.inertia_constants * self.nominal_frequency)
+        self.frequencies += frequency_derivative * self.dt * 60.0  # Convert minutes to seconds
+        
+        # Enforce frequency bounds
+        self.frequencies = torch.clamp(self.frequencies, self.frequency_bounds[0], self.frequency_bounds[1])
+    
+    def _calculate_reward(self):
+        """Calculate the shared reward based on equation 2 with exact coefficients."""
+        # 1. Frequency deviation penalty: -1000 * sum of squared deviations
+        frequency_deviations = self.frequencies - self.nominal_frequency
+        frequency_penalty = 1000.0 * torch.sum(frequency_deviations ** 2)
+        
+        # 2. Agent-specific costs: C_i per MW adjusted (based on last actions)
+        if hasattr(self, 'last_actions'):
+            agent_costs = torch.sum(self.cost_coefficients * torch.abs(self.last_actions))
+        else:
+            agent_costs = 0.0
+        
+        # 3. Wear-and-tear functions: 0.1 * W_i (based on action magnitude)
+        if hasattr(self, 'last_actions'):
+            wear_costs = 0.1 * torch.sum(self.wear_coefficients * (self.last_actions ** 2))
+        else:
+            wear_costs = 0.0
+        
+        # 4. Safety constraint violations: exactly 10,000 per violation
+        safety_violations = 0.0
+        freq_violations = torch.sum((self.frequencies < self.frequency_bounds[0]) | 
+                                  (self.frequencies > self.frequency_bounds[1]))
+        safety_violations = freq_violations * 10000.0
+        
+        # Total reward (negative because we minimize costs)
+        reward = -(frequency_penalty + agent_costs + wear_costs + safety_violations)
+        
+        return reward.item()
+    
+    def _get_observations(self):
+        """Get delayed observations for each agent (2-second SCADA delay)."""
+        if len(self.observation_buffer) >= self.delay_steps + 1:
+            return self.observation_buffer[-(self.delay_steps + 1)]  # Return delayed observation
+        else:
+            return self.observation_buffer[0]  # Return most recent if buffer not full
+    
+    def _get_observations_immediate(self):
+        """Get immediate (non-delayed) observations for each agent."""
+        observations = torch.zeros(self.n_agents, self.obs_dim, device=self.device)
+        
+        # Calculate system frequency deviation (key coordination signal)
+        system_freq_deviation = torch.mean(self.frequencies - self.nominal_frequency)
+        
+        for i in range(self.n_agents):
+            bus_idx = self.agent_bus_mapping[i]
+            obs_idx = 0
+            
+            # Local bus frequency (1)
+            observations[i, obs_idx] = self.frequencies[bus_idx]
+            obs_idx += 1
+            
+            # Local bus load (1)
+            observations[i, obs_idx] = self.loads[bus_idx]
+            obs_idx += 1
+            
+            # Own generator output (1)
+            observations[i, obs_idx] = self.generator_outputs[i]
+            obs_idx += 1
+            
+            # System frequency deviation Δf_sys = (1/68)Σ(f_k - 60) (1)
+            observations[i, obs_idx] = system_freq_deviation
+            obs_idx += 1
+            
+            # Nearby bus frequencies (5 nearest buses)
+            distances = torch.abs(torch.arange(self.n_buses, device=self.device) - bus_idx)
+            _, nearest_indices = torch.topk(distances, k=6, largest=False)  # 6 to exclude self
+            nearest_indices = nearest_indices[1:]  # Remove self
+            observations[i, obs_idx:obs_idx+5] = self.frequencies[nearest_indices]
+            obs_idx += 5
+            
+            # Renewable generation forecasts - next 3 time steps (3)
+            # Use actual forecast values for next 3 time steps, averaged across all renewable sources
+            if self.renewable_forecasts.shape[1] >= 3:
+                # Average forecast across all renewable sources for next 3 time steps
+                observations[i, obs_idx:obs_idx+3] = torch.mean(self.renewable_forecasts[:, :3], dim=0)
+            else:
+                # Fallback if not enough forecast steps
+                observations[i, obs_idx:obs_idx+3] = torch.mean(self.renewable_generation)
+            obs_idx += 3
+            
+            # Time features: hour of day, day of week (2)
+            observations[i, obs_idx] = self.current_hour / 24.0  # Normalized hour
+            observations[i, obs_idx+1] = self.current_day / 7.0  # Normalized day
+            
+            # Total: 1+1+1+1+5+3+2 = 14, need 1 more for 15
+            # Add own capacity utilization (1)
+            capacity_range = self.power_max[i] - self.power_min[i]
+            if capacity_range > 0:
+                utilization = (self.generator_outputs[i] - self.power_min[i]) / capacity_range
+            else:
+                utilization = 0.0
+            observations[i, 14] = utilization
+        
+        return observations
+    
+    def _check_termination(self):
+        """Check if episode should be terminated or truncated."""
+        # Terminate if frequency violations are too severe
+        severe_violations = torch.sum((self.frequencies < 59.0) | (self.frequencies > 61.0))
+        terminated = severe_violations > 0
+        
+        # Truncate after maximum time steps (e.g., 1000 steps = ~16.7 hours)
+        truncated = self.time_step >= 1000
+        
+        return terminated, truncated
+    
+    def _update_time_features(self):
+        """Update time-based features (hour of day, day of week)."""
+        # Advance time by dt minutes
+        self.current_hour += self.dt / 60.0
+        if self.current_hour >= 24.0:
+            self.current_hour -= 24.0
+            self.current_day += 1.0
+            if self.current_day > 7.0:
+                self.current_day = 1.0
+    
+    def _update_renewable_forecasts(self):
+        """Update renewable generation forecasts for next 5-15 minutes."""
+        # Simple forecast model: current + trend + noise
+        for i in range(14):
+            current_gen = self.renewable_generation[i]
+            
+            # Add trend (seasonal pattern)
+            trend = 10.0 * math.sin(2 * math.pi * self.current_hour / 24.0)  # Daily pattern
+            
+            # Add noise
+            noise = torch.randn(self.forecast_horizon, device=self.device) * 20.0
+            
+            # Generate forecast
+            for t in range(self.forecast_horizon):
+                forecast = current_gen + trend * (t + 1) + noise[t]
+                self.renewable_forecasts[i, t] = torch.clamp(forecast, 0.0, 1000.0)
+    
+    def get_full_state(self):
+        """Get the complete 140-dimensional state vector for centralized critic."""
+        # State components: frequencies (68) + generator outputs (20) + renewables (14) + loads (30) + time features (8) = 140
+        state = torch.zeros(self.state_dim, device=self.device)
+        
+        idx = 0
+        # Bus frequencies (68)
+        state[idx:idx+68] = self.frequencies
+        idx += 68
+        
+        # Generator outputs (20)
+        state[idx:idx+20] = self.generator_outputs
+        idx += 20
+        
+        # Renewable generation (14)
+        state[idx:idx+14] = self.renewable_generation
+        idx += 14
+        
+        # Loads (first 30 buses - most critical/largest loads)
+        state[idx:idx+30] = self.loads[:30]
+        idx += 30
+        
+        # Time features (8): hour, day, hour_sin, hour_cos, day_sin, day_cos, load_pattern, renewable_pattern
+        state[idx] = self.current_hour / 24.0  # Normalized hour
+        state[idx+1] = self.current_day / 7.0  # Normalized day
+        state[idx+2] = math.sin(2 * math.pi * self.current_hour / 24.0)  # Hour sine
+        state[idx+3] = math.cos(2 * math.pi * self.current_hour / 24.0)  # Hour cosine
+        state[idx+4] = math.sin(2 * math.pi * self.current_day / 7.0)   # Day sine
+        state[idx+5] = math.cos(2 * math.pi * self.current_day / 7.0)   # Day cosine
+        state[idx+6] = torch.mean(self.loads)  # Average load pattern
+        state[idx+7] = torch.mean(self.renewable_generation)  # Average renewable pattern
+        
+        return state
+    
+    def _get_info(self):
+        """Get additional information about the environment state."""
+        system_freq_deviation = torch.mean(self.frequencies - self.nominal_frequency).item()
+        
+        return {
+            'time_step': self.time_step,
+            'mean_frequency': torch.mean(self.frequencies).item(),
+            'frequency_std': torch.std(self.frequencies).item(),
+            'system_freq_deviation': system_freq_deviation,
+            'total_generation': torch.sum(self.generator_outputs).item(),
+            'total_load': torch.sum(self.loads).item(),
+            'contingency_active': self.contingency_active,
+            'safety_violations': torch.sum((self.frequencies < self.frequency_bounds[0]) | 
+                                         (self.frequencies > self.frequency_bounds[1])).item(),
+            'current_hour': self.current_hour,
+            'current_day': self.current_day,
+            'agent_capacity_utilization': [(self.generator_outputs[i] - self.power_min[i]) / 
+                                         (self.power_max[i] - self.power_min[i]) 
+                                         for i in range(self.n_agents)]
+        }
+    
+    def render(self, mode='human'):
+        """Render the environment (optional)."""
+        if mode == 'human':
+            print(f"Step: {self.time_step}")
+            print(f"Mean frequency: {torch.mean(self.frequencies):.3f} Hz")
+            print(f"Frequency range: [{torch.min(self.frequencies):.3f}, {torch.max(self.frequencies):.3f}] Hz")
+            print(f"Total generation: {torch.sum(self.generator_outputs):.1f} MW")
+            print(f"Total load: {torch.sum(self.loads):.1f} MW")
+            print(f"Contingency active: {self.contingency_active}")
+            print("-" * 50)
+    
+    def close(self):
+        """Clean up resources."""
+        pass
diff --git a/preamble_packages.tex b/preamble_packages.tex
deleted file mode 100644
index 596909b..0000000
--- a/preamble_packages.tex
+++ /dev/null
@@ -1,135 +0,0 @@
-%!TEX root = main.tex
-
-% LC: debug
-%==========================================================================
-%\usepackage{refcheck}
-%\usepackage[notref]{showkeys}
-%==========================================================================
-
-% LC: to be used for TRO
-%==========================================================================
-% \usepackage{mathptmx} % assumes new font selection scheme installed
-%\usepackage{times} % assumes new font selection scheme installed
-%==========================================================================
-\usepackage{comment}
-\usepackage{siunitx}
-\usepackage{relsize}
-\usepackage{ifthen}
-\usepackage[colorinlistoftodos]{todonotes}
-
-\usepackage[caption=false]{subfig}
-
-% \begin{comment}
-% % Fancy formatting 
-% \usepackage[tracking=false,kerning=true,spacing=true]{microtype}
-% \usepackage[caption=false]{subfig}
-
-% \usepackage[style=numeric-comp,sorting=none,firstinits=true, maxnames=3,bibstyle=numeric,abbreviate=false,defernums=true,eprint=false,backend=bibtex]{biblatex}
-% \renewcommand{\bibfont}{\footnotesize}
-% % \DeclareFieldFormat[article]{pages}{#1}%
-% % \DeclareFieldFormat[inproceedings]{pages}{#1}%
-
-% \AtEveryBibitem{%
-%   \ifentrytype{article}{%
-%     \clearfield{pages}%
-%   }{%
-%   }%
-%   \ifentrytype{inproceedings}{%
-%     \clearfield{pages}%
-%   }{%
-%   }%
-% }
-% \end{comment}
-
-% \bibliography{commons/bib/strings_long}
-% \bibliography{commons/bib/all_only_one_w_pages}
-% \bibliography{../../references/references}
-
-% \usepackage[noadjust]{cite}
-\usepackage[vlined,ruled,linesnumbered]{algorithm2e}
-\usepackage{graphics} % for pdf, bitmapped graphics files
-\usepackage{rotating}
-\usepackage{color}
-\usepackage{enumerate}
-\usepackage[T1]{fontenc}
-\usepackage{psfrag}
-\usepackage{epsfig} % for postscript graphics files
-%\usepackage{subfigure}
-% \usepackage{hyperref}
-\usepackage{booktabs}
-\usepackage{graphicx,url}
-\usepackage{multirow}
-\usepackage{array}
-\usepackage{latexsym}
-\usepackage{amsfonts}
-\usepackage{amsmath}
-\usepackage{amssymb}
-\usepackage{mathtools}
-%\usepackage{amsthm}
-\usepackage{xstring}
-\usepackage[noend]{algorithmic}
-\usepackage{multirow}
-\usepackage{xcolor}
-\usepackage{prettyref}
-\usepackage{flexisym}
-\usepackage{bigdelim}
-\usepackage{breqn} % load this last
-\usepackage{listings}
-\let\labelindent\relax
-\usepackage{enumitem}
-\usepackage{xspace}
-\usepackage{bm}
-\graphicspath{{./figures/}}
-\usepackage{tikz}
-\usetikzlibrary{matrix,calc}
-
-
-%\usepackage{ifpdf}
-% Heiko Oberdiek's ifpdf.sty is very useful if you need conditional
-% compilation based on whether the output is pdf or dvi.
-% usage:
-% \ifpdf
-%   % pdf code
-% \else
-%    dvi code
-% \fi
-% The latest version of ifpdf.sty can be obtained from:
-% http://www.ctan.org/tex-archive/macros/latex/contrib/oberdiek/
-% Also, note that IEEEtran.cls V1.7 and later provides a builtin
-% \ifCLASSINFOpdf conditional that works the same way.
-% When switching from latex to pdflatex and vice-versa, the compiler may
-% have to be run twice to clear warning/error messages.
-
-% *** GRAPHICS RELATED PACKAGES ***
-%
-%\ifCLASSINFOpdf
-  % \usepackage[pdftex]{graphicx}
-  % declare the path(s) where your graphic files are
-  % \graphicspath{{../pdf/}{../jpeg/}}
-  % and their extensions so you won't have to specify these with
-  % every instance of \includegraphics
-  % \DeclareGraphicsExtensions{.pdf,.jpeg,.png}
-%\else
-  % or other class option (dvipsone, dvipdf, if not using dvips). graphicx
-  % will default to the driver specified in the system graphics.cfg if no
-  % driver is specified.
-  % \usepackage[dvips]{graphicx}
-  % declare the path(s) where your graphic files are
-  % \graphicspath{{../eps/}}
-  % and their extensions so you won't have to specify these with
-  % every instance of \includegraphics
-  % \DeclareGraphicsExtensions{.eps}
-%\fi
-
-
-\usepackage{mdwlist}
-\let\stditemize\itemize
-\let\endstditemize\enditemize
-\let\itemize\undefined
-\makecompactlist{itemize}{stditemize}
-
-%\let\stdenumerate\enumerate
-%\let\endstdenumerate\endenumerate
-%\let\enumerate\undefined
-%\makecompactlist{enumerate}{stdenumerate}
- 
diff --git a/preamble_symbols.tex b/preamble_symbols.tex
deleted file mode 100644
index 584697f..0000000
--- a/preamble_symbols.tex
+++ /dev/null
@@ -1,452 +0,0 @@
-%!TEX root = main.tex
-
-% \newcommand{\qed}{{\hfill $\square$}}
-
-% Format definition
-\newrefformat{prob}{Problem\,\ref{#1}}
-\newrefformat{def}{Definition\,\ref{#1}}
-\newrefformat{sec}{Section\,\ref{#1}}
-\newrefformat{sub}{Section\,\ref{#1}}
-\newrefformat{prop}{Proposition\,\ref{#1}}
-\newrefformat{app}{Appendix\,\ref{#1}}
-\newrefformat{alg}{Algorithm\,\ref{#1}}
-\newrefformat{cor}{Corollary\,\ref{#1}}
-\newrefformat{thm}{Theorem\,\ref{#1}}
-\newrefformat{lem}{Lemma\,\ref{#1}}
-\newrefformat{fig}{Fig.\,\ref{#1}}
-\newrefformat{tab}{Table\,\ref{#1}}
-
-% Problem environment
-\newtheorem{theorem}{Theorem}
-\newtheorem{problem}{Problem}
-\newtheorem{trule}[theorem]{Rule}
-\newtheorem{corollary}[theorem]{Corollary}
-%\newtheorem{algorithm}{Algorithm}
-%\newtheorem{procedure}{\textbf{Procedure}}
-\newtheorem{conjecture}[theorem]{Conjecture}
-\newtheorem{lemma}[theorem]{Lemma}
-\newtheorem{assumption}[theorem]{Assumption}
-\newtheorem{definition}[theorem]{Definition}
-\newtheorem{proposition}[theorem]{Proposition}
-\newtheorem{remark}[theorem]{Remark}
-\newtheorem{example}[theorem]{Example}
-
-% Shortcuts
-\newcommand{\cf}{\emph{cf.}\xspace}
-\newcommand{\Figure}{Fig.}
-\newcommand{\bdmath}{\begin{dmath}}
-\newcommand{\edmath}{\end{dmath}}
-\newcommand{\beq}{\begin{equation}}
-\newcommand{\eeq}{\end{equation}}
-\newcommand{\bdm}{\begin{displaymath}}
-\newcommand{\edm}{\end{displaymath}}
-\newcommand{\bea}{\begin{eqnarray}}
-\newcommand{\eea}{\end{eqnarray}}
-\newcommand{\beal}{\beq \begin{array}{ll}}
-\newcommand{\eeal}{\end{array} \eeq}
-\newcommand{\beas}{\begin{eqnarray*}}
-\newcommand{\eeas}{\end{eqnarray*}}
-\newcommand{\ba}{\begin{array}}
-\newcommand{\ea}{\end{array}}
-\newcommand{\bit}{\begin{itemize}}
-\newcommand{\eit}{\end{itemize}}
-\newcommand{\ben}{\begin{enumerate}}
-\newcommand{\een}{\end{enumerate}}
-\newcommand{\expl}[1]{&&\qquad\text{\color{gray}(#1)}\nonumber}
-
-% \newcommand{\insertproof}[1]{%
-%     % lem:name -> proof_lem_name.tex
-%     \StrSubstitute{#1}{:}{_}[\name] % replace : with _
-%     \begin{IEEEproof} %\color[rgb]{0.8,0.8,0.8}
-%     \input{proof_\name.tex}
-%     \end{IEEEproof}
-% }
-
-% Calligraphic fonts
-\newcommand{\calA}{{\cal A}}
-\newcommand{\calB}{{\cal B}}
-\newcommand{\calC}{{\cal C}}
-\newcommand{\calD}{{\cal D}}
-\newcommand{\calE}{{\cal E}}
-\newcommand{\calF}{{\cal F}}
-\newcommand{\calG}{{\cal G}}
-\newcommand{\calH}{{\cal H}}
-\newcommand{\calI}{{\cal I}}
-\newcommand{\calJ}{{\cal J}}
-\newcommand{\calK}{{\cal K}}
-\newcommand{\calL}{{\cal L}}
-\newcommand{\calM}{{\cal M}}
-\newcommand{\calN}{{\cal N}}
-\newcommand{\calO}{{\cal O}}
-\newcommand{\calP}{{\cal P}}
-\newcommand{\calQ}{{\cal Q}}
-\newcommand{\calR}{{\cal R}}
-\newcommand{\calS}{{\cal S}}
-\newcommand{\calT}{{\cal T}}
-\newcommand{\calU}{{\cal U}}
-\newcommand{\calV}{{\cal V}}
-\newcommand{\calW}{{\cal W}}
-\newcommand{\calX}{{\cal X}}
-\newcommand{\calY}{{\cal Y}}
-\newcommand{\calZ}{{\cal Z}}
-
-% SETS:
-\newcommand{\setA}{\textsf{A}}
-\newcommand{\setB}{\textsf{B}}
-\newcommand{\setC}{\textsf{C}}
-\newcommand{\setD}{\textsf{D}}
-\newcommand{\setE}{\textsf{E}}
-\newcommand{\setF}{\textsf{F}}
-\newcommand{\setG}{\textsf{G}}
-\newcommand{\setH}{\textsf{H}}
-\newcommand{\setI}{\textsf{I}}
-\newcommand{\setJ}{\textsf{J}}
-\newcommand{\setK}{\textsf{K}}
-\newcommand{\setL}{\textsf{L}}
-\newcommand{\setM}{\textsf{M}}
-\newcommand{\setN}{\textsf{N}}
-\newcommand{\setO}{\textsf{O}}
-\newcommand{\setP}{\textsf{P}}
-\newcommand{\setQ}{\textsf{Q}}
-\newcommand{\setR}{\textsf{R}}
-\newcommand{\setS}{\textsf{S}}
-\newcommand{\setT}{\textsf{T}}
-\newcommand{\setU}{\textsf{U}}
-\newcommand{\setV}{\textsf{V}}
-\newcommand{\setX}{\textsf{X}}
-\newcommand{\setY}{\textsf{Y}}
-\newcommand{\setZ}{\textsf{Z}}
-
-%General
-\newcommand{\smallheading}[1]{\textit{#1}: }
-\newcommand{\algostep}[1]{{\small\texttt{#1:}}\xspace}
-\newcommand{\etal}{\emph{et~al.}\xspace}
-\newcommand{\setal}{~\emph{et~al.}\xspace}
-\newcommand{\eg}{\emph{e.g.,}\xspace}
-\newcommand{\ie}{\emph{i.e.,}\xspace}
-\newcommand{\myParagraph}[1]{{\bf #1.}\xspace}
-% \newcommand{\email}[1]{{\smaller \textsf{#1}}}
-
-%Typography
-\newcommand{\M}[1]{{\bm #1}} % Face for matrices
-\renewcommand{\boldsymbol}[1]{{\bm #1}}
-\newcommand{\algoname}[1]{\textsc{#1}} % Name of algorithms
-
-%Editing
-\newcommand{\towrite}{{\color{red} To write}\xspace}
-\newcommand{\xxx}{{\color{red} XXX}\xspace}
-\newcommand{\AC}[1]{{\color{red} \textbf{AC}: #1}}
-\newcommand{\LC}[1]{{\color{red} \textbf{LC}: #1}}
-\newcommand{\FM}[1]{{\color{red} \textbf{FM}: #1}}
-\newcommand{\RT}[1]{{\color{blue} \textbf{RT}: #1}}
-\newcommand{\VT}[1]{{\color{blue} \textbf{VT}: #1}}
-\newcommand{\hide}[1]{}
-\newcommand{\wrt}{w.r.t.\xspace}
-\newcommand{\highlight}[1]{{\color{red} #1}}
-\newcommand{\tocheck}[1]{{\color{brown} #1}}
-\newcommand{\grayout}[1]{{\color{gray} #1}}
-\newcommand{\grayText}[1]{{\color{gray} \text{#1} }}
-\newcommand{\grayMath}[1]{{\color{gray} #1 }}
-\newcommand{\hiddenText}{{\color{gray} hidden text.}}
-\newcommand{\hideWithText}[1]{\hiddenText}
-
-
-\newcommand{\NA}{{\sf n/a}}
-\newcommand{\versus}{\scenario{VS}\xspace}
-
-%Basic math symbols
-\newcommand{\kron}{\otimes}
-\newcommand{\dist}{\mathbf{dist}}
-\newcommand{\iter}{\! \rm{iter.} \;}
-\newcommand{\leqt}{\!\!\! < \!\!\!}
-\newcommand{\geqt}{\!\!\! > \!\!\!}
-\newcommand{\mysetminus}{-} % One set minus another
-\newcommand{\powerset}{\mathcal{P}}
-\newcommand{\Int}[1]{ { {\mathbb Z}^{#1} } }
-\newcommand{\Natural}[1]{ { {\mathbb N}^{#1} } }
-\newcommand{\Complex}[1]{ { {\mathbb C}^{#1} } }
-\newcommand{\one}{ {\mathbf{1}} }
-\newcommand{\subject}{\text{ subject to }}
-\DeclareMathOperator*{\argmax}{arg\,max}
-\DeclareMathOperator*{\argmin}{arg\,min}
-
-%% Norms
-\newcommand{\normsq}[2]{\left\|#1\right\|^2_{#2}}
-\newcommand{\norm}[1]{\left\| #1 \right\|}
-\newcommand{\normsqs}[2]{\|#1\|^2_{#2}}
-\newcommand{\infnorm}[1]{\|#1\|_{\infty}}
-\newcommand{\zeronorm}[1]{\|#1\|_{0}}
-\newcommand{\onenorm}[1]{\|#1\|_{1}}
-\newcommand{\lzero}{\ell_{0}}
-\newcommand{\lone}{\ell_{1}}
-\newcommand{\linf}{\ell_{\infty}}
-
-\newcommand{\E}{{\mathbb{E}}}
-\newcommand{\EV}{\mathbb{E}}
-\newcommand{\erf}{{\mathbf{erf}}}
-\newcommand{\prob}[1]{{\mathbb P}\left(#1\right)}
-% \newcommand{\tran}{^{\top}}
-\newcommand{\tran}{^{\mathsf{T}}}
-\newcommand{\traninv}{^{-\mathsf{T}}}
-\newcommand{\diag}[1]{\mathrm{diag}\left(#1\right)}
-\newcommand{\trace}[1]{\mathrm{tr}\left(#1\right)}
-\newcommand{\conv}[1]{\mathrm{conv}\left(#1\right)}
-\newcommand{\polar}[1]{\mathrm{polar}\left(#1\right)}
-\newcommand{\rank}[1]{\mathrm{rank}\left(#1\right)}
-\newcommand{\e}{{\mathrm e}}
-\newcommand{\inv}{^{-1}}
-\newcommand{\pinv}{^\dag}
-\newcommand{\until}[1]{\{1,\dots, #1\}}
-\newcommand{\ones}{{\mathbf 1}}
-\newcommand{\zero}{{\mathbf 0}}
-\newcommand{\eye}{{\mathbf I}}
-\newcommand{\vect}[1]{\left[\begin{array}{c}  #1  \end{array}\right]}
-\newcommand{\matTwo}[1]{\left[\begin{array}{cc}  #1  \end{array}\right]}
-\newcommand{\matThree}[1]{\left[\begin{array}{ccc}  #1  \end{array}\right]}
-\newcommand{\dss}{\displaystyle}
-\newcommand{\Real}[1]{ { {\mathbb R}^{#1} } }
-\newcommand{\reals}{\Real{}}
-\newcommand{\opt}{^{\star}}
-\newcommand{\only}{^{\alpha}}
-\newcommand{\copt}{^{\text{c}\star}}
-\newcommand{\atk}{^{(k)}}
-\newcommand{\att}{^{(t)}}
-\newcommand{\at}[1]{^{(#1)}}
-\newcommand{\attau}{^{(\tau)}}
-\newcommand{\atc}[1]{^{(#1)}}
-\newcommand{\atK}{^{(K)}}
-\newcommand{\atj}{^{(j)}}
-\newcommand{\projector}{{\tt projector}}
-\newcommand{\setdef}[2]{ \{#1 \; {:} \; #2 \} }
-\newcommand{\smalleye}{\left(\begin{smallmatrix}1&0\\0&1\end{smallmatrix}\right)}
-
-%Spaces
-\newcommand{\SEtwo}{\ensuremath{\mathrm{SE}(2)}\xspace}
-\newcommand{\SE}[1]{\ensuremath{\mathrm{SE}(#1)}\xspace}
-\newcommand{\SEthree}{\ensuremath{\mathrm{SE}(3)}\xspace}
-\newcommand{\SOtwo}{\ensuremath{\mathrm{SO}(2)}\xspace}
-\newcommand{\SOthree}{\ensuremath{\mathrm{SO}(3)}\xspace}
-\newcommand{\Othree}{\ensuremath{\mathrm{O}(3)}\xspace}
-\newcommand{\SOn}{\ensuremath{\mathrm{SO}(n)}\xspace}
-\newcommand{\SO}[1]{\ensuremath{\mathrm{SO}(#1)}\xspace}
-\newcommand{\On}{\ensuremath{\mathrm{O}(n)}\xspace}
-\newcommand{\sotwo}{\ensuremath{\mathrm{so}(2)}\xspace}
-\newcommand{\sothree}{\ensuremath{\mathrm{so}(3)}\xspace}
-\newcommand{\intexpmap}[1]{\mathrm{Exp}\left(#1\right)}
-\newcommand{\intlogmap}[1]{\mathrm{Log}\left(#1\right)}
-\newcommand{\logmapz}[1]{\mathrm{Log}_0(#1)}
-\newcommand{\loglikelihood}{\mathrm{log}\calL}
-\newcommand{\intprinlogmap}{\mathrm{Log}_0}
-\newcommand{\expmap}[1]{\intexpmap{#1}}
-\newcommand{\expmaps}[1]{\langle #1 \rangle_{2\pi}}
-\newcommand{\biggexpmap}[1]{\left\langle #1 \right\rangle_{2\pi}}
-\newcommand{\logmap}[1]{\intlogmap{#1}}
-\newcommand{\round}[1]{\mathrm{round}\left( #1 \right)}
-
-% Matrices 
-\newcommand{\MA}{\M{A}}
-\newcommand{\MB}{\M{B}}
-\newcommand{\MC}{\M{C}}
-\newcommand{\MD}{\M{D}}
-\newcommand{\ME}{\M{E}}
-\newcommand{\MJ}{\M{J}}
-\newcommand{\MK}{\M{K}}
-\newcommand{\MG}{\M{G}}
-\newcommand{\MM}{\M{M}}
-\newcommand{\MN}{\M{N}}
-\newcommand{\MP}{\M{P}}
-\newcommand{\MQ}{\M{Q}}
-\newcommand{\MU}{\M{U}}
-\newcommand{\MR}{\M{R}}
-\newcommand{\MS}{\M{S}}
-\newcommand{\MI}{\M{I}}
-\newcommand{\MV}{\M{V}}
-\newcommand{\MF}{\M{F}}
-\newcommand{\MH}{\M{H}}
-\newcommand{\ML}{\M{L}}
-\newcommand{\MO}{\M{O}}
-\newcommand{\MT}{\M{T}}
-\newcommand{\MX}{\M{X}}
-\newcommand{\MY}{\M{Y}}
-\newcommand{\MW}{\M{W}}
-\newcommand{\MZ}{\M{Z}}
-\newcommand{\MSigma}{\M{\Sigma}} 
-\newcommand{\MOmega}{\M{\Omega}}
-\newcommand{\MPhi}{\M{\Phi}}
-\newcommand{\MPsi}{\M{\Psi}}
-\newcommand{\MDelta}{\M{\Delta}}
-\newcommand{\MLambda}{\M{\Lambda}}
-
-% vectors
-\newcommand{\va}{\boldsymbol{a}} 
-\newcommand{\vh}{\boldsymbol{h}} 
-\newcommand{\vb}{\boldsymbol{b}}
-\newcommand{\vc}{\boldsymbol{c}}
-\newcommand{\vd}{\boldsymbol{d}}
-\newcommand{\ve}{\boldsymbol{e}}
-\newcommand{\vf}{\boldsymbol{f}}
-\newcommand{\vg}{\boldsymbol{g}}
-\newcommand{\vk}{\boldsymbol{k}}
-\newcommand{\vl}{\boldsymbol{l}}
-\newcommand{\vn}{\boldsymbol{n}}
-\newcommand{\vo}{\boldsymbol{o}}
-\newcommand{\vp}{\boldsymbol{p}}
-\newcommand{\vq}{\boldsymbol{q}}
-\newcommand{\vr}{\boldsymbol{r}}
-\newcommand{\vs}{\boldsymbol{s}}
-\newcommand{\vu}{\boldsymbol{u}}
-\newcommand{\vv}{\boldsymbol{v}}
-\newcommand{\vt}{\boldsymbol{t}}
-\newcommand{\vxx}{\boldsymbol{x}} 
-\newcommand{\vy}{\boldsymbol{y}}
-\newcommand{\vw}{\boldsymbol{w}}
-\newcommand{\vzz}{\boldsymbol{z}} 
-\newcommand{\vdelta}{\boldsymbol{\delta}}
-\newcommand{\vgamma}{\boldsymbol{\gamma}}  
-\newcommand{\vlambda}{\boldsymbol{\lambda}}
-\newcommand{\vtheta}{\boldsymbol{\theta}}
-\newcommand{\valpha}{\boldsymbol{\alpha}}
-\newcommand{\vbeta}{\boldsymbol{\beta}}
-\newcommand{\vnu}{\boldsymbol{\nu}}
-\newcommand{\vmu}{\boldsymbol{\mu}}
-\newcommand{\vepsilon}{\boldsymbol{\epsilon}}
-\newcommand{\vtau}{\boldsymbol{\tau}}
-
-%Intrinsic geometry
-\newcommand{\Rtheta}{\boldsymbol{R}}
-\newcommand{\symf}{f} % Symmetry function
-
-%Angles
-\newcommand{\angledomain}{(-\pi,+\pi]}
-
-% Tree, graphs, and cycle basis
-\newcommand{\MCB}{\mathsf{MCB}}
-\newcommand{\FCM}{\mathsf{FCM}}
-\newcommand{\FCB}{\mathsf{FCB}}
-\newcommand{\cyclemap}[1]{\calC^{\calG}\left(#1\right)}
-\newcommand{\incidencemap}[1]{\calA^{\calG}\left(#1\right)}
-\newcommand{\cyclemapk}{\calC^{\calG}_{k}}
-\newcommand{\incidencemapij}{\calA^{\calG}_{ij}}
-\renewcommand{\ij}{_{ij}}
-\newcommand{\foralledges}{\forall(i,j) \in \calE}
-\newcommand{\sumalledges}{
-     \displaystyle
-     \sum_{(i,j) \in \calE}}
-\newcommand{\sumalledgesm}{
-     \displaystyle
-     \sum_{i=1}^{m}}
-\newcommand{\T}{\mathsf{T}}
-\newcommand{\To}{\T_{\rm o}}
-\newcommand{\Tm}{\T_{\rm m}}
-\newcommand{\MCBa}{\MCB_{\mathsf{a}}}
-\newcommand{\FCBo}{\FCB_{\mathsf{o}}}
-\newcommand{\FCBm}{\FCB_{\mathsf{m}}}
-
-% Algorithms
-\newcommand{\algoonlyname}{MOLE2D}
-\newcommand{\algoml}{{\smaller\sf \algoonlyname}\xspace}
-\newcommand{\algocyclebasis}{\algoname{compute-cycle-basis}}
-\newcommand{\scenario}[1]{{\smaller \sf#1}\xspace}
-\newcommand{\toro}{{\smaller\sf Toro}\xspace}
-\newcommand{\gtwoo}{{\smaller\sf g2o}\xspace}
-\newcommand{\gtwooST}{{\smaller\sf g2oST}\xspace}
-\newcommand{\gtwood}{{\smaller\sf g2o{10}}\xspace}
-\newcommand{\gtsam}{{\smaller\sf gtsam}\xspace}
-\newcommand{\isam}{{\smaller\sf iSAM}\xspace}
-\newcommand{\lago}{{\smaller\sf LAGO}\xspace}
-\newcommand{\egtwoo}{{\smaller\sf \algoonlyname+g2o}\xspace}
-
-% Datasets
-%\newcommand{\grid}{\scenario{cube}}
-\newcommand{\rim}{\scenario{rim}}
-\newcommand{\cubicle}{\scenario{cubicle}}
-\newcommand{\sphere}{\scenario{sphere}}
-\newcommand{\sphereHard}{\scenario{sphere-a}}
-\newcommand{\garage}{\scenario{garage}}
-\newcommand{\torus}{\scenario{torus}}
-\newcommand{\oneloop}{\scenario{circle}}
-\newcommand{\intel}{\scenario{INTEL}}
-\newcommand{\bovisa}{\scenario{Bovisa}}
-\newcommand{\bov}{\scenario{B25b}}
-\newcommand{\fra}{\scenario{FR079}}
-\newcommand{\frb}{\scenario{FRH}}
-\newcommand{\csail}{\scenario{CSAIL}}
-\newcommand{\Ma}{\scenario{M3500}}
-\newcommand{\Mb}{\scenario{M10000}}
-\newcommand{\ATE}{\scenario{ATE}}
-\newcommand{\CVX}{\scenario{CVX}}
-\newcommand{\NEOS}{\scenario{NEOS}}
-\newcommand{\sdptThree}{\scenario{sdpt3}}
-\newcommand{\MOSEK}{\scenario{MOSEK}}
-\newcommand{\NESTA}{\scenario{NESTA}}
-\newcommand{\vertigo}{\scenario{Vertigo}}
-\newcommand{\SDPA}{\scenario{SDPA}}
-
-% \newcommand{\tablabel}[1]{%
-%     \hspace{-1mm}%
-%     \begin{sideways}{\small\scenario{#1}}\end{sideways}%
-%     \hspace{-4mm}%
-% }
-%
-% \newcommand{\tabfig}[2]{%
-%     \subfloat[\label{fig:#2} #1]{%
-%     \begin{minipage}{5.5cm}%
-%     \centering%
-%     \includegraphics[width=5.5cm,trim=4 0 4 15]{figures/#2}
-%     \end{minipage}%
-%     }%
-% }
-%
-% \newcommand{\subFigure}[3]{%
-%     \subfloat[\label{fig:#2} #1]{%
-%     \begin{minipage}{#3cm}%
-%     \centering%
-%     \includegraphics[width=#3cm,trim=4 0 4 15]{figures/#2}
-%     \end{minipage}%
-%     }%
-% }
-\newcommand{\cvx}{{\sf cvx}\xspace}
-
-% COLORS
-\newcommand{\blue}[1]{{\color{blue}#1}}
-\newcommand{\green}[1]{{\color{green}#1}}
-\newcommand{\red}[1]{{\color{red}#1}}
-
-% TO MANAGE REFERENCES
-%============================================================================
-\newcommand{\linkToPdf}[1]{\href{#1}{\blue{(pdf)}}}
-\newcommand{\linkToPpt}[1]{\href{#1}{\blue{(ppt)}}}
-\newcommand{\linkToCode}[1]{\href{#1}{\blue{(code)}}}
-\newcommand{\linkToWeb}[1]{\href{#1}{\blue{(web)}}}
-\newcommand{\linkToVideo}[1]{\href{#1}{\blue{(video)}}}
-\newcommand{\linkToMedia}[1]{\href{#1}{\blue{(media)}}}
-\newcommand{\award}[1]{\xspace} % {{\red{#1}}} % omit awards
-
-
-% PAPER-SPECIFIC COMMANDS
-%============================================================================
-
-% Linear approximation
-\newcommand{\vpose}{\boldsymbol{x}}
-\newcommand{\vz}{\boldsymbol{z}}
-\newcommand{\vDelta}{\boldsymbol{\Delta}}
-\newcommand{\vposesub}{\hat{\vpose}}
-\newcommand{\vpossub}{\hat{\vpos}}
-\newcommand{\vthetasub}{\hat{\vtheta}}
-\newcommand{\Pthetasub}{\MP_\vtheta}
-\newcommand{\thetasub}{\hat{\theta}}
-\newcommand{\vposecorr}{\tilde{\vpose}}
-\newcommand{\vposcorr}{\tilde{\vpos}}
-\newcommand{\vthetacorr}{\tilde{\vtheta}}
-\newcommand{\vposestar}{{\vpose}^{\star}}
-\newcommand{\vposstar}{{\vpos}^{\star}}
-\newcommand{\vthetastar}{{\vtheta}^{\star}}
-\newcommand{\vcthetastar}{{\vctheta}^{\star}}
-\newcommand{\pose}{\boldsymbol{x}}
-\newcommand{\pos}{\boldsymbol{p}}
-\newcommand{\mease}{z} % element
-\newcommand{\meas}{\boldsymbol{z}} % vector
-\newcommand{\meashat}{\hat{\meas}}
-
-
-
diff --git a/requirements.txt b/requirements.txt
new file mode 100644
index 0000000..7b8b3f5
--- /dev/null
+++ b/requirements.txt
@@ -0,0 +1,6 @@
+torch>=2.0.0
+gymnasium>=0.29.0
+numpy>=1.24.0
+scipy>=1.10.0
+matplotlib>=3.7.0
+pandas>=2.0.0
diff --git a/sections/abstract.tex b/sections/abstract.tex
deleted file mode 100644
index e1d8e8b..0000000
--- a/sections/abstract.tex
+++ /dev/null
@@ -1,5 +0,0 @@
-%!TEX root = ../main.tex
-
-\begin{abstract}
-    Brief description of the problem, your solution, and the results.
-\end{abstract}
\ No newline at end of file
diff --git a/sections/app-proof-convergence.tex b/sections/app-proof-convergence.tex
deleted file mode 100644
index 1c6e269..0000000
--- a/sections/app-proof-convergence.tex
+++ /dev/null
@@ -1,7 +0,0 @@
-%!TEX root = ../main.tex
-
-\section{Proof of Theorem \ref{thm:convergence} }
-\label{sec:app-proof-convergence}
-\begin{proof}
-    Here is my proof.
-\end{proof}
\ No newline at end of file
diff --git a/sections/conclusion.tex b/sections/conclusion.tex
deleted file mode 100644
index 15bd700..0000000
--- a/sections/conclusion.tex
+++ /dev/null
@@ -1,5 +0,0 @@
-%!TEX root = ../main.tex
-\section{Conclusions}
-\label{sec:conclusions}
-
-Conclusions and potentially future research directions.
\ No newline at end of file
diff --git a/sections/experiments.tex b/sections/experiments.tex
deleted file mode 100644
index 265c11b..0000000
--- a/sections/experiments.tex
+++ /dev/null
@@ -1,32 +0,0 @@
-%!TEX root = ../main.tex
-\section{Experiments}
-\label{sec:experiments}
-
-How does your algorithm work and compare with others? What insights have you gained from the experiments? Use figures (see Figure \ref{fig:1} for example) and tables (see Table \ref{tab:1} for example) to better present your results.
-
-\begin{figure}[ht!]
-\centering
-\includegraphics[width=0.75\textwidth]{figure/SEASLogo.pdf}
-\label{fig:1}
-\caption{This is the caption for the figure.}
-\end{figure}
-
-\begin{table}[ht!]
-\centering
-\begin{tabular}{|c|c c c|} 
- \hline
-  &Col1 & Col2 & Col3 \\ [0.5ex] 
- \hline
- 1 & 6 & 87837 & 787 \\ 
- 2 & 7 & 78 & 5415 \\
- 3 & 545 & 778 & 7507 \\[1ex] 
- \hline
-\end{tabular}
-\caption{This is the caption for the table.}
-\label{tab:1}
-\end{table}
-
-\subsection{First case}
-
-Use subsections to separate different experiment settings, if needed.
-
diff --git a/sections/formulation.tex b/sections/formulation.tex
deleted file mode 100644
index 9519756..0000000
--- a/sections/formulation.tex
+++ /dev/null
@@ -1,11 +0,0 @@
-%!TEX root = ../main.tex
-\section{Problem Formulation}
-\label{sec:formulation}
-
-Mathematical formulation of your problem. For example
-\bea 
-\min_{u(t)} & \displaystyle \int_{0}^T g(x,u) dt + h(x(T)) \label{eq:1} \\
-\subject & \dot{x} = f(x,u)
-\eea 
-
-Equation \eqref{eq:1} can be referred by setting up its label.
\ No newline at end of file
diff --git a/sections/introduction.tex b/sections/introduction.tex
deleted file mode 100644
index ea097f1..0000000
--- a/sections/introduction.tex
+++ /dev/null
@@ -1,16 +0,0 @@
-%!TEX root = ../main.tex
-\section{Introduction}
-\label{sec:intro}
-
-Introduce your work. 
-\begin{itemize}
-\item Why is it important? 
-\item What's the motivation?
-\item What's your novelty?
-\end{itemize}
-
-Numbered list also helps summarizing the main contributions.
-\begin{enumerate}
-\item First point.
-\item Second point.
-\end{enumerate}
\ No newline at end of file
diff --git a/sections/method.tex b/sections/method.tex
deleted file mode 100644
index c24dc68..0000000
--- a/sections/method.tex
+++ /dev/null
@@ -1,36 +0,0 @@
-%!TEX root = ../main.tex
-\section{Solution Method}
-\label{sec:method}
-
-Describe your algorithm and its properties.
-
-\begin{algorithm}
-\label{alg:1}
-\caption{Calculate $y = x^n$}
-\begin{algorithmic} 
-\REQUIRE $n \geq 0 \vee x \neq 0$
-\ENSURE $y = x^n$
-\STATE $y \leftarrow 1$
-\IF{$n < 0$}
-\STATE $X \leftarrow 1 / x$
-\STATE $N \leftarrow -n$
-\ELSE
-\STATE $X \leftarrow x$
-\STATE $N \leftarrow n$
-\ENDIF
-\WHILE{$N \neq 0$}
-\IF{$N$ is even}
-\STATE $X \leftarrow X \times X$
-\STATE $N \leftarrow N / 2$
-\ELSE[$N$ is odd]
-\STATE $y \leftarrow y \times X$
-\STATE $N \leftarrow N - 1$
-\ENDIF
-\ENDWHILE
-\end{algorithmic}
-\end{algorithm}
-
-\begin{theorem}[Convergence]
-    \label{thm:convergence}
-    My Algorithm \ref{alg:1} is good.
-\end{theorem}
\ No newline at end of file
diff --git a/sections/related-work.tex b/sections/related-work.tex
deleted file mode 100644
index 1c0d0a7..0000000
--- a/sections/related-work.tex
+++ /dev/null
@@ -1,6 +0,0 @@
-%!TEX root = ../main.tex
-\section{Related Work}
-\label{sec:related-work}
-
-Cite some important works in this section, for example, ~\cite{bertsekas12book-optimalcontrol}. 
-Compare them with your project. One can also combine this section with Section \ref{sec:intro}.
\ No newline at end of file
diff --git a/shortcuts.tex b/shortcuts.tex
deleted file mode 100644
index 9014fd8..0000000
--- a/shortcuts.tex
+++ /dev/null
@@ -1,106 +0,0 @@
-%!TEX root = main.tex
-
-\newcommand{\Sn}{\mathbb{S}^n}
-\newcommand{\R}{\mathbb{R}}
-\newcommand{\cA}{\mathcal{A}}
-\newcommand{\cB}{\mathcal{B}}
-\newcommand{\cL}{\mathcal{L}}
-\renewcommand{\norm}[1]{\left\lVert #1 \right\rVert}
-\newcommand{\inprod}[2]{\left\langle #1, #2 \right\rangle}
-\newcommand{\vectorize}[1]{\mathrm{vec}\parentheses{#1}}
-
-\newcommand{\nnReal}[1]{\mathbb{R}_{+}^{#1}}
-\newcommand{\vcat}{\ ;\ }
-\newcommand{\mymid}{\ \middle\vert\ }
-\newcommand{\cbrace}[1]{\left\{#1\right\}}
-\newcommand{\sym}[1]{\mathbb{S}^{#1}}
-\newcommand{\calAadj}{\calA^{*}}
-\newcommand{\bary}{\bar{y}}
-\newcommand{\barC}{\bar{C}}
-\newcommand{\barcalA}{\bar{\calA}}
-\newcommand{\barcalAadj}{\bar{\calA}^{*}}
-\newcommand{\bmat}{\left[ \begin{array}}
-\newcommand{\emat}{\end{array}\right]}
-\newcommand{\psd}[1]{\sym{#1}_{+}}
-\newcommand{\parentheses}[1]{\left(#1\right)}
-\newcommand{\half}{\frac{1}{2}}
-
-\newcommand{\usphere}[1]{\calS^{#1}}
-\newcommand{\hpartial}{\hat{\partial}}
-\newcommand{\baralpha}{\bar{\alpha}}
-\newcommand{\tldW}{\widetilde{\MW}}
-\newcommand{\bareta}{\bar{\eta}}
-\newcommand{\tWnu}{\tilde{W}_{\nu}}
-\newcommand{\tWzero}{\tilde{W}_{0}}
-\newcommand{\tWone}{\tilde{W}_{1}}
-\newcommand{\tWhalf}{\tilde{W}_{1/2}}
-\newcommand{\Qa}{Q_{\alpha}}
-\newcommand{\Qb}{Q_{\baralpha}}
-\newcommand{\tV}{\tilde{V}}
-\newcommand{\tVzero}{\tV_{0}}
-\newcommand{\tVhalf}{\tV_{1/2}}
-\newcommand{\tVone}{\tV_{1}}
-\newcommand{\tVnu}{\tV_{\nu}}
-\newcommand{\Mnu}{M_{\nu}}
-\newcommand{\tMnu}{\tilde{M}_{\nu}}
-\newcommand{\tM}{\tilde{M}}
-\newcommand{\hV}{\hat{V}}
-\newcommand{\hM}{\hat{M}}
-\newcommand{\hMnu}{\hat{M}_{\nu}}
-\newcommand{\Omegahalf}{\Omega^{.5}}
-\newcommand{\bracket}[1]{\left[#1\right]}
-\newcommand{\abs}[1]{\left|#1\right|}
-\newcommand{\dx}{\dot{x}}
-\newcommand{\bbU}{\mathbb{U}}
-\newcommand{\bbX}{\mathbb{X}}
-\newcommand{\eqcon}[1]{c_{\mathrm{eq},#1}}
-\newcommand{\ineqcon}[1]{c_{\mathrm{ineq},#1}}
-\newcommand{\epsfeqcon}[1]{c_{f,\mathrm{eq},#1}}
-\newcommand{\epsfineqcon}[1]{c_{f,\mathrm{ineq},#1}}
-\newcommand{\epsgeqcon}[1]{c_{g,\mathrm{eq},#1}}
-\newcommand{\epsgineqcon}[1]{c_{g,\mathrm{ineq},#1}}
-\newcommand{\numeqepsf}{l_{f,\mathrm{eq}}}
-\newcommand{\numineqepsf}{l_{f,\mathrm{ineq}}}
-\newcommand{\numeqepsg}{l_{g,\mathrm{eq}}}
-\newcommand{\numineqepsg}{l_{g,\mathrm{ineq}}}
-\newcommand{\numeq}{l_{\mathrm{eq}}}
-\newcommand{\numineq}{l_{\mathrm{ineq}}}
-\newcommand{\epsf}{\epsilon_f}
-\newcommand{\epsg}{\epsilon_g}
-\newcommand{\longmid}{\ \middle\vert\ }
-\newcommand{\setxepsf}{\mathbb{X}_{f}}
-\newcommand{\setxepsg}{\mathbb{X}_{g}}
-\newcommand{\dotb}{\dot{b}}
-\newcommand{\poly}[1]{\mathbb{R}[#1]}
-\newcommand{\sos}[1]{\Sigma[#1]}
-\newcommand{\peps}{p_{\epsilon}}
-\newcommand{\qeps}{q_{\epsilon}}
-\newcommand{\ceil}[1]{\left\lceil #1 \right\rceil}
-\newcommand{\Ceq}[1]{C_{\mathrm{eq},#1}}
-\newcommand{\Cineq}[1]{C_{\mathrm{ineq},#1}}
-\newcommand{\uineqcon}[1]{c_{u,#1}}
-\newcommand{\numinequ}{l_{u}}
-\newcommand{\bbK}{\mathbb{K}}
-\newcommand{\numtheta}{n_{\theta}}
-\newcommand{\uref}{u_{\mathrm{ref}}}
-\newcommand{\xc}{x_c}
-\newcommand{\yc}{y_c}
-\newcommand{\xo}{x_o}
-\newcommand{\yo}{y_o}
-\newcommand{\HYedit}[1]{\blue{#1}}
-\newcommand{\tldp}{\widetilde{p}}
-\newcommand{\hatp}{\widehat{p}}
-\newcommand{\tldR}{\widetilde{R}}
-\newcommand{\hats}{\widehat{s}}
-\newcommand{\hatR}{\widehat{R}}
-\newcommand{\hatt}{\widehat{t}}
-\newcommand{\tldcalY}{\widetilde{\calY}}
-\newcommand{\hatcalR}{\widehat{\calR}}
-\newcommand{\tldcalR}{\widetilde{\calR}}
-\newcommand{\tldTheta}{\widetilde{\Theta}}
-\newcommand{\floor}[1]{\lfloor #1 \rfloor}
-\newcommand{\mysum}[1]{\text{sum}\parentheses{#1}}
-\newcommand{\barcalI}{\bar{\calI}}
-\newcommand{\barpi}{\bar{\pi}}
-\newcommand{\sosone}{\mathrm{SOS}\text{-}1}
-\newcommand{\ab}{\widetilde{ab}}
\ No newline at end of file