"""
This script is used to evaluate the performance of the ev2gym environment.
"""
from ev2gym.models.ev2gym_env import EV2Gym
from ev2gym.baselines.gurobi_models.tracking_error import PowerTrackingErrorrMin
from ev2gym.baselines.gurobi_models.PST_V2G_profit_max import PST_V2GProfitMaxOracleGB
from ev2gym.baselines.gurobi_models.PST_V2G_profit_max_mo import mo_PST_V2GProfitMaxOracleGB
from ev2gym.utilities.utils import print_statistics
# from ev2gym.baselines.gurobi_models.profit_max import V2GProfitMaxOracleGB
# from ev2gym.baselines.mpc.ocmf_mpc import OCMF_V2G, OCMF_G2V
from ev2gym.baselines.mpc.eMPC import eMPC_V2G, eMPC_G2V
# from ev2gym.baselines.mpc.V2GProfitMax import V2GProfitMaxOracle
from ev2gym.baselines.heuristics import RoundRobin, ChargeAsLateAsPossible, ChargeAsFastAsPossible, RoundRobin_GF
# from ev2gym.baselines.heuristics import RoundRobin_GF_off_allowed, RoundRobin_GF
# from ev2gym.baselines.heuristics import ChargeAsFastAsPossibleToDesiredCapacity
# from GNN.state import PublicPST_GNN
from ev2gym.rl_agent.reward import SimpleReward, ProfitMax_TrPenalty_UserIncentives
from ev2gym.rl_agent.state import PublicPST
from utils import PST_V2G_ProfitMax_reward, PST_V2G_ProfitMaxGNN_state, PST_V2G_ProfitMax_state, PST_V2G_ProfitMax_state_to_GNN
from ev2gym.baselines.mpc.eMPC_v2 import eMPC_V2G_v2
import numpy as np
import matplotlib.pyplot as plt
import gymnasium as gym
from tqdm import tqdm
import yaml
import os


def eval():
    """
    Runs an evaluation of the ev2gym environment.
    """
    save_plots = True

    replay_path = "./replay/replay_sim_2024_02_21_056441.pkl"
    replay_path = None

    config_file = "./config_files/PST_V2G_ProfixMax_25.yaml"
    # config_file = "./config_files/PST_V2G_ProfixMax_250.yaml"

    # env = EV2Gym(config_file=config_file,
    #              load_from_replay_path=replay_path,
    #              verbose=False,
    #              save_replay=True,
    #              save_plots=save_plots,
    #              state_function=PublicPST_GNN,
    #              reward_function=SimpleReward,
    #              )
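
    # Generate a fresh random scenario; save_replay=True stores it on disk so the
    # same scenario can be reloaded later for the offline oracle baselines.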
    env = EV2Gym(config_file=config_file,
                 generate_rnd_game=True,
                 save_replay=True,
                 save_plots=save_plots,
                 # lightweight_plots=True,
                 reward_function=PST_V2G_ProfitMax_reward,
                 state_function=PST_V2G_ProfitMax_state,
                 verbose=False,
                 )

    with open(config_file, 'r') as f:
        config = yaml.load(f, Loader=yaml.FullLoader)

    _, _ = env.reset()

    agent = RoundRobin_GF(env, verbose=False)
    # agent = ChargeAsFastAsPossible()
    # agent = eMPC_V2G_v2(env,
    #                     control_horizon=10,
    #                     MIPGap=0.1,
    #                     time_limit=30,
    #                     verbose=True)
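
    # First pass: roll out the selected heuristic agent over the full simulation horizon.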
    for _ in range(env.simulation_length):
        # actions = np.ones(env.cs*env.number_of_ports_per_cs)
        actions = agent.get_action(env)
        # actions = 2*np.random.rand(env.action_space.shape[0]) - 1

        new_state, reward, done, truncated, stats = env.step(
            actions)  # takes action

        # gnn_state = PST_V2G_ProfitMax_state_to_GNN(new_state, config)
        # print(f"\n\nConverted GNN state:\n{gnn_state}")
        # print(f' env features: {gnn_state.env_features}')
        # print(f' EVs features: {gnn_state.ev_features}')
        # print(f' CSs features: {gnn_state.cs_features}')
        # print(f' TRs features: {gnn_state.tr_features}')
        # print(f' edges: {gnn_state.edge_index}')
        # print(f' action_mapper: {gnn_state.action_mapper}')
        # print(f' ev_indexes: {gnn_state.ev_indexes}')
        # print(f' cs_indexes: {gnn_state.cs_indexes}')
        # print(f' tr_indexes: {gnn_state.tr_indexes}')
        # print(f' env_indexes: {gnn_state.env_indexes}')
        # print(f' sample node length: {gnn_state.sample_node_length}')
        # print(f' node types: {gnn_state.node_types}')

        # og_gnn_state = PST_V2G_ProfitMaxGNN_state(env)
        # print('---\nOG GNN state:\n', PST_V2G_ProfitMaxGNN_state(env))
        # print(f' env features: {og_gnn_state.env_features}')
        # print(f' EVs features: {og_gnn_state.ev_features}')
        # print(f' CSs features: {og_gnn_state.cs_features}')
        # print(f' TRs features: {og_gnn_state.tr_features}')
        # print(f' edges: {og_gnn_state.edge_index}')
        # print(f' action_mapper: {og_gnn_state.action_mapper}')
        # print(f' ev_indexes: {og_gnn_state.ev_indexes}')
        # print(f' cs_indexes: {og_gnn_state.cs_indexes}')
        # print(f' tr_indexes: {og_gnn_state.tr_indexes}')
        # print(f' env_indexes: {og_gnn_state.env_indexes}')
        # print(f' sample node length: {og_gnn_state.sample_node_length}')
        # print(f' node types: {og_gnn_state.node_types}')

        # assert (gnn_state.env_features == og_gnn_state.env_features).all()
        # assert (gnn_state.ev_features == og_gnn_state.ev_features).all()
        # assert (gnn_state.cs_features == og_gnn_state.cs_features).all()
        # assert (gnn_state.tr_features == og_gnn_state.tr_features).all()
        # assert (gnn_state.edge_index == og_gnn_state.edge_index).all()
        # assert (gnn_state.action_mapper == og_gnn_state.action_mapper).all()
        # assert (gnn_state.ev_indexes == og_gnn_state.ev_indexes).all()
        # assert (gnn_state.cs_indexes == og_gnn_state.cs_indexes).all()
        # assert (gnn_state.tr_indexes == og_gnn_state.tr_indexes).all()
        # assert (gnn_state.env_indexes == og_gnn_state.env_indexes).all()
        # assert (gnn_state.sample_node_length == og_gnn_state.sample_node_length)
        # assert (gnn_state.node_types == og_gnn_state.node_types).all()

        # input("Press Enter to continue...")
        # input("Press Enter to continue...")

        if done:
            # print(stats)
            print_statistics(env)
            break

    return
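
    # NOTE: the early return above skips everything below. Remove it to reload the
    # saved replay and evaluate an offline baseline on the identical scenario.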
    new_replay_path = f"replay/replay_{env.sim_name}.pkl"

    env = EV2Gym(config_file=config_file,
                 load_from_replay_path=new_replay_path,
                 save_plots=save_plots,
                 reward_function=PST_V2G_ProfitMax_reward,
                 state_function=PST_V2G_ProfitMax_state,
                 )
    # env = BinaryAction(env)

    state, _ = env.reset()

    ev_profiles = env.EVs_profiles
    max_time_of_stay = max([ev.time_of_departure - ev.time_of_arrival
                            for ev in ev_profiles])
    min_time_of_stay = min([ev.time_of_departure - ev.time_of_arrival
                            for ev in ev_profiles])

    print(f'Number of EVs: {len(ev_profiles)}')
    print(f'Max time of stay: {max_time_of_stay}')
    print(f'Min time of stay: {min_time_of_stay}')
    # exit()
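
    # Candidate baselines for the replayed scenario; the active one,
    # mo_PST_V2GProfitMaxOracleGB, is a Gurobi-based oracle solved over the
    # saved replay with a 120 s time limit.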
    # agent = OCMF_V2G(env, control_horizon=30, verbose=True)
    # agent = OCMF_G2V(env, control_horizon=25, verbose=True)
    # agent = eMPC_V2G(env, control_horizon=25, verbose=True)
    # agent = V2GProfitMaxOracle(env, verbose=True)
    # agent = PowerTrackingErrorrMin(new_replay_path)
    # agent = PST_V2GProfitMaxOracleGB(new_replay_path)
    agent = mo_PST_V2GProfitMaxOracleGB(new_replay_path,
                                        timelimit=120,
                                        MIPGap=None,
                                        verbose=True)
    # agent = eMPC_G2V(env, control_horizon=15, verbose=False)
    # agent = RoundRobin(env, verbose=False)
    # agent = ChargeAsLateAsPossible(verbose=False)
    # agent = ChargeAsFastAsPossible()
    # agent = ChargeAsFastAsPossibleToDesiredCapacity()
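
    # Second pass: apply the selected agent's actions step by step on the replayed scenario.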
    for _ in range(env.simulation_length):
        # actions = np.random.rand(env.action_space.shape[0])
        actions = agent.get_action(env)

        new_state, reward, done, truncated, stats = env.step(
            actions)  # takes action

        if done:
            print_statistics(env)
            break


if __name__ == "__main__":
    # eval()
    # exit()

    successfully_evaluated = 0
    failed_evaluations = 0
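
    # Keep evaluating freshly generated scenarios indefinitely, counting how many
    # runs complete and how many raise an exception.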
    while True:
        try:
            eval()
            successfully_evaluated += 1
            print(
                f"Successfully evaluated: {successfully_evaluated} / {successfully_evaluated + failed_evaluations}")
        except Exception as e:
            print(e)
            failed_evaluations += 1
            print(
                f"Failed evaluations: {failed_evaluations} / {successfully_evaluated + failed_evaluations}")
            # continue