# main.py -- command-line entry point of Wildfire-Control-Python
# (dashdeckers/Wildfire-Control-Python, master branch)

# Argument handling
#
# Flags:
#   -r/--run       start a learning session instead of the interactive mode
#   -m/--memories  number of demonstration runs used to initialise the agent
#   -e/--episodes  number of episodes / runs to learn for
#   -t/--type      which algorithm to use (or "Human")
#   -n/--name      name given to the saved log and model files
import argparse
parser = argparse.ArgumentParser()

parser.add_argument("-r", "--run", action="store_true",
                    help="Start the learning process")

parser.add_argument("-m", "--memories", type=int, default=100,
                    help="Number of runs of demonstration data to initialize with")

parser.add_argument("-e", "--episodes", type=int, default=10000,
                    help="Number of episodes / runs to learn for")

parser.add_argument("-t", "--type", type=str, default="DQN",
                    choices=["DQN", "SARSA", "DDQN", "BOTH", "Baseline", "Human"],
                    help="The algorithm to use")

parser.add_argument("-n", "--name", type=str, default="no_name",
                    help="A custom name to give the saved log and model files")

args = parser.parse_args()

# A learning session must be given an explicit name rather than silently
# falling back to the "no_name" placeholder default.
if args.run and args.name == "no_name":
    parser.error("You should provide a name when running a learning session")

# `choices` restricts --type to the six values above, so "not Human" covers
# exactly the algorithm types. An episode count of zero or below is rejected:
# a negative value is no more meaningful than 0.
if args.type != "Human" and args.episodes <= 0:
    parser.error("You should specify the number of episodes for the algorithm")

# Suppress the many unnecessary TensorFlow warnings.
# TF_CPP_MIN_LOG_LEVEL controls TensorFlow's native (C++) logging, so it is
# exported *before* the package is imported; otherwise messages emitted while
# TensorFlow is loading are printed regardless. '3' keeps only fatal messages.
import os
import sys
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
import tensorflow as tf
# Python-side logger: only report errors.
# NOTE(review): `tf.logging` is the TensorFlow 1.x API -- confirm the pinned
# TensorFlow version before upgrading.
tf.logging.set_verbosity(tf.logging.ERROR)


# Create the simulation
# One ForestFire instance, built with its default constructor arguments, is
# passed to every agent (or to the human-play mode) created further down.
from Simulation.forest_fire import ForestFire
forestfire = ForestFire()


# Run the simulation in human mode.
# Human mode needs no agent, so it is handled before anything else. This also
# covers `--run --type Human`, which would otherwise reach the agent
# construction below without any DQN class having been imported (NameError).
if args.type == "Human":
    from misc import run_human
    run_human(forestfire)

# Start learning straight away
elif args.run:
    if args.type == "Baseline":
        print(f"Running Baseline with {args.episodes} episodes")
    else:
        print(f"Running {args.type} with {args.memories} "
              f"memories and {args.episodes} episodes")

    # Import only the selected agent class, always under the name `DQN`.
    # "Baseline" uses the plain DQN class as well.
    if args.type in ("DQN", "Baseline"):
        from DQN import DQN
    elif args.type == "SARSA":
        from DQN_SARSA import DQN_SARSA as DQN
    elif args.type == "DDQN":
        from DQN_DUEL import DQN_DUEL as DQN
    elif args.type == "BOTH":
        from DQN_BOTH import DQN_BOTH as DQN

    Agent = DQN(forestfire, args.name)

    if args.type == "Baseline":
        # The baseline only collects memories (in baseline mode) for the
        # requested number of episodes; no learning step follows.
        Agent.collect_memories(args.episodes, perform_baseline=True)
    else:
        # Seed the agent with demonstration runs, then learn.
        Agent.collect_memories(args.memories)
        Agent.learn(args.episodes)

# Don't start learning: just import everything for interactive mode
else:
    from misc import run_human, time_simulation_run
    from DQN import DQN
    from DQN_SARSA import DQN_SARSA
    from DQN_DUEL import DQN_DUEL
    from DQN_BOTH import DQN_BOTH

    # Create the agents. Each class name is deliberately rebound to an
    # instance so that the interactive user can call e.g. `DQN.load_model`
    # directly.
    DQN = DQN(forestfire, verbose=False)
    DQN_SARSA = DQN_SARSA(forestfire, verbose=False)
    DQN_DUEL = DQN_DUEL(forestfire, verbose=False)
    DQN_BOTH = DQN_BOTH(forestfire, verbose=False)

    # Get a list of imported algorithms to play with: every module-level name
    # except dunders and the plumbing (modules, parser objects, the
    # environment class). No helper variable is introduced before `dir()`
    # runs, since it would show up in the listing itself.
    options = [
        o for o in dir()
        if not o.startswith("__")
        and o not in {"os", "sys", "code", "tf", "argparse",
                      "args", "parser", "ForestFire"}
    ]
    # Display those algorithms for ease of use
    msg = (
        "\nImported the following functions and algorithms for interactive mode:"
        f"\n{options}\n"
        "Load a model with .load_model, play optimally with .play_optimal.\n"
    )
    # Drop the user in the interpreter, if the script is not already called with -i
    if sys.flags.interactive:
        print(msg)
    else:
        import code
        # At module level locals() is the module namespace, so the console
        # sees every name imported or created above.
        code.interact(banner=msg, local=locals())