-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathatari.py
100 lines (86 loc) · 3.13 KB
/
atari.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
import numpy as np
from numpy.core.numeric import Inf
import gym
from genes import *
from geneticOptimizer import *
from atari_env import *
from atari_help import *
import multiprocessing as mp
import json
import sys
class Game:
    """Fitness evaluator that scores individuals by playing Atari boxing.

    An instance is handed to ``GeneticOptimizer`` (see the training branch of
    the script below), which is expected to call ``calculateFitness``.
    """

    def __init__(self):
        # Environment used by ``battle`` to play a game for one individual.
        self.environment = AtariEnv(game="boxing")

    def battle(self, ind):
        """Play one game with ``ind`` and return its fitness.

        The raw result of ``run_game`` is shifted by +20.
        NOTE(review): the offset presumably keeps fitness non-negative for
        the optimizer -- confirm against the score range of ``run_game``.
        """
        score = run_game(self.environment, ind, False)
        return score + 20

    def calculateFitnessHelp(self, all):
        """Evaluate every individual in parallel and store its fitness.

        Args:
            all: iterable of individuals exposing ``setFitness``. (The name
                shadows the builtin; it is kept so existing callers that pass
                it by keyword keep working.)

        Side effects:
            Calls ``setFitness`` on each individual and prints the mean
            fitness of the batch. Does nothing for an empty batch.
        """
        # Materialise once: the batch is iterated twice (map, then zip).
        individuals = list(all)
        if not individuals:
            # Nothing to evaluate; avoids spawning workers and a NaN mean.
            return

        # Leave one core free, but never request zero workers:
        # ``mp.Pool(0)`` raises ValueError on single-core machines.
        worker_count = max(1, mp.cpu_count() - 1)

        # The context manager tears the pool down even if a worker raises,
        # so no worker processes are leaked on failure.
        with mp.Pool(worker_count) as pool:
            scores = pool.map(self.battle, individuals)

        for individual, score in zip(individuals, scores):
            individual.setFitness(score)
        print(np.mean(scores))

    def calculateFitness(self, population, _):
        """Flatten ``population`` and evaluate all individuals in one batch.

        Args:
            population: iterable of mappings, each with an ``"individuals"``
                entry holding that group's individuals.
            _: unused second argument, accepted for the caller's signature.
        """
        individuals = [
            individual
            for group in population
            for individual in group["individuals"]
        ]
        self.calculateFitnessHelp(individuals)
if __name__ == "__main__":
    if len(sys.argv) > 1:
        # Replay mode: any command-line argument skips training and plays a
        # previously saved individual instead.
        with open("atari_meta_194.json", "r") as fm:
            meta = Genes.Metaparameters.load(fm)
        with open("atari_best_194.json", "r") as fg:
            best = Genes.load(fg, meta)

        game = Game()
        # game.calculateFitnessHelp(population)
        # best = max(population, key=lambda ind: ind.getFitness())
        # fout = open("atari_best_194.json", "w")
        # best.save(fout)
        # fout.close()
        try:
            # NOTE(review): the third and fourth arguments are presumably a
            # render flag and a step limit -- confirm in atari_help.run_game.
            run_game(game.environment, best, True, 999999999999999)
        finally:
            # Release the environment even if the replay raises.
            game.environment.close()
    else:
        # Training mode: evolve a population, save the results, then play
        # the best individual.
        inputs = 128
        outputs = 4
        base = Genes(inputs, outputs, Genes.Metaparameters(
            perturbation_chance=0.5,
            perturbation_stdev=0.5,
            new_link_weight_stdev=4,
            new_node_chance=0.15,
            c1=1.7, c2=1.7, c3=1.2,
            allow_recurrent=False))

        # Seed the population with 150 clones, each mutated 50 times.
        population = [base.clone() for _ in range(150)]
        for ind in population:
            for _ in range(50):
                ind.mutate()
            #for output_node_index in range(outputs):
            #    for input_node_index in range(inputs):
            #        ind.add_connection(ind.input_node_index(input_node_index), ind.output_node_index(output_node_index))
            #    ind.add_connection(Genes.BIAS_INDEX, ind.output_node_index(output_node_index))

        game = Game()
        # NOTE(review): 300 is presumably the number of generations --
        # confirm against GeneticOptimizer's constructor.
        optimizer = GeneticOptimizer(population, game, 300)
        optimizer.initialize()
        optimizer.evolve()
        best = optimizer.getBestIndividual()

        # ``with`` guarantees each file is flushed and closed even if
        # serialisation raises part-way through.
        with open("atari_best.json", "w") as f:
            best.save(f)

        # Flatten the per-species groups into one list before dumping.
        all_inds = [
            individual
            for species in optimizer.getPopulation()
            for individual in species["individuals"]
        ]
        with open("atari_population.json", "w") as f:
            f.write(json.dumps([ind.as_json() for ind in all_inds]))

        with open("atari_meta.json", "w") as f:
            best._metaparameters.save(f)

        # Play the best individual on a fresh environment.
        environment = AtariEnv(game="boxing")
        try:
            run_game(environment, best, True, 99999999999999999999999)
        finally:
            environment.close()