-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathNeuroTanks.elm
277 lines (238 loc) · 7.94 KB
/
NeuroTanks.elm
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
module NeuroTanks exposing (Tank, Simulation,
sim0, genSim, genGen, stepTank, simulate, drawMine, drawSim)
import Vec2 exposing (..)
import Genetics exposing (..)
import NeuralNet exposing (NeuralNet)
import Color exposing (red, green, grey)
import Collage exposing (Form, filled, outlined, rect, solid, rotate)
import ClassicalEngine exposing
(Circle, OBR, wrap2, collideOBRxCircle, drawObstacle, drawOBR)
import Random exposing (Generator)
import Random.Float exposing (standardNormal)
import Time exposing (Time)
import Set exposing (Set)
import Array exposing (Array)
--- CONSTANTS ---
-- mines are circles with this radius
mineSize : Float
mineSize = 5
-- tanks are squares with this width
tankSize : Float
tankSize = 20
-- there are this many mines in the play area
numMines : Int
numMines = 40
-- this many players, including one human, each control a tank
numTanks : Int
numTanks = 16
-- each round lasts this long
genTime : Time
genTime = 30 * Time.second
-- the score is visible for this long after each round
overTime : Time
overTime = 3 * Time.second
-- the left and right tank treads may each go this fast
treadMax : Float
treadMax = 70
-- bots must remain within this radius to gain fitness points
fitnessRadius : Float
fitnessRadius = 100
-- a bot receives this many points for disarming a mine
fitnessBonus : Float
fitnessBonus = 100
-- the ratio of children which are not direct copies of their parents
crossoverChance : Float
crossoverChance = 0.6
brainStructure : List Int
brainStructure = [2, 3, 2]
--- STRUCTURES ---
type alias Tank = OBR
{ treads : Vec2
, inv : Set Vec2
, brain : NeuralNet
, strategy : NeuralNet
, fitness : Float
}
type alias Mine = Circle
type alias Simulation =
{ size : Vec2
, tanks : List Tank
, mines : List Mine
, reset : Time
, generation : Int
}
--- SIMULATION ---
tank0 : Tank
tank0 =
{ o = (0, 0)
, dir = (1, 0)
, size = (tankSize, tankSize)
, treads = (0, 0)
, inv = Set.empty
, brain = []
, strategy = []
, fitness = 0
}
sim0 : Simulation
sim0 =
{ size = (0, 0)
, tanks = []
, mines = []
, reset = Time.hour
, generation = 0
}
-- returns a random generator that can generate a fully initialized simulation
genSim : Float -> Float -> Generator Simulation
genSim w h = let
genMines = Random.list numMines
<| Random.map (\pos -> { o = pos, r = mineSize })
<| Vec2.random (-w*0.5, -h*0.5) (w*0.5, h*0.5)
genTanks = Random.list (numTanks - 1)
<| Random.map2 (\b s -> { tank0 | brain = b, strategy = s })
(NeuralNet.random brainStructure) (NeuralNet.random brainStructure)
in
Random.map2 (\mines tanks ->
{ size = (w, h)
, tanks = tank0 :: tanks
, mines = mines
, reset = genTime
, generation = 1
}) genMines genTanks
-- advances the simulation by one frame, or restarts if time is up
simulate : Time -> Simulation -> Simulation
simulate tick sim = let sim = { sim | reset = sim.reset - tick } in
if sim.reset > 0 then stepSim tick sim else sim
resetTank : Tank -> Tank
resetTank tank = { tank0 | brain = tank.brain, strategy = tank.strategy }
-- returns a generator for the next genetic generation in the simulation
genGen : Simulation -> Generator Simulation
genGen sim = let
genDefault = Random.map (always sim) Random.bool
genCrossoverParams = Random.map3 (,,)
(Random.float 0 1) (Random.float 0 1) (Random.float 0 1)
genMutateParams = Random.map2 (,)
standardNormal (NeuralNet.random brainStructure)
in
case sim.tanks of
[] -> genDefault
player :: bots ->
case List.sortBy (.fitness >> negate) bots |> List.map resetTank of
[] -> genDefault
elite :: rest ->
Random.map (\rand -> { sim
| tanks = resetTank player :: elite :: List.map
(\(pqr, uus) -> crossoverTanks rest pqr |> mutateTank uus)
rand
, reset = genTime
, generation = sim.generation + 1
}
) (Random.list (List.length rest) (Random.map2 (,)
genCrossoverParams genMutateParams))
crossoverTanks : List Tank -> (Float, Float, Float) -> Tank
crossoverTanks tanks (p, q, r) = let
parent1 = selectRanked tanks p |> Maybe.withDefault tank0
parent2 = selectRanked tanks q |> Maybe.withDefault tank0
in
if r < crossoverChance
then let r = r / crossoverChance in
{ parent1
| brain = NeuralNet.crossover r parent1.brain parent2.brain
, strategy = NeuralNet.crossover r parent1.strategy parent2.strategy
}
else parent1
mutateTank : (Float, NeuralNet) -> Tank -> Tank
mutateTank (u, u's) tank = let
(brain, strategy) = NeuralNet.mutate u u's tank.strategy tank.brain
in
{ tank | brain = brain, strategy = strategy }
-- advances the simulation by one frame
stepSim : Time -> Simulation -> Simulation
stepSim tick sim = { sim | tanks = List.map (
steerTank sim.mines >> stepTank tick
>> (\tank -> { tank | o =
wrap2 (sim.size .* -0.5) (sim.size .* 0.5) tank.o })
>> (\tank -> { tank | fitness =
tank.fitness + (fitnessRadius - List.foldl
(\mine -> min (dist tank.o mine.o)) fitnessRadius sim.mines)
/ fitnessRadius * Time.inSeconds tick })
>> (\tank -> List.foldl (\mine tank -> case collideOBRxCircle tank mine of
Just _ -> { tank
| inv = Set.insert mine.o tank.inv
, fitness = tank.fitness +
if Set.member mine.o tank.inv then 0 else fitnessBonus
}
Nothing -> tank
) tank sim.mines)
) sim.tanks
}
--- BEHAVIOURS ---
touchDist : Float
touchDist = tankSize / 2 + mineSize
steeringOffset : Float
steeringOffset = touchDist / (fitnessBonus - touchDist)
steeringFactor : Float
steeringFactor = steeringOffset * fitnessBonus
steerTank : List Mine -> Tank -> Tank
steerTank mines tank = if List.length tank.brain == 0 then tank else let
polars = mines
|> List.filter (\mine -> not (Set.member mine.o tank.inv))
|> List.map (\mine -> let diff = mine.o .-. tank.o in
(norm diff, angle diff - angle tank.dir))
inputs = case List.minimum polars of
Just (dist, angle) ->
Array.fromList [steeringFactor / dist - steeringOffset, angle / pi]
Nothing -> Array.repeat 2 0
outputs = NeuralNet.propagate tank.brain inputs
in
{ tank | treads =
( Maybe.withDefault 0 (Array.get 0 outputs)
, Maybe.withDefault 0 (Array.get 1 outputs)
)
}
-- moves tank treads (thus moving the tank)
stepTank : Time -> Tank -> Tank
stepTank tick tank = let
dt = Time.inSeconds tick
(treadL, treadR) = clamp2 -1 1 tank.treads .* treadMax
width = fst tank.size
in
if treadL == treadR then
if treadL == 0.0 then
tank
else
{ tank | o = perp tank.dir .* (treadR * dt) .+. tank.o }
else if treadL == -treadR then
{ tank | dir = Vec2.rotate ((treadR - treadL) / width * dt) tank.dir }
else let
r = (treadR / (treadR - treadL) - 0.5) * width
pivot = tank.o .-. (r *. tank.dir)
v = (treadL + treadR) * 0.5
new_dir = Vec2.rotate (v / r * dt) tank.dir
new_pos = pivot .+. (new_dir .* r)
in
{ tank | o = new_pos, dir = new_dir }
--- DRAWING ---
-- draw a green square with a "barrel" rectangle pointing forward
drawTank : Bool -> Tank -> List Form
drawTank thick tank = let
angle = (atan2 (snd tank.dir) (fst tank.dir))
barrel_offset = tank.size .*. (0.0, 0.5)
barrel_pos = (tank.o .+. Vec2.rotate angle barrel_offset)
lineStyle = solid green
fullStyle = if thick then { lineStyle | width = 3 } else lineStyle
in
(filled green (uncurry rect (tank.size .*. (0.2, 0.5)))
|> Collage.rotate angle
|> Collage.move barrel_pos
) :: drawOBR fullStyle tank
-- draw a red circle
drawMine : Mine -> List Form
drawMine = drawObstacle red
-- draw all objects in the simulation
drawSim : Simulation -> List Form
drawSim sim = let
hiscore = List.foldl (.fitness >> max) 0 sim.tanks
in
outlined (solid grey) (uncurry rect sim.size)
:: List.foldl (\t -> drawTank (t.fitness == hiscore) t |> (++)) [] sim.tanks
++ List.foldl (drawMine >> (++)) [] sim.mines