VoxelEngine/labirinth_ai/LabyrinthWorld.py

import time

from Objects.Cube.Cube import Cube
from Objects.World import World
import numpy as np
import random


class LabyrinthWorld(World):
    """World whose 2D board holds a randomly generated labyrinth and its subjects.

    ``generate`` carves rooms and corridors into the board and places crates,
    hunters and herbivores; ``update`` advances every subject by one tick and,
    when a shared model is set, periodically fits it on the subjects' samples.
    """
    # Class-level training settings shared by all instances.
    # ``randomBuffer`` is copied into ``nextTrain`` by ``__init__`` and is the
    # number of update rounds counted before the first ``model.fit`` call; it is
    # raised to at least four batches below.
    randomBuffer = 0
    # Base unit for the training interval and the per-subject sample cap
    # used in ``update``.
    batchsize = 1000
    randomBuffer = max(4 * batchsize, randomBuffer)

    def __init__(self, chunk_size_x: int, chunk_size_y: int, chunk_size_z: int,
                 chunk_n_x: int, chunk_n_y: int, chunk_n_z: int, programs: dict):
        """Create an empty labyrinth world.

        The board spans ``chunk_size * chunk_n`` cells along x and y. All
        chunk arguments and ``programs`` are forwarded unchanged to the
        ``World`` initialiser.
        """
        # The board attributes are assigned before the base initialiser is
        # invoked. NOTE(review): presumably World.__init__ may rely on them -
        # confirm before reordering.
        width = chunk_size_x * chunk_n_x
        depth = chunk_size_y * chunk_n_y
        self.board_shape = (width, depth)
        self.board = np.zeros(self.board_shape)
        super().__init__(chunk_size_x, chunk_size_y, chunk_size_z,
                         chunk_n_x, chunk_n_y, chunk_n_z, programs)

        # Limits used by generate() when laying out the labyrinth.
        self.min_room_dim, self.max_room_dim = 6, 20
        self.max_room_num = 32
        self.max_corridors = 4 * self.max_room_num
        self.max_crates = self.max_room_num

        # Subjects and the values collected from them while spawning.
        self.subjects, self.ins, self.actions, self.targets = [], [], [], []

        # Shared-model training state; update() trains once `round`
        # reaches `nextTrain`.
        self.model = None
        self.lastUpdate = time.time()
        self.nextTrain = self.randomBuffer
        self.round = 0

        # Per-cell float layers with the same shape as the board.
        self.trailMix, self.grass, self.hunter_grass = (
            np.zeros(self.board_shape) for _ in range(3)
        )
        # Filled by generate(): maps (x, y) to the subjects placed on that cell.
        self.subjectDict = {}

    def generate(self, seed: int = None, sea_plate_height: int = 50, continental_plate_height: int = 200):
        """Build a random labyrinth on the board and populate it with subjects.

        A walker starts on a random cell and repeatedly either stamps a
        rectangular room centred on itself or, when no room can be placed,
        walks on and carves a corridor. Afterwards crates are scattered over
        floor cells, one white cube is put at height 0 for every board cell,
        and subjects are spawned on floor cells: hunters until there are two
        subjects, then herbivores until there are ten.

        Cell codes on the board: 0 = empty, 1 = floor, 3 = crate. The value 2
        marks corridor cells during generation and is turned into 1 at the end.

        :param seed: seed handed to both ``random`` and ``np.random``.
        :param sea_plate_height: not used by this method.
        :param continental_plate_height: not used by this method.
        """
        size_x, size_y = self.board_shape
        layout = np.zeros(self.board_shape)
        random.seed(seed)
        np.random.seed(seed)

        # random starting point, kept away from the border by the largest room size
        margin = self.max_room_dim
        cx = random.randint(margin, (size_x - 1) - margin)
        cy = random.randint(margin, (size_y - 1) - margin)

        # unit steps; (0, 0) is the top left corner
        go_right, go_left, go_up, go_down = (1, 0), (-1, 0), (0, -1), (0, 1)

        rooms_done = 0
        corridors_done = 0
        while rooms_done < self.max_room_num and corridors_done < self.max_corridors:
            # room extents are drawn first, width before height
            half_w = int(random.randint(self.min_room_dim, self.max_room_dim) / 2)
            half_h = int(random.randint(self.min_room_dim, self.max_room_dim) / 2)
            x_lo, x_hi = cx - half_w, cx + half_w
            y_lo, y_hi = cy - half_h, cy + half_h

            inside = x_lo >= 0 and x_hi < size_x and y_lo >= 0 and y_hi < size_y
            if inside and not np.any(layout[x_lo:x_hi, y_lo:y_hi] == 1):
                # free spot: stamp the room
                layout[x_lo:x_hi, y_lo:y_hi] = 1
                rooms_done += 1
                continue

            # no room here: keep walking until a corridor attempt was made
            while True:
                length = random.randint(self.min_room_dim, self.max_room_dim)
                probes = (
                    (go_left, cx - length >= 0),
                    (go_right, cx + length < size_x),
                    (go_up, cy - length >= 0),
                    (go_down, cy + length < size_y),
                )
                # steps that stay on the board for the whole walk
                reachable = [step for step, in_range in probes if in_range]
                # ... of which those whose first cell is not already corridor
                carvable = [step for step in reachable
                            if layout[cx + step[0], cy + step[1]] != 2]

                if carvable:
                    if len(carvable) > 1:
                        dx, dy = carvable[random.randint(0, len(carvable) - 1)]
                    else:
                        dx, dy = carvable[0]
                    may_look_back = (-dx, -dy) in reachable
                    new_ground = False
                    for _ in range(length):
                        if layout[cx, cy] != 1 and layout[cx, cy] != 2:
                            layout[cx, cy] = 2
                            # the walk counts as a corridor when a carved cell
                            # does not merely extend corridor lying behind it
                            if not may_look_back or layout[cx - dx, cy - dy] != 2:
                                new_ground = True
                        cx += dx
                        cy += dy
                    if new_ground:
                        corridors_done += 1
                    break

                if reachable:
                    # surrounded by corridor: relocate without carving
                    if len(reachable) > 1:
                        dx, dy = reachable[random.randint(0, len(reachable) - 1)]
                    else:
                        dx, dy = reachable[0]
                    cx += dx * length
                    cy += dy * length

        # scatter crates over room floor (corridors still carry the value 2 here)
        placed_crates = 0
        while placed_crates < self.max_crates:
            crate_x = random.randint(0, size_x - 1)
            crate_y = random.randint(0, size_y - 1)
            if layout[crate_x, crate_y] == 1:
                layout[crate_x, crate_y] = 3
                placed_crates += 1

        # corridors become ordinary floor
        layout[layout == 2] = 1

        print((rooms_done, self.max_room_num))
        print((corridors_done, self.max_corridors))
        self.board = layout

        # setting up the board: one cube per cell on the lowest layer
        for x_pos in range(size_x):
            for y_pos in range(size_y):
                self.put_object(x_pos, y_pos, 0, Cube().setColor(1, 1, 1))

        # adding subjects
        from labirinth_ai.Subject import Hunter, Herbivore

        def settle(species, total):
            """Spawn ``species`` on random floor cells until ``total`` subjects exist."""
            while len(self.subjects) < total:
                spawn_x = random.randint(self.max_room_dim, size_x - self.max_room_dim)
                spawn_y = random.randint(self.max_room_dim, size_y - self.max_room_dim)
                if self.board[spawn_x, spawn_y] != 1:
                    continue
                newcomer = species(spawn_x, spawn_y)
                self.subjects.append(newcomer)
                self.ins += newcomer.x_in
                self.actions += newcomer.actions
                self.targets += newcomer.target

        settle(Hunter, 2)
        settle(Herbivore, 10)

        # every cell gets its own (initially empty) list of occupants
        self.subjectDict.update(
            {(x, y): [] for x in range(size_x) for y in range(size_y)}
        )
        for sub in self.subjects:
            self.subjectDict[(sub.x, sub.y)].append(sub)

    def update(self):
        """Advance the simulation by one tick.

        Steps, in order:

        1. Every subject chooses an action. Without a shared model each
           subject decides on its own; with a model, the model is queried with
           four copies of every subject's state and each subject receives its
           eight predicted values together with its own state.
        2. Living subjects are updated and every subject's ``tick`` is
           incremented.
        3. With a shared model, the model is fitted on the subjects' samples
           once ``round`` reaches ``nextTrain``; each subject's sample list is
           then capped to its most recent ``20 * batchsize`` entries.
        4. Dead subjects are respawned on a random non-empty board cell.
        5. The trail layer decays and both grass layers regrow on non-empty
           cells, capped at 3.
        """
        subject_count = len(self.subjects)

        if self.model is None:
            for sub in self.subjects:
                sub.calculateAction(self)
        else:
            subject_states = [sub.createState(self) for sub in self.subjects]
            # Each state is repeated four times in a row for the prediction,
            # giving 4 x 2 values per subject.
            model_inputs = [state for state in subject_states for _ in range(4)]
            vals = self.model.predict(model_inputs)
            vals = np.reshape(np.transpose(np.reshape(vals, (subject_count, 4, 2)), (0, 2, 1)),
                              (subject_count, 1, 8))
            for index, sub in enumerate(self.subjects):
                # Index the per-subject list, not the expanded model input, so
                # that every subject is handed its own state.
                sub.calculateAction(self, vals[index], subject_states[index])

        for sub in self.subjects:
            if sub.alive:
                # subjects only train themselves when no shared model exists
                sub.update(self, doTrain=self.model is None)
            sub.tick += 1

        if self.model is not None:
            if self.round >= self.nextTrain:
                samples = [sub.generateSamples() for sub in self.subjects]
                states = sum((sample[0] for sample in samples), [])
                targets = sum((sample[1] for sample in samples), [])
                self.model.fit(states, targets)
                self.nextTrain = self.batchsize / 5
                self.round = 0
                max_samples = 20 * self.batchsize
                for sub in self.subjects:
                    if len(sub.samples) > max_samples:
                        # keep the newest entries and drop the oldest overflow
                        sub.samples = sub.samples[-max_samples:]
            else:
                self.round += 1

        # Respawn dead subjects; the subject list is rebuilt in the same order.
        margin = self.max_room_dim
        max_x = (self.board_shape[0] - 1) - margin
        max_y = (self.board_shape[1] - 1) - margin
        refreshed = []
        for sub in self.subjects:
            if not sub.alive:
                # NOTE(review): any non-zero cell is accepted, which includes
                # crate cells (value 3), while generate() only spawns on cells
                # equal to 1 - confirm this is intended.
                while True:
                    px = random.randint(margin, max_x)
                    py = random.randint(margin, max_y)
                    if self.board[px, py] != 0:
                        break
                sub.respawnUpdate(px, py, self)
            refreshed.append(sub)
        self.subjects = refreshed

        self.trailMix *= 0.99

        # grass regrows only on non-empty cells and saturates at 3
        regrowth = 0.01 * (self.board != 0)
        self.grass = np.minimum(self.grass + regrowth, 3)
        self.hunter_grass = np.minimum(self.hunter_grass + regrowth, 3)

        # trails at or below 0.01 are cut to zero
        self.trailMix *= (self.trailMix > 0.01)
adds labyrinth and subjects as well as performance increases 2022-02-07 21:08:45 +01:00			`import time`

			`from Objects.Cube.Cube import Cube`
			`from Objects.World import World`
			`import numpy as np`
			`import random`


			`class LabyrinthWorld(World):`
			`randomBuffer = 0`
			`batchsize = 1000`
			`randomBuffer = max(4 * batchsize, randomBuffer)`

			`def __init__(self, chunk_size_x: int, chunk_size_y: int, chunk_size_z: int,`
			`chunk_n_x: int, chunk_n_y: int, chunk_n_z: int, programs: dict):`
			`self.board_shape = (chunk_size_x * chunk_n_x, chunk_size_y * chunk_n_y)`
			`self.board = np.zeros(self.board_shape)`
			`super(LabyrinthWorld, self).__init__(chunk_size_x, chunk_size_y, chunk_size_z,`
			`chunk_n_x, chunk_n_y, chunk_n_z, programs)`
			`self.max_room_dim = 20`

			`self.min_room_dim = 6`

			`self.max_room_num = 32`
			`self.max_corridors = 4 * self.max_room_num`

			`self.max_crates = self.max_room_num`

			`self.subjects = []`
			`self.ins = []`
			`self.actions = []`
			`self.targets = []`

			`self.model = None`
			`self.lastUpdate = time.time()`
			`self.nextTrain = self.randomBuffer`
			`self.round = 0`

			`self.trailMix = np.zeros(self.board_shape)`
			`self.grass = np.zeros(self.board_shape)`
			`self.hunter_grass = np.zeros(self.board_shape)`
			`self.subjectDict = {}`

			`def generate(self, seed: int = None, sea_plate_height: int = 50, continental_plate_height: int = 200):`
			`board = np.zeros(self.board_shape)`
			`random.seed(seed)`
			`np.random.seed(seed)`

			`# find random starting point`
			`px = random.randint(self.max_room_dim, (self.board_shape[0] - 1) - self.max_room_dim)`
			`py = random.randint(self.max_room_dim, (self.board_shape[1] - 1) - self.max_room_dim)`

			`# 0, 0 is top left`
			`right = (1, 0)`
			`left = (-1, 0)`
			`up = (0, -1)`
			`down = (0, 1)`

			`# place rooms`
			`room_num = 0`
			`corridor_num = 0`
			`while room_num < self.max_room_num and corridor_num < self.max_corridors:`
			`# try to place Room`
			`w = random.randint(self.min_room_dim, self.max_room_dim)`
			`h = random.randint(self.min_room_dim, self.max_room_dim)`
			`can_place_room = np.sum(`
			`board[px - int(w / 2.0):px + int(w / 2.0), py - int(h / 2.0):py + int(h / 2.0)] == 1) == 0 and px - int(`
			`w / 2.0) >= 0 and px + int(w / 2.0) < self.board_shape[0] and \`
			`py - int(h / 2.0) >= 0 and py + int(h / 2.0) < self.board_shape[1]`

			`if can_place_room:`
			`# place Room`
			`board[px - int(w / 2.0):px + int(w / 2.0), py - int(h / 2.0):py + int(h / 2.0)] = 1`
			`room_num += 1`
			`else:`
			`# move && place Corridor`
			`directions = []`
			`while len(directions) == 0:`
			`movable = []`
			`corridor_length = random.randint(self.min_room_dim, self.max_room_dim)`
			`if px - corridor_length >= 0:`
			`movable.append(left)`
			`if board[px - 1, py] != 2:`
			`directions.append(left)`

			`if px + corridor_length < self.board_shape[0]:`
			`movable.append(right)`
			`if board[px + 1, py] != 2:`
			`directions.append(right)`

			`if py - corridor_length >= 0:`
			`movable.append(up)`
			`if board[px, py - 1] != 2:`
			`directions.append(up)`

			`if py + corridor_length < self.board_shape[1]:`
			`movable.append(down)`
			`if board[px, py + 1] != 2:`
			`directions.append(down)`

			`if len(directions) != 0:`
			`if len(directions) > 1:`
			`d = directions[random.randint(0, len(directions) - 1)]`
			`else:`
			`d = directions[0]`
			`changed = False`
			`for _ in range(corridor_length):`
			`if board[px, py] != 1 and board[px, py] != 2:`
			`board[px, py] = 2`
			`if (-d[0], -d[1]) not in movable or board[px - d[0], py - d[1]] != 2:`
			`changed = True`
			`px += d[0]`
			`py += d[1]`
			`if changed:`
			`corridor_num += 1`
			`else:`
			`if len(movable) != 0:`
			`if len(movable) > 1:`
			`d = movable[random.randint(0, len(movable) - 1)]`
			`else:`
			`d = movable[0]`
			`for _ in range(corridor_length):`
			`px += d[0]`
			`py += d[1]`

			`crates = 0`
			`while crates < self.max_crates:`
			`px = random.randint(0, (self.board_shape[0] - 1))`
			`py = random.randint(0, (self.board_shape[1] - 1))`

			`if board[px, py] == 1:`
			`board[px, py] = 3`
			`crates += 1`

			`board[board == 2] = 1`

			`print((room_num, self.max_room_num))`
			`print((corridor_num, self.max_corridors))`
			`self.board = board`

			`# setting up the board`
			`for x_pos in range(0, self.board_shape[0]):`
			`for y_pos in range(0, self.board_shape[1]):`
			`for z_pos in range(0, 1):`
			`self.put_object(x_pos, y_pos, z_pos, Cube().setColor(1, 1, 1))`

			`# adding subjects`
			`from labirinth_ai.Subject import Hunter, Herbivore`
			`while len(self.subjects) < 2:`
			`px = random.randint(self.max_room_dim, self.board_shape[0] - self.max_room_dim)`
			`py = random.randint(self.max_room_dim, self.board_shape[1] - self.max_room_dim)`
			`if self.board[px, py] == 1:`
			`self.subjects.append(Hunter(px, py))`
			`self.ins += self.subjects[-1].x_in`
			`self.actions += self.subjects[-1].actions`
			`self.targets += self.subjects[-1].target`

			`while len(self.subjects) < 10:`
			`px = random.randint(self.max_room_dim, self.board_shape[0] - self.max_room_dim)`
			`py = random.randint(self.max_room_dim, self.board_shape[1] - self.max_room_dim)`
			`if self.board[px, py] == 1:`
			`self.subjects.append(Herbivore(px, py))`
			`self.ins += self.subjects[-1].x_in`
			`self.actions += self.subjects[-1].actions`
			`self.targets += self.subjects[-1].target`

			`for x in range(self.board_shape[0]):`
			`for y in range(self.board_shape[1]):`
			`self.subjectDict[(x, y)] = []`

			`for sub in self.subjects:`
			`self.subjectDict[(sub.x, sub.y)].append(sub)`

			`def update(self):`
			`# start = time.time()`
			`if self.model is None:`
			`for sub in self.subjects:`
			`sub.calculateAction(self)`
			`else:`
			`states = list(map(lambda e: e.createState(self), self.subjects))`
			`states = sum(list(map(lambda e: [e, e, e, e], states)), [])`
			`vals = self.model.predict(states)`
			`vals = np.reshape(np.transpose(np.reshape(vals, (len(self.subjects), 4, 2)), (0, 2, 1)),`
			`(len(self.subjects), 1, 8))`
			`list(map(lambda e: e[1].calculateAction(self, vals[e[0]], states[e[0]]), enumerate(self.subjects)))`

			`for sub in self.subjects:`
			`if sub.alive:`
			`sub.update(self, doTrain=self.model is None)`
			`sub.tick += 1`

			`if self.model is not None:`
			`if self.round >= self.nextTrain:`
			`samples = list(map(lambda e: e.generateSamples(), self.subjects))`
			`states = sum(list(map(lambda e: e[0], samples)), [])`
			`targets = sum(list(map(lambda e: e[1], samples)), [])`
			`self.model.fit(states, targets)`
			`self.nextTrain = self.batchsize / 5`
			`self.round = 0`
			`for sub in self.subjects:`
			`if len(sub.samples) > 20*self.batchsize:`
			`sub.samples = sub.samples[:-20*self.batchsize]`
			`else:`
			`self.round += 1`

			`new_subjects = []`
			`kill_table = {}`
			`live_table = {}`
			`for sub in self.subjects:`
			`if sub.name not in kill_table.keys():`
			`kill_table[sub.name] = 0`
			`live_table[sub.name] = 0`
			`kill_table[sub.name] += sub.kills`
			`live_table[sub.name] += sub.lives`
			`if sub.alive:`
			`new_subjects.append(sub)`
			`else:`
			`px = random.randint(self.max_room_dim, (self.board_shape[0] - 1) - self.max_room_dim)`
			`py = random.randint(self.max_room_dim, (self.board_shape[1] - 1) - self.max_room_dim)`
			`while self.board[px, py] == 0:`
			`px = random.randint(self.max_room_dim, (self.board_shape[0] - 1) - self.max_room_dim)`
			`py = random.randint(self.max_room_dim, (self.board_shape[1] - 1) - self.max_room_dim)`
			`sub.respawnUpdate(px, py, self)`
			`new_subjects.append(sub)`

			`self.subjects = new_subjects`
			`self.trailMix *= 0.99`

			`self.grass = np.minimum(self.grass + 0.01 * (self.board != 0), 3)`
			`self.hunter_grass = np.minimum(self.hunter_grass + 0.01 * (self.board != 0), 3)`

			`self.trailMix *= (self.trailMix > 0.01)`