dbravender/dartmcts - Change UPK6W3YC62YCWHXNGGK4PDJBPK5JEZW5R3HYGWDJSVF5ULKFQERAC

Add Tic Tac Toe neural network game encoding

Created by Dan Bravender on June 10, 2023

UPK6W3YC62YCWHXNGGK4PDJBPK5JEZW5R3HYGWDJSVF5ULKFQERAC

Dependencies

In channels

main

Change contents

Deletion in test/dartmcts_test.dart at line 43 [7.22]
B:BD[6.54] → [6.54:84]
```
    // TODO: implement toJson
```
Deletion in test/dartmcts_test.dart at line 121 [7.22]
B:BD[6.168] → [6.168:198]
```
    // TODO: implement toJson
```
Insertion in pubspec.yaml at line 11 [7.440]
[4.143]
```
dependencies:
  uuid: ^3.0.7
```

Insertion in pubspec.lock at line 324 [7.2040]

[4.6293]

  uuid:
    dependency: "direct main"
    description:
      name: uuid
      sha256: "648e103079f7c64a36dc7d39369cabb358d377078a051d6ae2ad3aa539519313"
      url: "https://pub.dev"
    source: hosted
    version: "3.0.7"

File addition: trainingserver.dart (----------)

[7.12800]

import 'package:dartmcts/net.dart';
import 'package:shelf/shelf.dart';
import 'package:shelf/shelf_io.dart' as shelf_io;
import 'dart:convert';
import 'package:uuid/uuid.dart';
/// Factory used to create a fresh game for every `newgame` request.
///
/// Installed by [serve]; `null` until [serve] has been called.
Function? gameHandler;

/// Starts the training HTTP server and registers [trainer] as the game factory.
///
/// [trainer] is invoked once per `newgame` request to build a new game.
/// [host] and [port] select the listening address and default to the
/// original `localhost:5000`.
///
/// The returned future completes once the server is listening, so callers can
/// await startup and observe bind errors instead of losing them.
Future<void> serve(TrainableInterface Function() trainer,
    {Object host = 'localhost', int port = 5000}) async {
  // Register the factory before the server can accept its first request.
  gameHandler = trainer;
  final pipeline =
      const Pipeline().addMiddleware(logRequests()).addHandler(_handleRequest);
  final server = await shelf_io.serve(pipeline, host, port);
  print('Serving at http://${server.address.host}:${server.port}');
}
/// Games created through `newgame` that have not finished yet, keyed by the
/// id that was returned to the client.
Map<String, TrainableInterface> gamesInProgress = {};

/// Builds a JSON response with the given [statusCode] and [payload].
Response _jsonResponse(int statusCode, Object? payload) => Response(statusCode,
    body: json.encode(payload), headers: {'Content-Type': 'application/json'});

/// Handles the two training endpoints.
///
/// * `newgame` creates a game through [gameHandler], stores it in
///   [gamesInProgress] and returns its id, sizes and initial state.
/// * `step/<id>` reads a JSON body of the form `{"action": <int>}`, applies
///   the action to the stored game and returns the resulting state. A game is
///   removed from [gamesInProgress] as soon as a step reports `done`.
///
/// Malformed requests are answered with a 400 and unknown paths or game ids
/// with a 404, instead of surfacing as unhandled exceptions.
Future<Response> _handleRequest(Request request) async {
  if (request.url.path == "newgame") {
    final createGame = gameHandler;
    if (createGame == null) {
      return _jsonResponse(500, {"error": "no game factory registered"});
    }
    final TrainableInterface game = createGame();
    final id = const Uuid().v4();
    gamesInProgress[id] = game;
    return _jsonResponse(200, {
      "id": id,
      "player_count": game.playerCount,
      "action_space_size": game.actionSpaceSize,
      "observation_space_size": game.observationSpaceSize,
      "current_player": game.currentPlayer,
      "observation": game.observation(),
      "legal_actions": game.legalActions()
    });
  }

  // Validate the route explicitly: asserts are stripped in production, so
  // they cannot be used to reject unexpected paths.
  final pieces = request.url.path.split('/');
  if (pieces.length < 2 || pieces[0] != "step") {
    return _jsonResponse(404, {"error": "unknown path"});
  }
  final id = pieces[1];
  final game = gamesInProgress[id];
  if (game == null) {
    return _jsonResponse(404, {"error": "unknown game id"});
  }

  Object? payload;
  try {
    payload = json.decode(await request.readAsString());
  } on FormatException {
    return _jsonResponse(400, {"error": "request body must be valid JSON"});
  }
  final Object? action = payload is Map ? payload['action'] : null;
  if (action is! int) {
    return _jsonResponse(400, {"error": "'action' must be an integer"});
  }
  if (action < 0 || action >= game.actionSpaceSize) {
    return _jsonResponse(400, {"error": "'action' is out of range"});
  }

  final gameResponse = game.step(action);
  if (gameResponse.done) {
    // free memory for finished games
    gamesInProgress.remove(id);
  }
  return _jsonResponse(200, {
    "observation": game.observation(),
    "legal_actions": game.legalActions(),
    "next_player": game.currentPlayer,
    "reward": gameResponse.reward,
    "done": gameResponse.done
  });
}

Insertion in lib/tictactoe.dart at line 2 [8.118]
[8.160]
[8.160]
```
import 'package:dartmcts/net.dart';
```

Insertion in lib/tictactoe.dart at line 123 [8.118]

[6.2706]

[8.2879]

  }
}
List<double> legalMoves(TicTacToeGame game) {
  List<double> l = initOneHot(9);
  var moves = game.getMoves();
  for (var move in moves) {
    l[move!] = 1;

Insertion in lib/tictactoe.dart at line 132 [8.118]

[8.2883]

  return l;
}
/// Encodes [game] as a flat observation vector from the point of view of the
/// player whose turn it is.
///
/// The result is the concatenation, in order, of:
///  * 9 values marking the cells held by `game.currentPlayer`,
///  * 9 values marking the cells held by any other player,
///  * the list returned by [legalMoves] for [game].
///
/// Empty cells (`null` on the board) are 0 in both location segments.
List<double> encodeGame(TicTacToeGame game) {
  List<double> l = [];
  List<double> myLocations = List.filled(9, 0);
  List<double> opponentLocations = List.filled(9, 0);
  game.board.asMap().forEach((i, player) {
    // Unoccupied cell: leave both planes at 0.
    if (player == null) return;
    if (player == game.currentPlayer) {
      myLocations[i] = 1;
    } else {
      opponentLocations[i] = 1;
    }
  });
  l.addAll(myLocations);
  l.addAll(opponentLocations);
  // legalMoves must always be appended to the observation
  l.addAll(legalMoves(game));
  return l;

Insertion in lib/tictactoe.dart at line 153 [8.118]

[8.2885]


/// Exposes a [TicTacToeGame] through [TrainableInterface] so it can be driven
/// step by step, for example by the training server.
class TicTacToeNNInterface extends TrainableInterface {
  /// The current game state; replaced by the successor state on every [step].
  TicTacToeGame game = TicTacToeGame.newGame() as TicTacToeGame;

  /// Maps a player to its index in turn order and in the reward list:
  /// `TicTacToePlayer.O` is 0, anything else is 1.
  static int _indexOf(TicTacToePlayer? player) =>
      player == TicTacToePlayer.O ? 0 : 1;

  @override
  int get playerCount => 2;

  @override
  int get currentPlayer => _indexOf(game.currentPlayer);

  @override
  List<double> legalActions() => legalMoves(game);

  @override
  List<double> observation() => encodeGame(game);

  /// Applies [move] and reports whether the game ended.
  ///
  /// The reward list has one entry per player. It is all zeros while the game
  /// is running and on a tie; when there is a winner, the winner gets 1.0 and
  /// everyone else gets -1.0.
  @override
  StepResponse step(int move) {
    game = game.cloneAndApplyMove(move, null);
    // Copy to a local so the null check promotes without needing `!`.
    final winner = game.winner;
    final done = game.getMoves().isEmpty || winner != null;
    final reward = List<double>.filled(playerCount, 0.0);
    if (winner != null) {
      reward.fillRange(0, reward.length, -1.0);
      reward[_indexOf(winner)] = 1.0;
    }
    return StepResponse(
      done: done,
      reward: reward,
    );
  }
}

File addition: net.dart (----------)

[7.12800]

/// Creates a fixed-length list of [length] doubles, each set to [filler].
///
/// When [value] is given, the entry at that index is set to 1, which yields a
/// one-hot encoding with the default [filler] of 0.
List<double> initOneHot(int length, {double filler = 0, int? value}) {
  final encoded = List<double>.filled(length, filler);
  final hotIndex = value;
  if (hotIndex == null) {
    return encoded;
  }
  encoded[hotIndex] = 1;
  return encoded;
}
/// Pairs a [move] with the [score] assigned to it.
class MoveScore<Move> {
  /// The move being scored.
  Move move;

  /// The score associated with [move].
  double score;

  MoveScore(this.move, this.score);

  @override
  String toString() => 'MoveScore(score: $score, move: $move)';
}
/// The outcome of applying a single move to a game.
class StepResponse {
  /// Whether the game is over after the move.
  bool done;

  /// The reward values reported for the move.
  List<double> reward;

  StepResponse({required this.done, required this.reward});
}
/// Contract a game implements so that it can be stepped through for training.
abstract class TrainableInterface {
  /// Number of entries in the list returned by [legalActions].
  int get actionSpaceSize => legalActions().length;

  /// Length of [observation] minus the length of [legalActions].
  ///
  /// NOTE(review): this presumes every observation also contains the
  /// legal-action list; confirm for new implementations.
  int get observationSpaceSize =>
      observation().length - legalActions().length;

  /// Number of players in the game.
  late int playerCount;

  /// Index of the player whose turn it is.
  late int currentPlayer;

  /// Returns the encoded observation of the current state.
  List<double> observation();

  /// Returns the legal-action list for the current state.
  List<double> legalActions();

  /// Applies [move] and returns the resulting [StepResponse].
  StepResponse step(int move);
}

Deletion in lib/fourinarow.dart at line 95 [9.3648]
B:BD[3.286] → [3.286:316]
```
    // TODO: implement toJson
```
Replacement in lib/dartmcts.dart at line 186 [7.12817]
B:BD[2.232] → [2.232:260]
```
    tiedChildren.shuffle();
```
[2.232]
[2.260]
```
    tiedChildren.shuffle(config.random);
```
File addition: bin (d--x------)
[7.2]

File addition: tictactoeserver.dart (---x------)

[0.5118]

import 'package:dartmcts/trainingserver.dart';
import 'package:dartmcts/tictactoe.dart';
/// Entry point: runs the training server with Tic Tac Toe as the game.
void main() => serve(() => TicTacToeNNInterface());

Replacement in Makefile at line 5 [5.12]
B:BD[5.51] → [5.51:61]
```
	dart test
```
[5.51]
```
	dart test
traintictactoe:
	dart bin/tictactoeserver.dart
```

Add Tic Tac Toe neural network game encoding

Dependencies

In channels

Change contents

Deletion in test/dartmcts_test.dart at line 43 [7.22]

Deletion in test/dartmcts_test.dart at line 121 [7.22]

Insertion in pubspec.yaml at line 11 [7.440]

Insertion in pubspec.lock at line 324 [7.2040]

File addition: trainingserver.dart (----------)

Insertion in lib/tictactoe.dart at line 2 [8.118]

Insertion in lib/tictactoe.dart at line 123 [8.118]

Insertion in lib/tictactoe.dart at line 132 [8.118]

Insertion in lib/tictactoe.dart at line 153 [8.118]

File addition: net.dart (----------)

Deletion in lib/fourinarow.dart at line 95 [9.3648]

Replacement in lib/dartmcts.dart at line 186 [7.12817]

File addition: bin (d--x------)

File addition: tictactoeserver.dart (---x------)

Replacement in Makefile at line 5 [5.12]