minigo/features.py at colab · hyu2000/minigo

268 lines (213 loc) · 8.79 KB
# Copyright 2018 Google LLC
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#      http://www.apache.org/licenses/LICENSE-2.0
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
Features used by AlphaGo Zero, in approximate order of importance.
Feature                 # Notes
Stone History           16 The stones of each color during the last 8 moves.
Ones                    1  Constant plane of 1s
All features with 8 planes are 1-hot encoded, with plane i marked with 1
only if the feature was equal to i. Any features >= 8 would be marked as 8.
This file includes the features from the first paper as DEFAULT_FEATURES
and the features from AGZ as AGZ_FEATURES.
import numpy as np
import utils
# Resolution/truncation limit for one-hot features
def make_onehot(feature, planes: int):
    """ onehot_features[:,:,i] = 1 iff a point has i+1 liberty; the last plane = 1 if a point has liberty >=i+1
    onehot_features = np.zeros(feature.shape + (planes,), dtype=np.uint8)
    capped = np.minimum(feature, planes)
    onehot_index_offsets = np.arange(0, utils.product(
        onehot_features.shape), planes) + capped.ravel()
    # A 0 is encoded as [0,0,0,0], not [1,0,0,0], so we'll
    # filter out any offsets that are a multiple of $planes
    # A 1 is encoded as [1,0,0,0], not [0,1,0,0], so subtract 1 from offsets
    nonzero_elements = (capped != 0).ravel()
    nonzero_index_offsets = onehot_index_offsets[nonzero_elements] - 1
    onehot_features.ravel()[nonzero_index_offsets] = 1
    return onehot_features
def planes(num_planes):
    def deco(f):
        f.planes = num_planes
        return f
    return deco
# TODO(tommadams): add a generic stone_features for all N <= 8
@planes(16)
def stone_features(position: go.Position):
    """ AGZ: 8 binary feature planes each for black / white: latest 8 board positions """
    # a bit easier to calculate it with axis 0 being the 16 board states,
    # and then roll axis 0 to the end.
    features = np.zeros([16, go.N, go.N], dtype=np.uint8)
    num_deltas_avail = position.board_deltas.shape[0]
    cumulative_deltas = np.cumsum(position.board_deltas, axis=0)
    last_eight = np.tile(position.board, [8, 1, 1])
    # apply deltas to compute previous board states
    last_eight[1:num_deltas_avail + 1] -= cumulative_deltas
    # if no more deltas are available, just repeat oldest board.
    last_eight[num_deltas_avail + 1:] = last_eight[num_deltas_avail].reshape(1, go.N, go.N)
    features[::2] = last_eight == position.to_play
    features[1::2] = last_eight == -position.to_play
    return np.rollaxis(features, 0, 3)
def recent_board_features(position: go.Position):
    """ recent 8 boards (each with 1/0/-1), latest board last """
    num_deltas_avail = position.board_deltas.shape[0]
    cumulative_deltas = np.cumsum(position.board_deltas, axis=0)
    last_eight = np.tile(position.board, [8, 1, 1])
    # apply deltas to compute previous board states
    last_eight[1:num_deltas_avail + 1] -= cumulative_deltas
    # if no more deltas are available, just repeat oldest board.
    last_eight[num_deltas_avail + 1:] = last_eight[num_deltas_avail].reshape(1, go.N, go.N)
    return np.moveaxis(last_eight[::-1], 0, -1)
# TODO(tommadams): add a generic stone_features for all N <= 8
def stone_features_4(position):
    # a bit easier to calculate it with axis 0 being the 16 board states,
    # and then roll axis 0 to the end.
    features = np.zeros([8, go.N, go.N], dtype=np.uint8)
    num_deltas_avail = position.board_deltas.shape[0]
    cumulative_deltas = np.cumsum(position.board_deltas, axis=0)
    last = np.tile(position.board, [4, 1, 1])
    # apply deltas to compute previous board states
    last[1:num_deltas_avail + 1] -= cumulative_deltas
    # if no more deltas are available, just repeat oldest board.
    last[num_deltas_avail + 1:] = last[num_deltas_avail].reshape(1, go.N, go.N)
    features[::2] = last == position.to_play
    features[1::2] = last == -position.to_play
    return np.rollaxis(features, 0, 3)
def color_to_play_feature(position):
    if position.to_play == go.BLACK:
        return np.ones([go.N, go.N, 1], dtype=np.uint8)
        return np.zeros([go.N, go.N, 1], dtype=np.uint8)
def stone_color_feature(position):
    """ this feature is from the pov of current player """
    board = position.board
    features = np.zeros([go.N, go.N, 3], dtype=np.uint8)
    if position.to_play == go.BLACK:
        features[board == go.BLACK, 0] = 1
        features[board == go.WHITE, 1] = 1
        features[board == go.WHITE, 0] = 1
        features[board == go.BLACK, 1] = 1
    features[board == go.EMPTY, 2] = 1
    return features
def ones_feature(position):
    return np.ones([go.N, go.N, 1], dtype=np.uint8)
def recent_move_feature(position):
    onehot_features = np.zeros([go.N, go.N, P], dtype=np.uint8)
    for i, player_move in enumerate(reversed(position.recent[-P:])):
        _, move = player_move  # unpack the info from position.recent
        if move is not None:
            onehot_features[move[0], move[1], i] = 1
    return onehot_features
def recent_move_feature3(position):
    onehot_features = np.zeros([go.N, go.N, 3], dtype=np.uint8)
    for i, player_move in enumerate(reversed(position.recent[-3:])):
        _, move = player_move  # unpack the info from position.recent
        if move is not None:
            onehot_features[move[0], move[1], i] = 1
    return onehot_features
def liberty_feature(position):
    return make_onehot(position.get_liberties(), P)
def liberty_feature3(position: go.Position):
    """ liberties for both black/white """
    return make_onehot(position.get_liberties(), 3)
def few_liberties_feature(position: go.Position):
    """ indicates where our stones in danger, see tests """
    feature = position.get_liberties()
    onehot_features = np.zeros(feature.shape + (3,), dtype=np.uint8)
    onehot_index_offsets = np.arange(0, utils.product(
        onehot_features.shape), 3) + feature.ravel()
    nonzero_elements = ((feature != 0) & (feature <= 3)).ravel()
    nonzero_index_offsets = onehot_index_offsets[nonzero_elements] - 1
    onehot_features.ravel()[nonzero_index_offsets] = 1
    return onehot_features
def would_capture_feature(position):
    """ binary feature: 1 if playing there results in capturing of enemy stones
    Equivalently, the empty spot near enemy group of liberty 1
    features = np.zeros([go.N, go.N, 1], dtype=np.uint8)
    for g in position.lib_tracker.groups.values():
        if g.color == position.to_play:
            continue
        if len(g.liberties) == 1:
            lib = next(iter(g.liberties))
            features[lib + (0,)] = 1
    return features
DEFAULT_FEATURES = [
    stone_color_feature,
    ones_feature,
    liberty_feature,
    recent_move_feature,
    would_capture_feature,
DEFAULT_FEATURES_PLANES = sum(f.planes for f in DEFAULT_FEATURES)
AGZ_FEATURES = [
    stone_features,
    color_to_play_feature
AGZ_FEATURES_PLANES = sum(f.planes for f in AGZ_FEATURES)
MLPERF07_FEATURES = [
    stone_features_4,
    color_to_play_feature,
    few_liberties_feature,
    would_capture_feature,
MLPERF07_FEATURES_PLANES = sum(f.planes for f in MLPERF07_FEATURES)
""" DLGO sevenplane: black liberties, white liberties, ko violation """
DLGO_FEATURES = [
    stone_color_feature,
    # ones_feature,
    liberty_feature3,
    color_to_play_feature
DLGO_FEATURES_PLANES = sum(f.planes for f in DLGO_FEATURES)
""" redux: based on DEFAULT_FEATURES. Used in 9x9 exp2 """
REDUX_FEATURES = [
    stone_color_feature,
    color_to_play_feature,
    liberty_feature3,
    recent_move_feature3,
    would_capture_feature,
REDUX_FEATURES_PLANES = sum(f.planes for f in REDUX_FEATURES)  # 11
""" a0jax: """
A0JAX_FEATURES = [
    recent_board_features,
    ones_feature
A0JAX_FEATURES_PLANES = sum(f.planes for f in REDUX_FEATURES)
""" REDUX_FEATURES + focus area. Used in 9x9 exp3 """
EXP3_FEATURES = REDUX_FEATURES
EXP3_FEATURES_PLANES = 1 + sum(f.planes for f in EXP3_FEATURES)  # 12
def extract_features(position, features, goal: np.array=None):
    """ goal right now is the mask: go.N * go.N """
    pos_features = np.concatenate([feature(position) for feature in features], axis=2)
    if goal is None:
        return pos_features
    goal_features = np.expand_dims(goal, axis=2)
    return np.concatenate([pos_features, goal_features], axis=2)
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

features.py

Latest commit

History

features.py

File metadata and controls