Spaces:

AIPsy
/

chessXAI

Runtime error

App Files Files Community

chessXAI / global_data.py

seredapj

Upload 19 files

0c536cc verified 12 months ago

raw

history blame contribute delete

21.1 kB

	import chess.engine
	from constants import ROOT_DIR, CONTENT_HEIGHT, LEFT_PANE_WIDTH, EXPORT_FORMAT, EXPORT_SCALE
	from time import sleep
	# from test_array import activations_array

	from copy import deepcopy

	from board2planes import board2planes

	import yaml

	import os
	from os.path import isdir, join
	import sys

	import numpy as np


	# --- Development switches -------------------------------------------------
	SIMULATE_TF = False  # TODO: Remove this option, deprecated
	# Turn off tensorflow importing and generate random data to speed up development.
	DEV_MODE = False
	# Number of layers / heads produced by DummyModel when DEV_MODE is on.
	SIMULATED_LAYERS = 6
	SIMULATED_HEADS = 64
	# Force a fixed subplot grid; both must be set for the override to apply.
	FIXED_ROW = None  # e.g. 1; None to disable
	FIXED_COL = None  # e.g. 5; None to disable

	if DEV_MODE:
	    class DummyModel:
	        """Stand-in for the real network that returns random attention maps.

	        Calling an instance yields a 4-element list whose last element is a
	        list of ``layers`` arrays of shape ``(1, heads, 64, 64)``; the first
	        three elements are ``None`` placeholders.
	        """

	        def __init__(self, layers, heads):
	            self.layers = layers
	            self.heads = heads

	        def __call__(self, *args, **kwargs):
	            # Inputs are ignored on purpose: only the output structure matters.
	            data = [np.random.rand(1, self.heads, 64, 64) for _ in range(self.layers)]
	            return [None, None, None, data]

	else:
	    import tensorflow as tf
	    from tensorflow.compat.v1 import ConfigProto
	    from tensorflow.compat.v1 import InteractiveSession


	# Class to hold data, state and configuration.
	# Dash is stateless, and in general it is a very bad idea to store data in global variables on the server side.
	# However, this application is meant to be run by a single user on a local machine, so it is safe to store data
	# and state information on a global object.
	class GlobalData:
	    """Holds the visualizer's data, UI state and configuration in one object.

	    The instance keeps the current chess position, the loaded model and its
	    cached outputs, the currently selected layer/head, and the geometry used
	    to lay out the heatmap grid. Methods mutate this state in place.
	    """

	    # Layer selectors that are names rather than integer indices.
	    _SPECIAL_LAYERS = ('Policy', 'Smolgen')

	    def __init__(self):
	        if not DEV_MODE:
	            os.environ["CUDA_VISIBLE_DEVICES"] = "0"

	        self.tmp = 0
	        self.export_format = EXPORT_FORMAT
	        self.export_scale = EXPORT_SCALE
	        self.fen = 'rnbqkbnr/pppppppp/8/8/8/8/PPPPPPPP/RNBQKBNR w KQkq - 0 1'
	        self.board = chess.Board(fen=self.fen)
	        self.focused_square_ind = 0
	        self.active_move_table_cell = None  # tuple (row_ind, col_id), e.g. (12, 'White')

	        # Array for the selected layer, indexed [head, row, col]; set by
	        # update_selected_activation_data().
	        self.activations = None
	        self.visualization_mode = 'ROW'
	        self.visualization_mode_is_64x64 = False
	        self.subplot_mode = 'big'  # 'fit' or 'big'
	        self.subplot_cols = 0
	        self.subplot_rows = 0
	        self.number_of_heads = 0
	        self.selected_head = None
	        self.show_all_heads = True

	        self.show_colorscale = False
	        self.colorscale_mode = 'mode1'

	        self.figure_container_height = '100%'

	        # Used to pass new values to hidden indicator elements which will
	        # trigger a follow-up callback.
	        self.running_counter = 0
	        self.grid_has_changed = False

	        self.screen_w = 0
	        self.screen_h = 0
	        self.figure_w = 0
	        self.figure_h = 0
	        self.heatmap_w = 0
	        self.heatmap_h = 0
	        self.heatmap_fig_w = 0
	        self.heatmap_fig_h = 0
	        self.heatmap_gap = 0
	        self.colorscale_x_offset = 0

	        self.heatmap_horizontal_gap = 0.275

	        self.figure_cache = {}

	        self.update_grid_shape()

	        self.pgn_data = []  # list of boards in pgn
	        # dict of boards in pgn, key is (move_table.row_ind, move_table.column_id)
	        self.move_table_boards = {}

	        self.selected_layer = 0 if SIMULATE_TF else None

	        self.nr_of_layers_in_body = -1
	        self.has_attention_policy = False

	        self.model_paths = []
	        self.model_names = []
	        self.model_yamls = {}  # key = model path, value = yaml of that model
	        self.model_cache = {}  # key = model path, value = [model, tfp]
	        self.find_models2()
	        self.model_path = None
	        self.model = None
	        self.tfp = None  # TensorflowProcess
	        if not SIMULATE_TF:
	            self.load_model()
	        self.activations_data = None

	        if self.model is not None or SIMULATE_TF:
	            self.update_activations_data()

	        if self.selected_layer is not None:
	            self.set_layer(self.selected_layer)

	        self.move_table_active_cell = None

	        self.force_update_graph = False

	    def set_subplot_mode(self, fit_to_page):
	        """Select the 'fit' layout when ``fit_to_page == [True]``, else 'big'."""
	        self.subplot_mode = 'fit' if fit_to_page == [True] else 'big'
	        self.update_grid_shape()

	    def set_screen_size(self, w, h):
	        """Store the screen size and derive the graph area from the layout percentages."""
	        self.screen_w = w
	        self.screen_h = h

	        self.figure_w = w * LEFT_PANE_WIDTH / 100
	        self.figure_h = h * CONTENT_HEIGHT / 100
	        print('GRAPH AREA', self.figure_w, self.figure_h)

	    def set_heatmap_size(self, size):
	        """Record heatmap geometry reported by the client.

	        ``size`` is either the placeholder ``'1'`` (ignored) or an indexable
	        with at least seven items: heatmap width, heatmap height, figure
	        width, figure height, gap, colorscale offset and a flag that equals
	        ``1`` when a graph refresh should be forced.
	        """
	        if size == '1':
	            return

	        self.heatmap_w = float(size[0])
	        self.heatmap_h = float(size[1])
	        self.heatmap_fig_w = float(size[2])
	        self.heatmap_fig_h = float(size[3])
	        self.heatmap_gap = round(float(size[4]), 2)

	        # A zero-width figure would otherwise raise ZeroDivisionError.
	        if self.heatmap_fig_w:
	            self.colorscale_x_offset = float(size[5]) / self.heatmap_fig_w
	        else:
	            self.colorscale_x_offset = 0.0

	        self.force_update_graph = size[6] == 1

	    def set_colorscale_mode(self, mode, colorscale_mode, colorscale_mode_64x64, show):
	        """Pick the colorscale matching ``mode`` and store the visibility flag."""
	        if mode == '64x64':
	            self.colorscale_mode = colorscale_mode_64x64
	        else:
	            self.colorscale_mode = colorscale_mode
	        self.show_colorscale = show == [True]

	    def cache_figure(self, fig):
	        """Store a deep copy of ``fig`` under the current cache key.

	        Nothing is stored when a figure is already cached for the key or
	        when ``fig`` equals an empty dict. The copy has its ``coloraxis1``
	        layout entry reset before being stored.
	        """
	        if not self.check_if_figure_is_cached() and fig != {}:
	            key = self.get_figure_cache_key()
	            cached_fig = deepcopy(fig)
	            cached_fig.update_layout({'coloraxis1': None}, overwrite=True)
	            self.figure_cache[key] = cached_fig

	    def get_cached_figure(self):
	        """Return a deep copy of the cached figure for the current key, or None."""
	        cached = self.figure_cache.get(self.get_figure_cache_key())
	        return None if cached is None else deepcopy(cached)

	    def check_if_figure_is_cached(self):
	        """Return True when a figure is cached for the current key."""
	        return self.get_figure_cache_key() in self.figure_cache

	    def get_figure_cache_key(self):
	        """Build the tuple that identifies the current figure layout.

	        The head component is ``-1`` while all heads are shown.
	        """
	        head = -1 if self.show_all_heads else self.selected_head
	        return (self.subplot_rows, self.subplot_cols, self.visualization_mode_is_64x64,
	                head, self.show_colorscale, self.colorscale_mode,
	                self.board.turn)

	    def get_side_to_move(self):
	        """Return 'White' when ``board.turn`` is truthy, else 'Black'."""
	        return 'White' if self.board.turn else 'Black'

	    def load_model(self):
	        """Load (or fetch from cache) the model selected by ``self.model_path``.

	        Sets ``self.model`` and ``self.tfp``; both become None when no model
	        path is selected. In DEV_MODE a DummyModel is used instead of a
	        real network.
	        """
	        if self.model_path in self.model_cache:
	            self.model, self.tfp = self.model_cache[self.model_path]
	            return

	        if self.model_path is None:
	            self.model = None
	            self.tfp = None
	            return

	        if DEV_MODE:
	            self.model = DummyModel(SIMULATED_LAYERS, SIMULATED_HEADS)
	            self.tfp = None
	            return

	        yaml_path = self.model_yamls[self.model_path]
	        with open(yaml_path) as f:
	            cfg = yaml.safe_load(f)

	        if 'dropout_rate' in cfg['model']:
	            print('Setting dropout_rate to 0.0')
	            cfg['model']['dropout_rate'] = 0.0

	        # NOTE(review): `tfprocess` is not imported anywhere in the visible
	        # part of this file; unless it is injected elsewhere this line raises
	        # NameError. Confirm where the module is supposed to come from.
	        tfp = tfprocess.TFProcess(cfg)
	        tfp.init_net()
	        tfp.replace_weights(self.model_path, ignore_errors=True)
	        self.model = tfp.model
	        self.tfp = tfp

	    def _list_model_folders(self):
	        """Return ``(folder_name, relative_folder_path)`` pairs under ROOT_DIR/models.

	        Returns an empty list when the models folder does not exist. Names
	        are sorted so the result does not depend on OS listing order.
	        """
	        models_root_folder = os.path.join(ROOT_DIR, 'models')
	        if not isdir(models_root_folder):
	            return []
	        return [(name, os.path.relpath(join(models_root_folder, name)))
	                for name in sorted(os.listdir(models_root_folder))
	                if isdir(join(models_root_folder, name))]

	    def find_models(self):
	        """Register every sub-folder of ROOT_DIR/models as a model."""
	        folders = self._list_model_folders()
	        self.model_names = [name for name, _ in folders]
	        self.model_paths = [path for _, path in folders]

	    def find_models2(self):
	        """Register every ``*.pb.gz`` file found in the model folders.

	        A folder is used only when it contains exactly one ``*.yaml`` file
	        and at least one ``*.pb.gz`` file; that yaml is associated with
	        each model file of the folder in ``self.model_yamls``.
	        """
	        names = []
	        paths = []
	        yaml_by_path = {}
	        for _, folder in self._list_model_folders():
	            entries = sorted(os.listdir(folder))
	            yaml_files = [entry for entry in entries if entry.endswith(".yaml")]
	            if len(yaml_files) != 1:
	                continue
	            model_files = [entry for entry in entries if entry.endswith(".pb.gz")]
	            if not model_files:
	                continue

	            yaml_file = os.path.relpath(join(folder, yaml_files[0]))
	            for model_file in model_files:
	                model_path = os.path.relpath(join(folder, model_file))
	                names.append(model_file)
	                paths.append(model_path)
	                yaml_by_path[model_path] = yaml_file

	        self.model_yamls = yaml_by_path
	        self.model_names = names
	        self.model_paths = paths

	    def update_activations_data(self):
	        """Recompute ``self.activations_data`` for the current board and model.

	        For a regular layer the model is run on the encoded board and the
	        last element of its output is stored. For 'Smolgen' the dense
	        weights are reshaped to ``(N, 64, 64)``. With SIMULATE_TF random
	        data is generated. Also refreshes the model cache, the body layer
	        count and the ``has_attention_policy`` flag.
	        """
	        if self.model is not None and self.selected_layer is None:
	            self.selected_layer = 0

	        if SIMULATE_TF:
	            self.activations_data = [np.random.rand(1, SIMULATED_HEADS, 64, 64)
	                                     for _ in range(SIMULATED_LAYERS)]
	        elif self.selected_layer == 'Smolgen':
	            if self.tfp is not None and self.tfp.use_smolgen:
	                weights = self.tfp.smol_weight_gen_dense.get_weights()[0]
	                self.activations_data = weights.reshape((weights.shape[0], 64, 64))
	                print('TYPEEEEE', type(self.activations_data))
	        elif self.selected_layer is not None and self.model is not None:
	            if DEV_MODE:
	                inputs = None
	            else:
	                inputs = board2planes(self.board)
	                inputs = tf.reshape(tf.convert_to_tensor(inputs, dtype=tf.float32), [-1, 112, 8, 8])

	            outputs = self.model(inputs)
	            self.activations_data = outputs[-1]
	            for i, x in enumerate(self.activations_data):
	                print('LAYERS', i, x.shape)

	        if self.model is not None:
	            if self.model_path not in self.model_cache:
	                self.model_cache[self.model_path] = [self.model, self.tfp]

	            self.update_layers_in_body_count()

	        # TODO: figure out better way to determine if we have policy attention weights
	        # TODO: What happens if policy vis is selected and user switches to model without policy layer? Take care of this case.
	        data = self.activations_data
	        self.has_attention_policy = bool(
	            data is not None and len(data) >= 2 and data[-2].shape == (1, 8, 24)
	        )

	    def update_grid_shape(self):
	        """Recompute subplot rows/cols and the figure container height.

	        When both FIXED_ROW and FIXED_COL are set they are used as is.
	        Otherwise 'fit' mode uses up to 8 heads per row and any other mode
	        uses 4. ``grid_has_changed`` is raised when the grid differs from
	        the previous one.
	        """
	        # TODO: add client side callback triggered by Interval component to save window or precise container dimensions to Div
	        # TODO: Trigger server side figure update callback when dimensions are recorded and store in global_data
	        # TODO: If needed, recalculate subplot rows and cols and container scaler based on the changed dimension
	        if FIXED_ROW and FIXED_COL:
	            self.subplot_cols = FIXED_COL
	            self.subplot_rows = FIXED_ROW
	            return None

	        heads = self.number_of_heads
	        if self.subplot_mode == 'fit':
	            max_rows_in_screen = 4
	            if heads <= 4:
	                rows = 1
	            elif heads <= 8:
	                rows = 2
	            else:
	                rows = -(-heads // 8)  # ceil(heads / 8)
	        else:
	            # 'big' layout; also the fallback for any unexpected mode value.
	            max_rows_in_screen = 2
	            rows = -(-heads // 4)  # ceil(heads / 4)

	        if rows > max_rows_in_screen:
	            container_height = f'{int((rows / max_rows_in_screen) * 100)}%'
	        else:
	            container_height = '100%'

	        cols = -(-heads // rows) if rows != 0 else 0  # ceil(heads / rows)

	        if self.subplot_rows != rows or self.subplot_cols != cols:
	            self.grid_has_changed = True

	        self.subplot_cols = cols
	        self.subplot_rows = rows

	        self.figure_container_height = container_height if self.show_all_heads else '100%'

	    def update_selected_activation_data(self):
	        """Extract the selected layer into ``self.activations``, flipped along axis 1.

	        Does nothing when no activation data is available, or when
	        'Smolgen' is selected without a TensorFlow process.
	        """
	        if self.activations_data is None:
	            return

	        layer = self.selected_layer
	        if layer == 'Policy':
	            raw = self.activations_data[-1]
	            print('RAW POLICY SHAPE', raw.shape)
	            # Plain arrays (DEV_MODE) have no .numpy(); convert them directly.
	            activations = raw.numpy() if hasattr(raw, 'numpy') else np.asarray(raw)
	        elif layer == 'Smolgen':
	            if self.tfp is None:
	                return
	            weights = self.tfp.smol_weight_gen_dense.get_weights()[0]
	            # Same reshape as update_activations_data() instead of a fixed 256.
	            activations = weights.reshape((weights.shape[0], 64, 64))
	        elif DEV_MODE:
	            activations = np.squeeze(self.activations_data[layer], axis=0)
	        else:
	            activations = tf.squeeze(self.activations_data[layer], axis=0).numpy()

	        self.activations = activations[:, ::-1, :]  # Flip along y-axis

	    def set_visualization_mode(self, mode):
	        """Store the visualization mode and whether it is the '64x64' mode."""
	        self.visualization_mode = mode
	        self.visualization_mode_is_64x64 = mode == '64x64'

	    def _count_heads(self):
	        """Return the number of heads for the selected layer, or 0 if unknown."""
	        layer = self.selected_layer
	        if layer == 'Policy':
	            return 1
	        if layer == 'Smolgen':
	            return 0 if self.activations is None else self.activations.shape[0]
	        if layer is None or self.activations_data is None:
	            return 0
	        return self.activations_data[layer].shape[1]

	    def set_layer(self, layer):
	        """Select ``layer``, refresh its data, reset the head to 0 and update the grid."""
	        self.selected_layer = layer
	        self.update_selected_activation_data()
	        self.number_of_heads = self._count_heads()
	        self.set_head(0)
	        self.update_grid_shape()

	    def set_head(self, head):
	        """Store the selected head index."""
	        self.selected_head = head

	    def set_model(self, model):
	        """Switch to the model at path ``model`` and refresh all derived state.

	        Nothing happens when ``model`` is already the active path. The
	        selected head is kept when it still exists and clamped otherwise.
	        """
	        if model == self.model_path:
	            return

	        self.model_path = model
	        self.load_model()
	        self.update_activations_data()
	        self.update_selected_activation_data()
	        # Shared with set_layer() so 'Policy'/'Smolgen' selections and a
	        # missing model no longer fail on list indexing.
	        self.number_of_heads = self._count_heads()
	        if self.selected_head is None:
	            self.selected_head = 0
	        else:
	            self.selected_head = max(0, min(self.selected_head, self.number_of_heads - 1))
	        self.update_grid_shape()
	        if SIMULATE_TF:
	            sleep(2)  # simulated model loading latency

	    def update_layers_in_body_count(self):
	        """Count the leading rank-4 outputs that share one head count.

	        The result goes to ``nr_of_layers_in_body`` and an integer
	        ``selected_layer`` is clamped to it. Does nothing when no
	        activation data is available.
	        """
	        # TODO: figure out robust way to separate attention layers in body from the rest. UPDATE: Use yaml
	        data = self.activations_data
	        if data is None:
	            return

	        count = 0
	        heads = None
	        for layer in data:
	            shape = layer.shape
	            # Check the rank first so short shapes never get indexed at [1].
	            if len(shape) != 4:
	                break
	            if heads is None:
	                heads = shape[1]
	            elif shape[1] != heads:
	                break
	            count += 1

	        self.nr_of_layers_in_body = count
	        if self.selected_layer is not None and self.selected_layer not in self._SPECIAL_LAYERS:
	            self.selected_layer = min(self.selected_layer, count - 1)

	    def get_head_data(self, head):
	        """Return the heatmap array for ``head`` in the current visualization mode.

	        '64x64' returns the full matrix of the head; 'ROW' and any other
	        mode (column) return one row/column reshaped to 8x8 and oriented by
	        the side to move. Returns None when ``head`` is out of range or no
	        activations are loaded.
	        """
	        if self.activations is None or self.activations.shape[0] <= head:
	            return None

	        if self.visualization_mode == '64x64':
	            return self.activations[head, :, :]

	        # Smolgen data is always read with the white-to-move orientation.
	        white_view = self.board.turn or self.selected_layer == 'Smolgen'
	        square = self.focused_square_ind

	        if self.visualization_mode == 'ROW':
	            if white_view:
	                row = 63 - square
	                return self.activations[head, row, :].reshape((8, 8))
	            # Mirror the file (column) of the square within its rank.
	            row = (square // 8) * 8 + (7 - square % 8)
	            return self.activations[head, row, :].reshape((8, 8))[::-1, :]

	        # Column selection.
	        if white_view:
	            return self.activations[head, :, square].reshape((8, 8))[::-1, ::-1]
	        focused = 63 - square
	        col = (focused // 8) * 8 + (7 - focused % 8)
	        return self.activations[head, :, col].reshape((8, 8))[:, ::-1]

	    def set_fen(self, fen):
	        """Load ``fen`` into the board and recompute the activations."""
	        self.board.set_fen(fen)
	        self.fen = fen
	        self.update_activations_data()
	        self.update_selected_activation_data()

	    def set_board(self, board):
	        """Replace the board with a deep copy of ``board`` and recompute the activations."""
	        self.board = deepcopy(board)
	        self.update_activations_data()
	        self.update_selected_activation_data()


	# Module-level shared instance, created as a side effect of importing this
	# module. Construction runs GlobalData.__init__, which scans for models
	# (find_models2) and, unless SIMULATE_TF is set, calls load_model().
	global_data = GlobalData()
	print('global data created')