AMKLS/train2.py at main · Horus0305/AMKLS · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
import pandas as pd
import numpy as np
import chess
import tensorflow as tf
from tensorflow import keras
import matplotlib.pyplot as plt
from keras.models import Sequential
from keras.layers import Dense, Flatten, Dropout
from keras.regularizers import l2
from keras.optimizers import Adam
from keras.callbacks import EarlyStopping, ReduceLROnPlateau

# Read the training table from 'train.csv', using its 'id' column as the row index
train_df = pd.read_csv(
    'train.csv',
    index_col='id',
)

# Map every square of a board to a signed material value
def encode_board(board):
    """Convert a board into a 2-D array of signed material values.

    The board is rendered with ``str(board)``, spaces are stripped, and each
    remaining line becomes one row of the result.  Upper-case piece letters
    map to positive values and lower-case letters to the same values negated;
    ``'.'`` and any unrecognised character map to 0.

    Args:
        board: Any object whose ``str()`` form is a newline-separated grid of
            one-character square symbols (spaces between symbols are ignored).

    Returns:
        A NumPy array with one row per text line and one entry per symbol.
    """
    piece_values = {
        'P': 1, 'N': 3, 'B': 3.5, 'R': 5, 'Q': 9, 'K': 4,
        'p': -1, 'n': -3, 'b': -3.5, 'r': -5, 'q': -9, 'k': -4,
        '.': 0,
    }
    text_rows = str(board).replace(' ', '').split('\n')
    grid = [
        [piece_values.get(symbol, 0) for symbol in text_row]
        for text_row in text_rows
    ]
    return np.array(grid)

# Turn a FEN position string into its material-value grid
def encode_fen_string(fen_str):
    """Parse ``fen_str`` with ``chess.Board`` and encode it via ``encode_board``.

    Args:
        fen_str: Position description passed as the ``fen`` argument of
            ``chess.Board``.

    Returns:
        Whatever ``encode_board`` returns for the parsed board.
    """
    return encode_board(chess.Board(fen=fen_str))

# Build the feature tensor and the regression target from the training table
encoded_boards = train_df['board'].apply(encode_fen_string)
X = np.stack(encoded_boards).reshape(-1, 8, 8)  # Shape (num_samples, 8, 8)
y = train_df['black_score'].values

# Standardise the board features with a single mean/std taken over all of X
X_mean = X.mean()
X_std = X.std()
X_normalized = (X - X_mean) / X_std

# Standardise the target (black_score); y_mean and y_std are reused further
# down to map predictions back to the original scale
y_mean = y.mean()
y_std = y.std()
y_normalized = (y - y_mean) / y_std

# Feed-forward regressor: flattened 8x8 board -> 128 -> 64 -> 1, with
# L2-penalised hidden layers and dropout after each of them
model = Sequential()
model.add(Flatten(input_shape=(8, 8)))  # 8x8 grid becomes a 1D vector
model.add(Dense(128, activation='relu', kernel_regularizer=l2(0.01)))
model.add(Dropout(0.3))
model.add(Dense(64, activation='relu', kernel_regularizer=l2(0.01)))
model.add(Dropout(0.3))
model.add(Dense(1))  # single output: the normalized black score

# Optimise mean squared error with Adam; also report MSE and MAE as metrics
model.compile(
    optimizer=Adam(learning_rate=0.001),
    loss='mean_squared_error',
    metrics=['mean_squared_error', 'mean_absolute_error'],
)

# Callbacks, both watching val_loss: early stopping with a patience of 10
# epochs that restores the best weights, and a learning-rate reducer that
# halves the rate after 5 epochs without improvement, never below 1e-5
early_stopping = EarlyStopping(
    monitor='val_loss',
    patience=10,
    restore_best_weights=True,
)
lr_reducer = ReduceLROnPlateau(
    monitor='val_loss',
    factor=0.5,
    patience=5,
    min_lr=0.00001,
)

# Fit on the normalized data, holding out 20% of it for validation
training_callbacks = [early_stopping, lr_reducer]
history = model.fit(
    X_normalized,
    y_normalized,
    validation_split=0.2,
    batch_size=10,
    epochs=100,
    callbacks=training_callbacks,
)

# Persist the trained model
model.save('chess_model.keras')

# Predict on the same inputs that were used for fitting, then undo the target
# normalization so the scores are on the original black_score scale
preds_normalized = model.predict(X_normalized)
preds = preds_normalized * y_std + y_mean

# Draw three side-by-side panels (loss, MSE, MAE), each comparing the training
# curve with the validation curve recorded in `history`
plt.style.use('ggplot')
plt.figure(figsize=(12, 6))

# (train key, validation key, train label, validation label, panel title)
panels = [
    ('loss', 'val_loss',
     'train loss', 'val loss', 'Loss During Training'),
    ('mean_squared_error', 'val_mean_squared_error',
     'train MSE', 'val MSE', 'MSE During Training'),
    ('mean_absolute_error', 'val_mean_absolute_error',
     'train MAE', 'val MAE', 'MAE During Training'),
]
for position, panel in enumerate(panels, start=1):
    train_key, val_key, train_label, val_label, title = panel
    plt.subplot(1, 3, position)
    plt.plot(history.history[train_key], label=train_label)
    plt.plot(history.history[val_key], label=val_label)
    plt.legend()
    plt.title(title)

# Fit the panels into the figure and display it
plt.tight_layout()
plt.show()