commit old stuff

posmap: use std::mem::swap
elo: improve code quality and add confidence intervals
2025-07-24 23:19:09 -07:00 · 2025-04-30 18:08:40 -04:00 · 2025-04-30 13:52:19 -04:00 · 2025-04-29 18:43:38 -04:00 · 2025-04-29 18:32:44 -04:00 · 2025-04-29 18:20:53 -04:00
6 changed files with 125 additions and 123 deletions
--- a/src/elo.rs
+++ b/src/elo.rs
@@ -2,14 +2,14 @@ use crate::{
    agent::{Agent, RandomAgent},
    complexagent::ComplexAgent,
    game_inner::GameInner,
-    logic::{ChildrenEvalMethod, FutureMoveConfig},
+    logic::{ChildrenEvalMethod, FutureMoveConfig, FutureMoves},
    repr::{Board, Piece, Winner},
 };
 use indicatif::{ProgressBar, ProgressStyle};
 use rand::seq::SliceRandom;
 use rayon::iter::{IntoParallelIterator, ParallelIterator};
 use skillratings::{
-    elo::{elo, EloConfig, EloRating},
+    glicko2::{confidence_interval, glicko2, Glicko2Rating},
    Outcomes, Rating,
 };
 use std::num::NonZero;
@@ -18,18 +18,19 @@ type AgentMaker = Box<dyn Fn(Piece) -> Box<dyn Agent>>;

 #[allow(dead_code)]
 pub fn run() {
+    let total_memory = 30_000_000_000; // 30 GB
+    let num_threads = std::thread::available_parallelism()
+        .map(NonZero::get)
+        .expect("unable to get number of threads");
+    let mem_per_thread = total_memory / num_threads;
+
    let fmv_base = FutureMoveConfig {
-        max_depth: 20,
-        min_arena_depth: 14,
-        top_k_children: 2,
-        up_to_minus: 10,
-        max_arena_size: usize::MAX,
-        do_prune: false,
+        max_arena_size: mem_per_thread / FutureMoves::ARENA_ENTRY_SIZE,
        print: false,
-        children_eval_method: Default::default(),
+        ..Default::default()
    };

-    let configs = [4, 5, 6]
+    let configs = [2, 3, 4, 5, 6, 7, 8]
        .into_iter()
        .map(move |d| FutureMoveConfig {
            max_depth: d,
@@ -120,7 +121,7 @@ pub fn run() {
        })
        .collect();

-    if true {
+    if false {
        vec.push((
            "RandomAgent".to_string(),
            Box::new(move |piece| Box::new(RandomAgent::new(piece))),
@@ -129,26 +130,35 @@ pub fn run() {

    let mut arena = PlayerArena::new(vec);

-    arena.prop_arena(100);
+    arena.prop_arena(500);

    println!("{}", arena);
 }

 pub struct PlayerArena {
    /// Name, Creator Function, Elo
-    players: Vec<(String, AgentMaker, EloRating)>,
+    players: Vec<(String, AgentMaker, Glicko2Rating)>,
 }

 impl std::fmt::Display for PlayerArena {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        let mut players_i: Vec<usize> = (0..self.players.len()).collect();
-        players_i.sort_by_key(|&i| -(self.players[i].2.rating() * 100.0) as i64);
+
+        players_i.sort_by(|&a, &b| {
+            self.players[b]
+                .2
+                .rating()
+                .total_cmp(&self.players[a].2.rating())
+        });

        for i in players_i {
+            let conf_interval = confidence_interval(&self.players[i].2);
+
            writeln!(
                f,
-                "({:.2}): {}",
+                "({:.2}[+/-{:.2}]): {}",
                self.players[i].2.rating(),
+                conf_interval.1 - self.players[i].2.rating(),
                self.players[i].0
            )?;
        }
@@ -162,9 +172,8 @@ impl PlayerArena {
        Self {
            players: players
                .into_iter()
-                .zip([EloRating::new()].into_iter().cycle())
-                // flatten tuple
-                .map(|((a, b), c)| (a, b, c))
+                // All starting ratings should be the default
+                .map(|(a, b)| (a, b, Default::default()))
                .collect(),
        }
    }
@@ -229,7 +238,7 @@ impl PlayerArena {
            self.process_outcome(i, j, &o);

            if received_num > 0 {
-                term.clear_last_lines(self.players.len())
+                term.clear_last_lines(self.players.len() + 1)
                    .expect("unable to clear prev lines");
            }
            term.write_str(format!("{}", self).as_str())
@@ -237,8 +246,12 @@ impl PlayerArena {

            received_num += 1;
            p.inc(1);
+            // add extra newline after progressbar
+            println!();
+
            // break if all pairs were recieved
            if received_num == num {
+                drop(receiver);
                break;
            }
        }
@@ -263,14 +276,12 @@ impl PlayerArena {
    }

    fn process_outcome(&mut self, player1: usize, player2: usize, outcome: &Outcomes) {
-        let (np1, np2) = elo(
+        (self.players[player1].2, self.players[player2].2) = glicko2(
            &self.players[player1].2,
            &self.players[player2].2,
            outcome,
-            &EloConfig { k: 10.0 },
+            &Default::default(),
        );
-        self.players[player1].2 = np1;
-        self.players[player2].2 = np2;
    }

    fn play_two_inner(player_1: Box<dyn Agent>, player_2: Box<dyn Agent>) -> Outcomes {
@@ -278,7 +289,7 @@ impl PlayerArena {
            player_1,
            player_2,
            false,
-            // Board::random(rand::random_range(20..=30)),
+            // Board::random(rand::random_range(4..=15)),
            Board::STARTING_POSITION,
        )
        .expect("unable to create game")
--- a/src/logic/future_moves.rs
+++ b/src/logic/future_moves.rs
@@ -34,7 +34,7 @@ pub struct FutureMoves {
    board: Board,
 }

-#[derive(Copy, Clone, Allocative)]
+#[derive(Copy, Clone, Allocative, Default)]
 pub struct FutureMoveConfig {
    /// Max depth of that we should try and traverse
    pub max_depth: usize,
@@ -87,21 +87,17 @@ impl std::fmt::Display for FutureMoveConfig {
    }
 }

-#[derive(Debug, Clone, Copy, Allocative)]
+#[derive(Debug, Clone, Copy, Allocative, Default)]
 #[allow(dead_code)]
 pub enum ChildrenEvalMethod {
    /// Best so far?
+    // #[default]
    MinMax,

+    #[default]
    MinMaxProb,
 }

-impl Default for ChildrenEvalMethod {
-    fn default() -> Self {
-        Self::MinMax
-    }
-}
-
 impl FutureMoves {
    pub const fn new(agent_color: Piece, config: FutureMoveConfig) -> Self {
        Self {
@@ -113,6 +109,9 @@ impl FutureMoves {
        }
    }

+    pub const ARENA_ENTRY_SIZE: usize =
+        size_of::<Move>() + size_of::<usize>() * (Board::AREA.0 as usize / 4);
+
    /// Return the length of the Arena
    pub fn arena_len(&self) -> usize {
        self.arena.len()
@@ -214,18 +213,7 @@ impl FutureMoves {
    }

    fn create_move(&self, coord: MoveCoord, board: Board, color: Piece) -> Move {
-        Move::new(
-            coord,
-            board,
-            color,
-            self.agent_color,
-            MoveValueConfig {
-                self_value_raw: matches!(
-                    self.config.children_eval_method,
-                    ChildrenEvalMethod::MinMaxProb
-                ),
-            },
-        )
+        Move::new(coord, board, color, self.agent_color, MoveValueConfig {})
    }

    fn generate_children_raw(&self, parent_idx: usize) -> Vec<Move> {
@@ -308,23 +296,6 @@ impl FutureMoves {
                    .iter()
                    .map(|&child| self.arena[child].value)
                    .collect::<Vec<_>>();
-
-                match self.config.children_eval_method {
-                    ChildrenEvalMethod::MinMax => {
-                        let child_value = if self.arena[idx].color == self.agent_color {
-                            // get best (for the adversary) enemy play
-                            // this assumes the adversary is playing optimally
-
-                            children_values.into_iter().map(|x| x.value).min()
-                        } else {
-                            children_values.into_iter().map(|x| x.value).max()
-                        }
-                        .unwrap_or(0);
-
-                        self.arena[idx].value.value =
-                            self.arena[idx].self_value.value + child_value;
-                    }
-                    ChildrenEvalMethod::MinMaxProb => {
                let child_value = if self.arena[idx].color == self.agent_color {
                    // get best (for the adversary) enemy play
                    // this assumes the adversary is playing optimally
@@ -335,11 +306,18 @@ impl FutureMoves {
                }
                .cloned()
                .unwrap_or(Default::default());
-
                self.arena[idx].value = self.arena[idx].self_value;
+
+                match self.config.children_eval_method {
+                    ChildrenEvalMethod::MinMax => {
+                        self.arena[idx].value.value += child_value.value;
+                        self.arena[idx].value.set_state(child_value.state());
+                    }
+                    ChildrenEvalMethod::MinMaxProb => {
                        self.arena[idx]
                            .value
                            .populate_self_from_children(&children_values);
+
                        self.arena[idx].value.value += child_value.value;
                    }
                }
@@ -386,12 +364,15 @@ impl FutureMoves {
    /// Return the best move which is a child of `self.current_root`
    pub fn best_move(&self) -> Option<MoveCoord> {
        self.current_root
-            .and_then(|x| {
-                self.arena[x]
+            .and_then(|x| match self.config.children_eval_method {
+                ChildrenEvalMethod::MinMax => self.arena[x]
                    .children
                    .iter()
-                    // this would be considered `minimax`
-                    .max_by_key(|&&idx| self.arena[idx].value)
+                    .max_by_key(|&&idx| self.arena[idx].value),
+                ChildrenEvalMethod::MinMaxProb => self.arena[x]
+                    .children
+                    .iter()
+                    .max_by_key(|&&idx| self.arena[idx].value),
            })
            .inspect(|&&x| {
                assert_eq!(
--- a/src/logic/move.rs
+++ b/src/logic/move.rs
@@ -38,9 +38,7 @@ pub struct Move {
    pub is_trimmed: bool,
 }

-pub struct MoveValueConfig {
-    pub self_value_raw: bool,
-}
+pub struct MoveValueConfig {}

 impl Move {
    pub fn new(
@@ -48,7 +46,7 @@ impl Move {
        board: Board,
        color: Piece,
        agent_color: Piece,
-        mvc: MoveValueConfig,
+        _: MoveValueConfig,
    ) -> Self {
        let mut m = Move {
            coord,
@@ -76,30 +74,11 @@ impl Move {
            Winner::None => {}
        }

-        if mvc.self_value_raw {
        m.self_value.value =
            const { BoardValueMap::weighted() }.board_value(&board, agent_color) as i32;
-        } else {
-            m.self_value.value = m.compute_self_value(agent_color, &board, mvc) as i32;
-        }
        m
    }

-    fn compute_self_value(&self, agent_color: Piece, board: &Board, _mvc: MoveValueConfig) -> i16 {
-        if self.winner == Winner::Player(!agent_color) {
-            // if this board results in the opponent winning, MAJORLY negatively weigh this move
-            // NOTE! this branch isn't completely deleted because if so, the bot wouldn't make a move.
-            // We shouldn't prune branches because we still need to always react to the opponent's moves
-            return i16::MIN + 1;
-        } else if self.winner == Winner::Player(agent_color) {
-            // results in a win for the agent
-            return i16::MAX - 1;
-        }
-
-        // I guess ignore Ties here, don't give them an explicit value,
-        const { BoardValueMap::weighted() }.board_value(board, agent_color)
-    }
-
    /// Sort children of the [`Move`] by their self_value in `arena`
    pub fn sort_children(&mut self, arena: &[Move]) {
        self.children.sort_by(|&a, &b| {
--- a/src/logic/mvs.rs
+++ b/src/logic/mvs.rs
@@ -19,10 +19,11 @@ pub struct MoveValueStats {

 impl MoveValueStats {
    #[cfg(test)]
-    pub fn new_from_wins_losses(wins: u16, losses: u16) -> Self {
+    pub fn new_from_outcomes(wins: u16, losses: u16, ties: u16) -> Self {
        Self {
            wins,
            losses,
+            ties,
            ..Default::default()
        }
    }
@@ -55,22 +56,19 @@ impl MoveValueStats {
        self.state = state;
    }

+    pub const fn state(&self) -> Option<MVSGameState> {
+        self.state
+    }
+
    pub fn populate_self_from_children(&mut self, others: &[Self]) {
-        self.wins = others.iter().map(|x| x.wins).sum::<u16>()
-            + others
-                .iter()
-                .filter(|x| x.state == Some(MVSGameState::Win))
-                .count() as u16;
-        self.losses = others.iter().map(|x| x.losses).sum::<u16>()
-            + others
-                .iter()
-                .filter(|x| x.state == Some(MVSGameState::Loss))
-                .count() as u16;
-        self.ties = others.iter().map(|x| x.ties).sum::<u16>()
-            + others
-                .iter()
-                .filter(|x| x.state == Some(MVSGameState::Tie))
-                .count() as u16;
+        (self.wins, self.losses, self.ties) =
+            others.iter().fold((0, 0, 0), |(wins, losses, ties), x| {
+                (
+                    wins + x.wins + (x.state == Some(MVSGameState::Win)) as u16,
+                    losses + x.losses + (x.state == Some(MVSGameState::Loss)) as u16,
+                    ties + x.ties + (x.state == Some(MVSGameState::Tie)) as u16,
+                )
+            });
    }
 }

@@ -87,7 +85,7 @@ impl Ord for MoveValueStats {
        }

        let (s_cw, o_cw) = (self.chance_win(), other.chance_win());
-        if s_cw.is_some() | o_cw.is_some() {
+        if s_cw.is_some() || o_cw.is_some() {
            if s_cw > o_cw {
                return Ordering::Greater;
            } else if o_cw > s_cw {
@@ -105,29 +103,62 @@ mod tests {

    #[test]
    fn two_prob() {
-        let one = MoveValueStats::new_from_wins_losses(10, 4);
-        let two = MoveValueStats::new_from_wins_losses(4, 6);
+        let one = MoveValueStats::new_from_outcomes(100, 40, 0);
+
+        let two = MoveValueStats::new_from_outcomes(40, 60, 0);
        assert!(one > two);
    }

    #[test]
    fn one_prob_one_non() {
-        let one = MoveValueStats::new_from_wins_losses(10, 4);
+        let one = MoveValueStats::new_from_outcomes(100, 4, 0);
        let two = MoveValueStats::new_from_value(10);
        assert!(one > two);
    }

    #[test]
    fn one_prob_one_win() {
-        let one = MoveValueStats::new_from_wins_losses(10, 4);
+        let one = MoveValueStats::new_from_outcomes(100, 4, 0);
        let two = MoveValueStats::new_from_state(Some(MVSGameState::Win));
        assert!(one < two);
    }

    #[test]
    fn two_prob_zero() {
-        let one = MoveValueStats::new_from_wins_losses(10, 0);
-        let two = MoveValueStats::new_from_wins_losses(0, 6);
+        let one = MoveValueStats::new_from_outcomes(100, 0, 0);
+        let two = MoveValueStats::new_from_outcomes(0, 60, 0);
        assert!(one > two);
    }
+
+    #[test]
+    fn test_children_pop() {
+        let mut a = MoveValueStats::new_from_value(0);
+
+        let children = vec![
+            MoveValueStats::new_from_outcomes(1, 0, 0),
+            MoveValueStats::new_from_outcomes(0, 2, 0),
+            MoveValueStats::new_from_outcomes(0, 0, 3),
+        ];
+        a.populate_self_from_children(&children);
+        assert_eq!(a.wins, 1, "Wins should be 1");
+        assert_eq!(a.losses, 2, "Losses should be 2");
+        assert_eq!(a.ties, 3, "Ties should be 3");
+    }
+
+    #[test]
+    fn test_children_pop_state() {
+        let mut a = MoveValueStats::new_from_value(0);
+
+        let children = vec![
+            MoveValueStats::new_from_state(Some(MVSGameState::Win)),
+            MoveValueStats::new_from_state(Some(MVSGameState::Win)),
+            MoveValueStats::new_from_state(Some(MVSGameState::Loss)),
+            MoveValueStats::new_from_state(Some(MVSGameState::Tie)),
+            MoveValueStats::new_from_state(Some(MVSGameState::Tie)),
+        ];
+        a.populate_self_from_children(&children);
+        assert_eq!(a.wins, 2, "Wins should be 2");
+        assert_eq!(a.losses, 1, "Losses should be 1");
+        assert_eq!(a.ties, 2, "Ties should be 2");
+    }
 }
--- a/src/main.rs
+++ b/src/main.rs
@@ -39,7 +39,7 @@ fn main() {
        min_arena_depth: 14,
        top_k_children: 2,
        up_to_minus: 10,
-        max_arena_size: 200_000_000,
+        max_arena_size: 50_000_000,
        do_prune: false,
        print: true,
        children_eval_method: Default::default(),
--- a/src/repr/pos_map.rs
+++ b/src/repr/pos_map.rs
@@ -14,12 +14,12 @@ impl<T: Copy> PosMap<T> {
        Self(MaybeUninit::zeroed().assume_init())
    }

-    pub const fn from(v: [[T; Board::SIZE as usize]; Board::SIZE as usize]) -> Self {
+    pub const fn from(mut v: [[T; Board::SIZE as usize]; Board::SIZE as usize]) -> Self {
        let mut n = unsafe { Self::uninit() };

        const_for!(i in 0..Board::SIZE => {
            const_for!(j in 0..Board::SIZE => {
-                n.set(CoordPair::from_axes(i, j), v[i as usize][j as usize]);
+                std::mem::swap(n.get_mut(CoordPair::from_axes(i, j)), &mut v[i as usize][j as usize]);
            });
        });
        n
Author	SHA1	Message	Date
Simon Gardling	4ca6dfc572	commit old stuff	2025-07-24 23:19:09 -07:00
Simon Gardling	ef2e551085	posmap: use std::mem::swap	2025-04-30 18:08:40 -04:00
Simon Gardling	b5e73cbbcf	elo: improve code quality and add confidence intervals	2025-04-30 13:52:19 -04:00
Simon Gardling	aeca76fda6	fix typo	2025-04-29 18:43:38 -04:00
Simon Gardling	111ce718da	cleanup minmax impl	2025-04-29 18:32:44 -04:00
Simon Gardling	9342760d82	simplify populate_self_from_children	2025-04-29 18:20:53 -04:00
Simon Gardling	967f1f6efb	elo: fix display	2025-04-28 20:00:43 -04:00
Simon Gardling	94831b720b	elo: simplify config	2025-04-28 19:45:47 -04:00
Simon Gardling	e966a3ac9a	elo: starting board pos	2025-04-28 19:11:26 -04:00
Simon Gardling	c50892d79a	elo: edit settings	2025-04-28 19:02:40 -04:00
Simon Gardling	6b9516a510	fix logic and minmax	2025-04-28 18:44:37 -04:00
Simon Gardling	eedc80e46a	fixes	2025-04-28 01:43:24 -04:00