Skip to content

Commit f3f8b75

Browse files
authored
v1.0.0 + Format (#96)
Bench: 184439
1 parent b00a6f1 commit f3f8b75

30 files changed

+136
-70
lines changed

.cargo/config.toml

-2
This file was deleted.

.gitignore

+1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,5 @@
11
/target
2+
/.cargo
23
*-policy-*
34
*.data
45
*.binpack

Cargo.lock

+1-1
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

Cargo.toml

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
[package]
22
name = "monty"
3-
version = "0.1.0"
3+
version = "1.0.0"
44
edition = "2021"
55
authors = ["Jamie Whiting"]
66

README.md

+23-8
Original file line numberDiff line numberDiff line change
@@ -4,22 +4,37 @@
44
#### "MCTS is cool."
55

66
![License](https://img.shields.io/github/license/jw1912/monty?style=for-the-badge)
7-
[![GitHub release (latest by date)](https://img.shields.io/github/v/release/jw1912/monty?style=for-the-badge)](https://github.com/jw1912/akimbo/releases/latest)
8-
[![Commits](https://img.shields.io/github/commits-since/jw1912/monty/latest?style=for-the-badge)](https://github.com/jw1912/akimbo/commits/main)
7+
[![GitHub release (latest by date)](https://img.shields.io/github/v/release/jw1912/monty?style=for-the-badge)](https://github.com/jw1912/monty/releases/latest)
8+
[![Commits](https://img.shields.io/github/commits-since/jw1912/monty/latest?style=for-the-badge)](https://github.com/jw1912/monty/commits/main)
99

1010
</div>
1111

1212
## Compiling
1313
You need a network file, and run the following command
1414
```
15-
make <name of game> EVALFILE=<relative path to network file>
15+
make <name of game (lowercase)> EXE=<output path> EVALFILE=<path to network file>
1616
```
17-
to compile monty for the given game.
17+
to compile monty for the given game (chess, ataxx, shatranj).
1818

19-
## Supported Games
20-
- Ataxx
21-
- Chess
22-
- Shatranj
19+
## Originality Status
20+
21+
The first version (0.1.0) used external data for value networks and self-generated policy data. The networks were then reset
22+
completely, and all future versions are trained exclusively on monty's own data, generated from scratch with uniform policy
23+
and material counting value.
24+
25+
## Credits
26+
Thanks to everyone at SWE as usual, in particular Cosmo (Viridithas) and Zuppa (Alexandria), for helping with data generation, and Plutie, for running an LTC tune.
27+
28+
## ELO
29+
30+
<div align="center">
31+
32+
| Version | Release Date | CCRL 40/15 | CCRL Blitz | CCRL FRC | Notes |
33+
| :-: | :-: | :-: | :-: | :-: | :-: |
34+
| [1.0.0](https://github.com/jw1912/monty/releases/tag/v1.0.0) | 28th May 2024 | TBD | TBD | TBD | Fully Original Data |
35+
| [0.1.0](https://github.com/jw1912/monty/releases/tag/v0.1.0) | 26th March 2024 | - | - | 2974 | First Release |
36+
37+
</div>
2338

2439
## How it works
2540

build.rs

+4-4
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,10 @@
1-
#[cfg(not(feature="nonet"))]
1+
#[cfg(not(feature = "nonet"))]
22
use std::env;
33

4-
#[cfg(not(feature="nonet"))]
4+
#[cfg(not(feature = "nonet"))]
55
const DEFAULT_PATH: &str = "resources/net.network";
66

7-
#[cfg(not(feature="nonet"))]
7+
#[cfg(not(feature = "nonet"))]
88
fn main() {
99
println!("cargo:rerun-if-env-changed=EVALFILE");
1010
println!("cargo:rerun-if-changed=resources/chess.network");
@@ -15,5 +15,5 @@ fn main() {
1515
}
1616
}
1717

18-
#[cfg(feature="nonet")]
18+
#[cfg(feature = "nonet")]
1919
fn main() {}

datagen/src/bin/monty.rs

+4-1
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,8 @@
11
use datagen::{parse_args, run_datagen};
2-
use monty::{chess::{PolicyNetwork, ValueNetwork}, UciLike};
2+
use monty::{
3+
chess::{PolicyNetwork, ValueNetwork},
4+
UciLike,
5+
};
36

47
#[repr(C)]
58
struct Nets(ValueNetwork, PolicyNetwork);

datagen/src/bin/montyj.rs

+5-2
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,8 @@
11
use datagen::{parse_args, run_datagen};
2-
use monty::{shatranj::{PolicyNetwork, Shatranj}, ValueNetwork};
2+
use monty::{
3+
shatranj::{PolicyNetwork, Shatranj},
4+
ValueNetwork,
5+
};
36

47
#[repr(C)]
58
struct Nets(ValueNetwork<768, 8>, PolicyNetwork);
@@ -15,4 +18,4 @@ fn main() {
1518
let (threads, book, policy) = parse_args(args);
1619

1720
run_datagen::<Shatranj, 112>(1_000, threads, policy, "Shatranj", &POLICY, &VALUE, book);
18-
}
21+
}

datagen/src/bin/montyxx.rs

+5-2
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,8 @@
11
use datagen::{parse_args, run_datagen};
2-
use monty::{ataxx::{Ataxx, PolicyNetwork}, ValueNetwork};
2+
use monty::{
3+
ataxx::{Ataxx, PolicyNetwork},
4+
ValueNetwork,
5+
};
36

47
#[repr(C)]
58
struct Nets(ValueNetwork<2916, 256>, PolicyNetwork);
@@ -15,4 +18,4 @@ fn main() {
1518
let (threads, book, policy) = parse_args(args);
1619

1720
run_datagen::<Ataxx, 114>(1_000, threads, policy, "Ataxx", &POLICY, &VALUE, book);
18-
}
21+
}

datagen/src/impls/chess.rs

+1-1
Original file line numberDiff line numberDiff line change
@@ -197,7 +197,7 @@ impl Binpack {
197197
let mov = u16::from_le_bytes([buf[0], buf[1]]);
198198
let score = i16::from_le_bytes([buf[2], buf[3]]);
199199

200-
f(&mut board, &castling,mov.into(), score, result);
200+
f(&mut board, &castling, mov.into(), score, result);
201201
}
202202

203203
Ok(())

datagen/src/impls/shatranj.rs

+1-1
Original file line numberDiff line numberDiff line change
@@ -191,4 +191,4 @@ impl Binpack {
191191

192192
Ok(())
193193
}
194-
}
194+
}

datagen/src/lib.rs

+7-3
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,11 @@ pub use thread::{write, DatagenThread};
88
use monty::{ataxx::Ataxx, chess::Chess, shatranj::Shatranj, GameRep};
99

1010
use std::{
11-
env::Args, fs::File, io::Read, sync::atomic::{AtomicBool, Ordering}, time::Duration
11+
env::Args,
12+
fs::File,
13+
io::Read,
14+
sync::atomic::{AtomicBool, Ordering},
15+
time::Duration,
1216
};
1317

1418
pub type AtaxxPolicyData = PolicyData<Ataxx, 114>;
@@ -145,11 +149,11 @@ pub fn parse_args(mut args: Args) -> (usize, Option<String>, bool) {
145149
1 => {
146150
threads = Some(arg.parse().expect("can't parse"));
147151
mode = 0;
148-
},
152+
}
149153
2 => {
150154
book = Some(arg);
151155
mode = 0;
152-
},
156+
}
153157
_ => println!("unrecognised argument {arg}"),
154158
},
155159
}

datagen/src/thread.rs

+8-3
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,12 @@ pub struct DatagenThread<'a, T: DatagenSupport> {
2222
}
2323

2424
impl<'a, T: DatagenSupport> DatagenThread<'a, T> {
25-
pub fn new(id: u32, params: MctsParams, stop: &'a AtomicBool, book: Option<Vec<&'a str>>) -> Self {
25+
pub fn new(
26+
id: u32,
27+
params: MctsParams,
28+
stop: &'a AtomicBool,
29+
book: Option<Vec<&'a str>>,
30+
) -> Self {
2631
Self {
2732
id,
2833
rng: Rand::with_seed(),
@@ -92,7 +97,6 @@ impl<'a, T: DatagenSupport> DatagenThread<'a, T> {
9297
T::from_fen(T::STARTPOS)
9398
};
9499

95-
96100
// play 8 or 9 random moves
97101
for _ in 0..(8 + (self.rng.rand_int() % 2)) {
98102
let mut moves = Vec::new();
@@ -129,7 +133,8 @@ impl<'a, T: DatagenSupport> DatagenThread<'a, T> {
129133

130134
// play out game
131135
loop {
132-
let mut searcher = Searcher::new(position.clone(), tree, self.params.clone(), policy, value);
136+
let mut searcher =
137+
Searcher::new(position.clone(), tree, self.params.clone(), policy, value);
133138

134139
let (bm, score) = searcher.search(limits, false, &mut 0, &None);
135140

src/bin/monty.rs

+6-4
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,12 @@
1-
use monty::{chess::{ValueNetwork, PolicyNetwork, Uci}, UciLike};
1+
use monty::{
2+
chess::{PolicyNetwork, Uci, ValueNetwork},
3+
UciLike,
4+
};
25

36
#[repr(C)]
47
struct Nets(ValueNetwork, PolicyNetwork);
58

6-
const NETS: Nets =
7-
unsafe { std::mem::transmute(*include_bytes!("../../resources/net.network")) };
9+
const NETS: Nets = unsafe { std::mem::transmute(*include_bytes!("../../resources/net.network")) };
810

911
static VALUE: ValueNetwork = NETS.0;
1012
static POLICY: PolicyNetwork = NETS.1;
@@ -19,4 +21,4 @@ fn main() {
1921
}
2022

2123
Uci::run(&POLICY, &VALUE);
22-
}
24+
}

src/bin/montyj.rs

+6-4
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,12 @@
1-
use monty::{shatranj::{Uci, PolicyNetwork}, UciLike, ValueNetwork};
1+
use monty::{
2+
shatranj::{PolicyNetwork, Uci},
3+
UciLike, ValueNetwork,
4+
};
25

36
#[repr(C)]
47
struct Nets(ValueNetwork<768, 8>, PolicyNetwork);
58

6-
const NETS: Nets =
7-
unsafe { std::mem::transmute(*include_bytes!("../../resources/net.network")) };
9+
const NETS: Nets = unsafe { std::mem::transmute(*include_bytes!("../../resources/net.network")) };
810

911
static VALUE: ValueNetwork<768, 8> = NETS.0;
1012
static POLICY: PolicyNetwork = NETS.1;
@@ -19,4 +21,4 @@ fn main() {
1921
}
2022

2123
Uci::run(&POLICY, &VALUE);
22-
}
24+
}

src/bin/montyxx.rs

+6-5
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,12 @@
1-
use monty::{ataxx::{Uai, PolicyNetwork}, UciLike, ValueNetwork};
2-
1+
use monty::{
2+
ataxx::{PolicyNetwork, Uai},
3+
UciLike, ValueNetwork,
4+
};
35

46
#[repr(C)]
57
struct Nets(ValueNetwork<2916, 256>, PolicyNetwork);
68

7-
const NETS: Nets =
8-
unsafe { std::mem::transmute(*include_bytes!("../../resources/net.network")) };
9+
const NETS: Nets = unsafe { std::mem::transmute(*include_bytes!("../../resources/net.network")) };
910

1011
static VALUE: ValueNetwork<2916, 256> = NETS.0;
1112
static POLICY: PolicyNetwork = NETS.1;
@@ -20,4 +21,4 @@ fn main() {
2021
}
2122

2223
Uai::run(&POLICY, &VALUE);
23-
}
24+
}

src/comm.rs

+11-5
Original file line numberDiff line numberDiff line change
@@ -15,10 +15,7 @@ pub trait UciLike: Sized {
1515

1616
fn options();
1717

18-
fn run(
19-
policy: &<Self::Game as GameRep>::Policy,
20-
value: &<Self::Game as GameRep>::Value,
21-
) {
18+
fn run(policy: &<Self::Game as GameRep>::Policy, value: &<Self::Game as GameRep>::Value) {
2219
let mut prev = None;
2320
let mut pos = Self::Game::default();
2421
let mut params = Self::Game::default_mcts_params();
@@ -41,7 +38,16 @@ pub trait UciLike: Sized {
4138
"setoption" => setoption(&commands, &mut params, &mut report_moves, &mut tree),
4239
"position" => position(commands, &mut pos, &mut prev, &mut tree),
4340
"go" => {
44-
let res = go(&commands, tree, prev, &pos, &params, report_moves, policy, value);
41+
let res = go(
42+
&commands,
43+
tree,
44+
prev,
45+
&pos,
46+
&params,
47+
report_moves,
48+
policy,
49+
value,
50+
);
4551

4652
tree = res.0;
4753
prev = Some(res.1);

src/games.rs

+2-1
Original file line numberDiff line numberDiff line change
@@ -54,7 +54,8 @@ pub trait GameRep: Clone + Default + Send + Sync {
5454

5555
fn get_policy_feats(&self) -> Self::PolicyInputs;
5656

57-
fn get_policy(&self, mov: Self::Move, feats: &Self::PolicyInputs, policy: &Self::Policy) -> f32;
57+
fn get_policy(&self, mov: Self::Move, feats: &Self::PolicyInputs, policy: &Self::Policy)
58+
-> f32;
5859

5960
fn get_value(&self, value: &Self::Value) -> i32;
6061

src/games/chess.rs

+1-1
Original file line numberDiff line numberDiff line change
@@ -147,7 +147,7 @@ impl GameRep for Chess {
147147
&self,
148148
mov: Self::Move,
149149
(feats, threats): &Self::PolicyInputs,
150-
policy: &Self::Policy
150+
policy: &Self::Policy,
151151
) -> f32 {
152152
policy.get(&self.board, &mov, feats, *threats)
153153
}

src/games/chess/board.rs

+1-5
Original file line numberDiff line numberDiff line change
@@ -160,11 +160,7 @@ impl Board {
160160

161161
pub fn map_value_features<F: FnMut(usize)>(&self, mut f: F) {
162162
let flip = self.stm() == Side::BLACK;
163-
let hm = if self.king_index() % 8 > 3 {
164-
7
165-
} else {
166-
0
167-
};
163+
let hm = if self.king_index() % 8 > 3 { 7 } else { 0 };
168164

169165
let mut threats = self.threats_by(self.stm() ^ 1);
170166
let mut defences = self.threats_by(self.stm());

src/games/chess/frc.rs

+4-1
Original file line numberDiff line numberDiff line change
@@ -42,7 +42,10 @@ impl Castling {
4242
rook_files = [[0, 7]; 2];
4343
}
4444

45-
let mut ret = Self { rook_files, ..Default::default() };
45+
let mut ret = Self {
46+
rook_files,
47+
..Default::default()
48+
};
4649

4750
ret.castle_mask[usize::from(rook_files[0][0])] = 7;
4851
ret.castle_mask[usize::from(rook_files[0][1])] = 11;

src/games/chess/value.rs

+2-2
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ const SCALE: i32 = 400;
44

55
#[repr(C)]
66
pub struct ValueNetwork {
7-
l1: Layer<{768 * 4}, 512>,
7+
l1: Layer<{ 768 * 4 }, 512>,
88
l2: Layer<512, 16>,
99
l3: Layer<16, 16>,
1010
l4: Layer<16, 16>,
@@ -72,7 +72,7 @@ struct Accumulator<const HIDDEN: usize> {
7272
vals: [f32; HIDDEN],
7373
}
7474

75-
impl<const HIDDEN: usize> Accumulator<HIDDEN> {
75+
impl<const HIDDEN: usize> Accumulator<HIDDEN> {
7676
fn madd(&mut self, mul: f32, other: &Self) {
7777
for (i, &j) in self.vals.iter_mut().zip(other.vals.iter()) {
7878
*i += mul * j;

src/games/shatranj.rs

+6-1
Original file line numberDiff line numberDiff line change
@@ -129,7 +129,12 @@ impl GameRep for Shatranj {
129129
feats
130130
}
131131

132-
fn get_policy(&self, mov: Self::Move, feats: &goober::SparseVector, policy: &Self::Policy) -> f32 {
132+
fn get_policy(
133+
&self,
134+
mov: Self::Move,
135+
feats: &goober::SparseVector,
136+
policy: &Self::Policy,
137+
) -> f32 {
133138
policy.get(&self.board, &mov, feats)
134139
}
135140

src/lib.rs

+1-1
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ mod tree;
66
mod value;
77

88
pub use comm::UciLike;
9-
pub use games::{GameRep, GameState, ataxx, chess, shatranj};
9+
pub use games::{ataxx, chess, shatranj, GameRep, GameState};
1010
pub use mcts::{Limits, Searcher};
1111
pub use params::MctsParams;
1212
pub use tree::Tree;

0 commit comments

Comments
 (0)