vivekjoshy
diff --git a/‎.gitattributes‎
Lines changed: 1 addition & 0 deletions b/‎.gitattributes‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎.gitignore‎
Lines changed: 3 additions & 0 deletions b/‎.gitignore‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎benchmark/README.md‎
Lines changed: 12 additions & 0 deletions b/‎benchmark/README.md‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎benchmark/benchmark.py‎
Lines changed: 14 additions & 5 deletions b/‎benchmark/benchmark.py‎
Lines changed: 14 additions & 5 deletions
diff --git a/‎benchmark/data/pubg.7z‎
Lines changed: 3 additions & 0 deletions b/‎benchmark/data/pubg.7z‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎benchmark/processors/__init__.py‎
Lines changed: 1 addition & 0 deletions b/‎benchmark/processors/__init__.py‎
Lines changed: 1 addition & 0 deletions
@@ -1,2 +1,3 @@
 *.csv filter=lfs diff=lfs merge=lfs -text
 *.jsonl filter=lfs diff=lfs merge=lfs -text
+*.7z filter=lfs diff=lfs merge=lfs -text
@@ -133,3 +133,6 @@ dmypy.json
 
 # PDM
 /.pdm-build/
+
+# Data Files
+/benchmark/data/pubg.csv
@@ -0,0 +1,12 @@
+# Benchmark Instructions
+
+Run ``benchmark.py`` with a compatible Python version and select the options when prompted.
+
+## Available Benchmarks
+
+- ``Win``: Compares win performance against TrueSkill.
+- ``Draw``: Predicts draws on standard chess matches.
+- ``Rank``: Predicts the rank of players.
+- ``Large``: Uses rank prediction on a large multi-faction dataset.
+
+The ``Large`` benchmark requires the ``pubg.csv`` file (around 1 GB) to be extracted from ``pubg.7z`` and placed in the ``data`` folder.
@@ -1,3 +1,4 @@
+from processors import Draw, Large, Rank, Win
 from prompt_toolkit import HTML
 from prompt_toolkit import print_formatted_text as print
 from prompt_toolkit import prompt
@@ -11,7 +12,6 @@
     ThurstoneMostellerFull,
     ThurstoneMostellerPart,
 )
-from processors import Draw, Rank, Win
 
 
 class NumberValidator(Validator):
@@ -39,7 +39,7 @@ def validate(self, document):
 model_names = {m.__name__: m for m in models}
 model_completer = WordCompleter(list(model_names.keys()))
 
-benchmark_types = [Win, Draw, Rank]
+benchmark_types = [Win, Draw, Rank, Large]
 benchmark_type_names = {_.__name__: _ for _ in benchmark_types}
 benchmark_types_completer = WordCompleter(list(benchmark_type_names.keys()))
 
@@ -92,6 +92,15 @@ def validate(self, document):
         )
         rank_processor.process()
         rank_processor.print_result()
-else:
-    print(HTML("<style fg='Red'>Processor Not Found</style>"))
-    quit()
+    elif input_benchmark_type == "Large":
+        large_processor = Large(
+            path="data/pubg.csv",
+            seed=input_seed,
+            minimum_matches=minimum_matches,
+            model=model,
+        )
+        large_processor.process()
+        large_processor.print_result()
+    else:
+        print(HTML("<style fg='Red'>Processor Not Found</style>"))
+        quit()
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3e24c9fdee00f5ca20a9da3ec05feff2e0305be6d3832eeecac995c3504f4e48
+size 131884839
@@ -1,3 +1,4 @@
 from .draw import Draw
+from .large import Large
 from .rank import Rank
 from .win import Win
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,3 @@`
`1`	`1`	`*.csv filter=lfs diff=lfs merge=lfs -text`
`2`	`2`	`*.jsonl filter=lfs diff=lfs merge=lfs -text`
	`3`	`+*.7z filter=lfs diff=lfs merge=lfs -text`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+version https://git-lfs.github.com/spec/v1`
	`2`	`+oid sha256:3e24c9fdee00f5ca20a9da3ec05feff2e0305be6d3832eeecac995c3504f4e48`
	`3`	`+size 131884839`