knoxel committed on
Commit
65fbc13
·
verified ·
1 Parent(s): fa1acc2

Upload results.json

Browse files
Files changed (1) hide show
  1. results.json +44 -0
results.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "paper": {
3
+ "title": "Less is More: Parameter-Free Text Classification with Gzip",
4
+ "arxiv_id": "2212.09410",
5
+ "authors": "Zhiying Jiang, Matthew Y. R. Yang, Mikhail Tsirlin, Raphael Tang, Jimmy Lin",
6
+ "year": 2022
7
+ },
8
+ "method": {
9
+ "name": "gzip + NCD + kNN",
10
+ "num_parameters": 0,
11
+ "requires_training": false,
12
+ "requires_gpu": false,
13
+ "description": "Normalized Compression Distance using gzip as compressor with k-nearest-neighbor classification. NCD(x,y) = (C(xy) - min(C(x),C(y))) / max(C(x),C(y))"
14
+ },
15
+ "dataset": "fancyzhx/ag_news",
16
+ "config": {
17
+ "train_samples_per_class": 500,
18
+ "total_train_samples": 2000,
19
+ "test_samples": 200,
20
+ "k_values_tested": [1, 2, 3, 5, 7],
21
+ "best_k": 7,
22
+ "compressor": "gzip",
23
+ "random_seed": 42
24
+ },
25
+ "best_result": {
26
+ "k": 7,
27
+ "accuracy": 0.775,
28
+ "macro_f1": 0.773
29
+ },
30
+ "sweep_results": {
31
+ "k1": {"accuracy": 0.725, "macro_f1": 0.720},
32
+ "k2": {"accuracy": 0.725, "macro_f1": 0.720},
33
+ "k3": {"accuracy": 0.735, "macro_f1": 0.733},
34
+ "k5": {"accuracy": 0.760, "macro_f1": 0.755},
35
+ "k7": {"accuracy": 0.775, "macro_f1": 0.773}
36
+ },
37
+ "paper_comparison": {
38
+ "paper_full_train_accuracy": 0.937,
39
+ "paper_bert_accuracy": 0.944,
40
+ "our_accuracy": 0.775,
41
+ "our_train_fraction": "2000/120000"
42
+ },
43
+ "hardware": "CPU only (cpu-basic, 2 vCPU)"
44
+ }