/ pyod / utils / knowledge / benchmarks.json
benchmarks.json
 1  {
 2    "ADBench": {
 3      "paper": {"id": "adbench", "short": "Han et al., NeurIPS 2022"},
 4      "scope": "tabular",
 5      "n_datasets": 57,
 6      "n_algorithms": 30,
 7      "rankings": {
 8        "overall_top_5": ["ECOD", "IForest", "KNN", "COPOD", "HBOS"],
 9        "high_dim_top_3": ["ECOD", "COPOD", "IForest"],
10        "low_dim_top_3": ["KNN", "LOF", "CBLOF"]
11      },
12      "key_finding": "No single algorithm dominates; ensemble of top-5 is robust"
13    },
14    "NLP_ADBench": {
15      "paper": {"id": "nlp_adbench", "short": "Li et al., EMNLP 2025"},
16      "scope": "text",
17      "n_datasets": 8,
18      "n_algorithms": 19,
19      "rankings": {
20        "overall_top_5": ["OpenAI+LUNAR", "OpenAI+LOF", "OpenAI+AE", "MiniLM+KNN", "BERT+LOF"]
21      },
22      "key_finding": "Embedding quality >> detector choice; two-step beats end-to-end"
23    },
24    "TSB_AD": {
25      "paper": {"id": "tsb_ad", "short": "Liu & Paparrizos, NeurIPS 2024"},
26      "scope": "time_series",
27      "n_datasets": 1070,
28      "n_algorithms": 40,
29      "rankings": {
30        "overall_top_5": ["IForest", "LOF", "POLY", "KNN", "KShapeAD"],
31        "subsequence_top_3": ["MatrixProfile", "SAND", "Series2Graph"]
32      },
33      "key_finding": "Classical methods competitive with deep; MatrixProfile strong on subsequence anomalies"
34    },
35    "BOND": {
36      "paper": {"id": "liu2022bond", "short": "Liu et al., NeurIPS 2022"},
37      "scope": "graph",
38      "n_datasets": 14,
39      "n_algorithms": 14,
40      "rankings": {
41        "deep_top_3": ["DOMINANT", "CoLA", "CONAD"],
42        "classical_top_2": ["Radar", "ANOMALOUS"]
43      },
44      "key_finding": "DOMINANT and CoLA are most reliable deep methods; classical MF methods competitive on small graphs"
45    }
46  }