Comparing rank aggregation algorithms with PyFLAGR¶

The fusion of multiple ranked lists of elements into a single aggregate list is a well-studied research field with numerous applications in Bioinformatics, recommendation systems, collaborative filtering, election systems and metasearch engines.

FLAGR is a high-performance, modular, open-source C++ library for rank aggregation problems. It implements baseline and recent state-of-the-art aggregation algorithms that accept multiple ranked preference lists and generate a single consensus list of elements. A portion of these methods apply exploratory analysis techniques and belong to the broad family of unsupervised learning methods.

Installation¶

PyFLAGR is a Python library built on top of the FLAGR library core. It can be easily installed with pip:

pip install pyflagr

After installation, PyFLAGR can be used in standard Python programs and Jupyter notebooks. Representative code examples can be found in this notebook.

Downloads, Documentation, Version and License¶

  • The source code of FLAGR and PyFLAGR is available through the official GitHub repository.
  • The library is fully documented at https://flagr.site/.
  • The current (Py)FLAGR version is 1.0.18.
  • Both libraries are licensed under the Apache License, version 2.

Importing and using PyFLAGR¶

PyFLAGR groups its supported rank aggregation methods into six modules:

  1. Linear: This module contains the CombSUM, CombMNZ, Borda and SimpleBorda classes. CombSUM and CombMNZ support five normalization methods (see Renda et al., 2003). Borda and SimpleBorda are just wrappers of CombSUM with borda and simple-borda normalization.
  2. Majoritarian: Includes:
    • CondorcetWinners,
    • CopelandWinners and
    • OutrankingApproach (Farah and Vanderpooten, 2007).
  3. MarkovChains: Implements:
    • the four Markov Chain methods of Dwork et al., 2001 and
    • the MCT variant of DeConde et al., 2006.
  4. Kemeny: Includes KemenyOptimal (Kemeny Optimal Aggregation).
  5. RRA: Includes RobustRA (Robust Rank Aggregation of Kolde et al., 2012 in two variants).
  6. Weighted: This module implements several self-weighting rank aggregation methods. These methods automatically identify the expert voters and include:
    • The Preference Relations Graph method of Desarkar et al., 2016.
    • The Agglomerative method of Chatterjee et al., 2018.
    • The Iterative, Distance-Based method (DIBRA) of Akritidis et al., 2022.

The following statements import all PyFLAGR rank aggregation modules (plus the Comparator module, which is used later in this notebook) in a typical Jupyter notebook.

In [1]:
# Import the PyFLAGR modules for rank aggregation
import pyflagr.Linear as Linear
import pyflagr.Majoritarian as Majoritarian
import pyflagr.MarkovChains as MarkovChains
import pyflagr.Kemeny as Kemeny
import pyflagr.RRA as RRA
import pyflagr.Weighted as Weighted
import pyflagr.Comparator as Comparator

Input/Output files¶

A rank aggregation application involves a set of queries $Q=\{q_1,q_2,...,q_N\}$ and a set of rankers $R=\{r_1,r_2,...r_m\}$. Each query $q\in{Q}$ is submitted to all rankers in $R$, who respond by returning a ranked list of preference items sorted in decreasing importance, or relevance order. For example, in the context of recommendation systems, a set of users may be asked to enlist their preferences as a response to the hypothetical query "which are your favorite games?". Then, a rank aggregation algorithm must merge all the submitted preference lists, discover any important latent information, and generate a single output list with improved element ordering.
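The core idea can be sketched in a few lines of plain Python. The snippet below is a general illustration of rank aggregation (a simple Borda count), not PyFLAGR's implementation; the voter lists are invented for the example:

```python
# A plain-Python illustration of rank aggregation via a simple Borda count:
# each item earns points equal to the number of items ranked below it in each
# voter's list, and the consensus list sorts items by total points.
from collections import defaultdict

def borda_aggregate(preference_lists):
    """Merge several ranked lists into a single consensus list."""
    scores = defaultdict(int)
    for ranking in preference_lists:
        n = len(ranking)
        for position, item in enumerate(ranking):
            scores[item] += n - 1 - position  # top item gets n-1 points
    # Sort by descending total score; break ties alphabetically for stability
    return sorted(scores, key=lambda item: (-scores[item], item))

# Three voters answer "which are your favorite games?"
voters = [
    ["chess", "go", "poker"],
    ["go", "chess", "poker"],
    ["go", "poker", "chess"],
]
print(borda_aggregate(voters))  # ['go', 'chess', 'poker']
```

Here "go" wins with 5 Borda points against 3 for "chess" and 1 for "poker", even though one voter ranked "chess" first.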

For the requirements of this notebook, we use a sample dataset that was created by employing RASDaGen, a synthetic dataset generator for rank aggregation applications. The dataset includes two files: testdata.csv and testdata_qrels.csv.

The former contains preference lists that were submitted by 50 voters for 20 queries. Each input list contains 30 elements. Therefore, the number of rows in this file is equal to $50 \times 20 \times 30=30000$. The columns of this CSV file must be organized in the following manner:

Query, Voter Name, Item Code, Item Score, Algorithm/Dataset

where

  • Query represents the topic for which the preference list is submitted,
  • Voter is the name of the ranker who submitted a preference list for a particular Query,
  • Item Code is a unique name that identifies each element of the preference lists,
  • Item Score is the preference score assigned to an item by a Voter, and
  • Algorithm/Dataset is a user-defined string that represents the origin of a particular preference list.

The input CSV file should not contain any headers. On the other hand, testdata_qrels.csv contains relevance judgments for the preference list elements of the primary input file for each query. It is organized in the following fashion:

Query, 0, Item Code, Relevance

where:

  • Query represents the topic for which the preference list is submitted,
  • 0: unused; this value must always be 0.
  • Item Code is a unique name that identifies each element of the preference lists,
  • Relevance is an integer value that represents the relevance of the item with respect to the mentioned Query. Typically, zero values represent irrelevant and incorrect elements; negative values represent spam elements; and positive values represent relevant, correct and informative elements.

Please refer to this article for more details.
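As a concrete illustration of the two formats described above, the following sketch writes a miniature pair of input files with Python's standard csv module. The filenames, queries, voters and scores are invented for the example; only the column layout follows the specification:

```python
# Write two tiny, header-less input files in the format described above.
import csv

# Preference lists: Query, Voter Name, Item Code, Item Score, Algorithm/Dataset
rows = [
    ["Topic 1", "Voter 1", "Item 3", 0.92, "demo"],
    ["Topic 1", "Voter 1", "Item 1", 0.71, "demo"],
    ["Topic 1", "Voter 2", "Item 1", 0.88, "demo"],
    ["Topic 1", "Voter 2", "Item 3", 0.45, "demo"],
]
with open("mini_lists.csv", "w", newline="") as f:
    csv.writer(f).writerows(rows)  # no header row, as required

# Relevance judgments: Query, 0, Item Code, Relevance
qrels_rows = [
    ["Topic 1", 0, "Item 1", 1],
    ["Topic 1", 0, "Item 3", 2],
]
with open("mini_qrels.csv", "w", newline="") as f:
    csv.writer(f).writerows(qrels_rows)
```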

In [2]:
# The input data file with the input lists to be aggregated.
lists = '../testdata/testdata.csv'

# The input data file with the relevance judgements.
qrels = '../testdata/testdata_qrels.csv'

The Comparator class¶

This notebook demonstrates PyFLAGR's tools for testing and comparing rank aggregation methods. Code examples that show how each method can be individually executed and evaluated are presented in another notebook named CodeExamples.ipynb. Here we present the Comparator class and its member methods.

This class allows the researchers to perform head-to-head comparisons of the performance of various rank aggregation algorithms.

Class constructor¶

The constructor receives a single argument that represents the cutoff point (termed evaluation points) at which the evaluation metrics will be computed. In the following example, we determine that the cutoff point is $10$, therefore, the following metrics will be computed:

  • Mean Average Precision (MAP),
  • Precision at points $1,2,\ldots,10$ (namely, $P@1,P@2,\ldots,P@10$),
  • Recall at points $1,2,\ldots,10$ (namely, $R@1,R@2,\ldots,R@10$),
  • Discounted Cumulative Gain, DCG (namely, $D@1,D@2,\ldots,D@10$), and
  • normalized Discounted Cumulative Gain, nDCG (namely, $N@1,N@2,\ldots,N@10$).
In [3]:
EV_PTS = 10

cmp = Comparator.Comparator(EV_PTS)

The aggregators array and the add_aggregator member function¶

The Comparator class contains an aggregators array that stores the rank aggregation methods to be compared. Each rank aggregation method is handled by an object that is passed to Comparator via the add_aggregator member function.

Notice that the eval_pts parameter that is passed to each class constructor must be equal to the aforementioned value of the cutoff parameter. In the following example, we pass 21 rank aggregation methods to Comparator. This means that all these methods will be included in the evaluation tests.

In [4]:
cmp.add_aggregator("CombSUM-Rank", Linear.CombSUM(norm='rank', eval_pts=EV_PTS))
cmp.add_aggregator("CombSUM-Borda", Linear.CombSUM(norm='borda', eval_pts=EV_PTS))
cmp.add_aggregator("CombSUM-Score", Linear.CombSUM(norm='score', eval_pts=EV_PTS))
cmp.add_aggregator("CombMNZ-Rank", Linear.CombMNZ(norm='rank', eval_pts=EV_PTS))
cmp.add_aggregator("CombMNZ-Borda", Linear.CombMNZ(norm='borda', eval_pts=EV_PTS))
cmp.add_aggregator("CombMNZ-Score", Linear.CombMNZ(norm='score', eval_pts=EV_PTS))
cmp.add_aggregator("Condorcet", Majoritarian.CondorcetWinners(eval_pts=EV_PTS))
cmp.add_aggregator("Copeland", Majoritarian.CopelandWinners(eval_pts=EV_PTS))
cmp.add_aggregator("Outranking Approach", Majoritarian.OutrankingApproach(preference=0, veto=0.75, concordance=0,
                                                                          discordance=0.25, eval_pts=EV_PTS))
cmp.add_aggregator("MC1", MarkovChains.MC1(max_iterations=50, ergodic_number=0.15, eval_pts=EV_PTS))
cmp.add_aggregator("MC2", MarkovChains.MC2(max_iterations=50, ergodic_number=0.15, eval_pts=EV_PTS))
cmp.add_aggregator("MC3", MarkovChains.MC3(max_iterations=50, ergodic_number=0.15, eval_pts=EV_PTS))
cmp.add_aggregator("MC4", MarkovChains.MC4(max_iterations=50, ergodic_number=0.15, eval_pts=EV_PTS))
cmp.add_aggregator("MCT", MarkovChains.MCT(max_iterations=50, ergodic_number=0.15, eval_pts=EV_PTS))
cmp.add_aggregator("RRA-Exact", RRA.RRA(exact=True, eval_pts=EV_PTS))
cmp.add_aggregator("RRA", RRA.RRA(exact=False, eval_pts=EV_PTS))
cmp.add_aggregator("PrefRel", Weighted.PreferenceRelationsGraph(alpha=0.1, beta=0.5, eval_pts=EV_PTS))
cmp.add_aggregator("Agglomerative", Weighted.Agglomerative(c1=0.1, c2=0.2, eval_pts=EV_PTS))
cmp.add_aggregator("DIBRA", Weighted.DIBRA(aggregator='combsum:borda', gamma=1.2, prune=None, w_norm='minmax',
                                           eval_pts=EV_PTS))
cmp.add_aggregator("DIBRA-Prune", Weighted.DIBRA(aggregator='combsum:borda', gamma=1.2, prune='low', w_norm='minmax',
                                                 d1=0.3, d2=0.05, eval_pts=EV_PTS))
cmp.add_aggregator("DIBRA-Prune-WISE", Weighted.DIBRA(aggregator='combsum:borda', gamma=1.2, prune='wire', w_norm='minmax',
                                                 num_buckets=5, d1=0.5, d2=1.0, eval_pts=EV_PTS))

The aggregate() member function¶

After the Comparator class has been initialized and the algorithms to be evaluated have been determined, the aggregate() member function must be called to start the evaluation process. The aggregate() method accepts the following two arguments:

  • The input data file that contains the preference lists to be aggregated (in our case testdata.csv), and
  • The Rels file that contains relevance judgments for the elements of the preference lists (in our case testdata_qrels.csv). This is the ground truth file that will be used to evaluate the generated aggregate lists.

Again, please refer to this article for a detailed description of the format of the input and output files.

In [5]:
cmp.aggregate(input_file=lists, rels_file=qrels)
Running CombSUM-Rank ...
Running CombSUM-Borda ...
Running CombSUM-Score ...
Running CombMNZ-Rank ...
Running CombMNZ-Borda ...
Running CombMNZ-Score ...
Running Condorcet ...
Running Copeland ...
Running Outranking Approach ...
Running MC1 ...
Running MC2 ...
Running MC3 ...
Running MC4 ...
Running MCT ...
Running RRA-Exact ...
Running RRA ...
Running PrefRel ...
Running Agglomerative ...
Running DIBRA ...
Running DIBRA-Prune ...
Running DIBRA-Prune-WISE ...

The results Dataframe¶

The evaluation results are stored in the results member of Comparator. Each row in this Dataframe represents the performance of an algorithm for a particular query. There is also one additional row per method that records its average performance over all queries. In this example, we have $21$ rank aggregation methods and $20$ queries; consequently, the results Dataframe contains $21 \cdot (20+1) = 441$ rows.

The number of columns in the results Dataframe depends on the value of the cutoff point that we set during the construction of Comparator. In this example this value is $10$, so the Dataframe has $46$ columns:

  • 1 column that represents the query string,
  • 1 column that represents the length (i.e., the number of elements) of the aggregate list,
  • 1 column for the total number of relevant elements for this query,
  • 1 column for the number of relevant elements included in the aggregate list,
  • 1 column for the Average Precision of a method for this query,
  • 10 columns for Precision (at 10 points in the aggregate list),
  • 10 columns for Recall (at 10 points in the aggregate list),
  • 10 columns for DCG (at 10 points in the aggregate list),
  • 10 columns for nDCG (at 10 points in the aggregate list),
  • 1 column for the method's name.

Brief descriptions of the aforementioned evaluation measures are provided in the Appendix at the end of this notebook.
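The row and column counts stated above can be double-checked with a little arithmetic (a sanity check only; the variable names below are not part of the PyFLAGR API):

```python
# Sanity-check the shape of the results DataFrame described above.
n_methods, n_queries, cutoff = 21, 20, 10

# One row per (method, query) pair, plus one average row per method.
n_rows = n_methods * (n_queries + 1)

# Fixed columns: query string, aggregate list length, total relevant,
# relevant retrieved, Average Precision, method name = 6 columns;
# plus 4 metrics (P, R, DCG, nDCG) x 10 cutoff points each.
n_cols = 6 + 4 * cutoff

print(n_rows, n_cols)  # 441 46
```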

In [6]:
cmp.results
Out[6]:
q num_ret num_rel num_rel_ret Mean Average Precision (MAP) P_1 P_2 P_3 P_4 P_5 ... ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7 ndcg_cut_8 ndcg_cut_9 ndcg_cut_10 Method
0 Topic 1 100 48 48 0.534255 1.00 1.0 0.666667 0.50 0.40 ... 1.000000 0.765361 0.636682 0.553146 0.493523 0.539929 0.496846 0.532447 0.498572 CombSUM-Rank
1 Topic 2 100 46 46 0.539673 0.00 0.5 0.666667 0.50 0.40 ... 0.386853 0.530721 0.441492 0.383566 0.450011 0.500404 0.540269 0.572798 0.536356 CombSUM-Rank
2 Topic 3 100 40 40 0.442181 1.00 1.0 0.666667 0.50 0.40 ... 1.000000 0.765361 0.636682 0.553146 0.493523 0.448304 0.492326 0.528247 0.558260 CombSUM-Rank
3 Topic 4 100 40 40 0.427771 0.00 0.0 0.000000 0.25 0.20 ... 0.000000 0.000000 0.168128 0.146068 0.130324 0.210008 0.273045 0.253726 0.301204 CombSUM-Rank
4 Topic 5 100 54 54 0.656236 1.00 1.0 1.000000 1.00 1.00 ... 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 0.920205 0.855096 0.864315 CombSUM-Rank
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
16 Topic 17 99 48 47 0.598559 1.00 1.0 0.666667 0.50 0.60 ... 1.000000 0.765361 0.636682 0.684352 0.718375 0.744179 0.684798 0.707100 0.662114 DIBRA-Prune-WISE
17 Topic 18 100 39 39 0.507380 1.00 1.0 0.666667 0.75 0.80 ... 1.000000 0.765361 0.804810 0.830420 0.848699 0.770936 0.709420 0.659224 0.617284 DIBRA-Prune-WISE
18 Topic 19 100 45 45 0.461626 1.00 1.0 1.000000 1.00 0.80 ... 1.000000 1.000000 1.000000 0.868795 0.775148 0.704125 0.727734 0.676243 0.633220 DIBRA-Prune-WISE
19 Topic 20 100 45 45 0.533849 1.00 1.0 1.000000 1.00 0.80 ... 1.000000 1.000000 1.000000 0.868795 0.775148 0.704125 0.647940 0.602094 0.563788 DIBRA-Prune-WISE
20 all 1990 926 921 0.491976 0.55 0.5 0.516667 0.55 0.55 ... 0.511315 0.520392 0.542183 0.543208 0.533161 0.516379 0.511082 0.513836 0.506594 DIBRA-Prune-WISE

441 rows × 46 columns

Retrieving the evaluation results with get_results()¶

The get_results() method can be used to easily retrieve slices of the results Dataframe. In the following example, we get the mean values of MAP, Precision and nDCG for all queries, and for each method.

In [7]:
df = cmp.get_results(cutoff=5, metric=["map", "precision", "ndcg"], query='all')

print(df.shape)
df.style.format(precision=4)
(21, 11)
Out[7]:
  Mean Average Precision (MAP) P_1 P_2 P_3 P_4 P_5 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5
Method                      
CombSUM-Rank 0.4855 0.4500 0.4750 0.4167 0.4500 0.4400 0.4500 0.4693 0.4296 0.4498 0.4433
CombSUM-Borda 0.4836 0.5000 0.4750 0.4167 0.4250 0.4200 0.5000 0.4807 0.4383 0.4402 0.4350
CombSUM-Score 0.4854 0.4000 0.4750 0.4500 0.4625 0.4400 0.4000 0.4580 0.4444 0.4538 0.4401
CombMNZ-Rank 0.4853 0.5000 0.5000 0.4167 0.4375 0.4100 0.5000 0.5000 0.4413 0.4512 0.4314
CombMNZ-Borda 0.4849 0.5500 0.4500 0.4833 0.5000 0.4700 0.5500 0.4726 0.4908 0.5007 0.4810
CombMNZ-Score 0.4848 0.5000 0.5000 0.4167 0.4375 0.4100 0.5000 0.5000 0.4413 0.4512 0.4314
Condorcet 0.4801 0.5000 0.4750 0.4333 0.4125 0.4300 0.5000 0.4807 0.4500 0.4332 0.4420
Copeland 0.4820 0.5000 0.4500 0.4167 0.4000 0.4100 0.5000 0.4613 0.4352 0.4209 0.4247
Outranking Approach 0.4817 0.5000 0.4250 0.4333 0.4125 0.4400 0.5000 0.4420 0.4439 0.4281 0.4441
MC1 0.4876 0.6500 0.5750 0.5000 0.4750 0.4600 0.6500 0.5920 0.5352 0.5125 0.4977
MC2 0.4876 0.6500 0.5750 0.5000 0.4750 0.4600 0.6500 0.5920 0.5352 0.5125 0.4977
MC3 0.5057 0.5000 0.4750 0.5667 0.5250 0.5200 0.5000 0.4807 0.5439 0.5197 0.5171
MC4 0.4810 0.5000 0.5000 0.4167 0.4125 0.4200 0.5000 0.5000 0.4413 0.4344 0.4364
MCT 0.4813 0.4500 0.5000 0.4667 0.5000 0.4800 0.4500 0.4887 0.4679 0.4901 0.4783
RRA-Exact 0.4379 0.0500 0.1500 0.1833 0.2625 0.2800 0.5500 0.5887 0.5444 0.5369 0.5190
RRA 0.4906 0.5500 0.6250 0.5333 0.4875 0.4800 0.5500 0.6080 0.5475 0.5143 0.5058
PrefRel 0.4850 0.5500 0.5000 0.4667 0.4375 0.4400 0.5500 0.5113 0.4852 0.4625 0.4608
Agglomerative 0.2563 0.4000 0.4000 0.4000 0.4250 0.4700 0.4000 0.4000 0.4000 0.4168 0.4474
DIBRA 0.4919 0.5000 0.4750 0.5667 0.5625 0.5400 0.5000 0.4807 0.5439 0.5449 0.5324
DIBRA-Prune 0.5021 0.5500 0.5500 0.5500 0.5625 0.5900 0.5500 0.5500 0.5500 0.5584 0.5770
DIBRA-Prune-WISE 0.4920 0.5500 0.5000 0.5167 0.5500 0.5500 0.5500 0.5113 0.5204 0.5422 0.5432

Converting to LaTeX¶

The convert_to_latex() method can be used to convert the acquired results to a LaTeX tabular construct:

In [8]:
latex_code = cmp.convert_to_latex(dec_pts=4, cutoff=EV_PTS, metric=["map", "precision", "ndcg"], query='all')
# print(latex_code)
C:\Users\Leo\anaconda3\lib\site-packages\pyflagr\Comparator.py:118: FutureWarning: In future versions `DataFrame.to_latex` is expected to utilise the base implementation of `Styler.to_latex` for formatting and rendering. The arguments signature may therefore change. It is recommended instead to use `DataFrame.style.to_latex` which also contains additional functionality.
  return self.get_results(cutoff, metric, query).round(dec_pts).to_latex()

Plots: Mean Average Precision¶

There are two types of plots in Comparator. The first one creates a bar plot of the Mean Average Precision of all methods:

In [9]:
cmp.plot_average_precision((16, 7), True, query='all')
[Bar plot: Mean Average Precision of all methods]

Plots: Evaluation measures at specific cutoff points¶

The plot_metric() method produces plots of the values of a particular evaluation metric at specific cutoff points of the aggregate list. The argument metric determines the metric to be plotted; it may receive one of the following values:

  • precision
  • recall
  • dcg
  • ndcg
In [10]:
cmp.plot_metric(EV_PTS, metric='precision', plot_type='bar', dimensions=(16,8), show_grid=True, query='all')
[Bar plot: Precision at cutoff points 1-10 for all methods]

The plot_type parameter can be either bar, or line:

In [11]:
cmp.plot_metric(EV_PTS, metric='precision', plot_type='line', dimensions=(16,8), show_grid=True, query='all')
[Line plot: Precision at cutoff points 1-10 for all methods]

Appendix: Evaluation measures¶

$\text{Precision@}k$¶

Precision measures the ability of an algorithm to precisely detect the relevant elements. It is defined as the number of relevant elements found in the top $k$ positions of a list, divided by the number of retrieved elements (i.e., $k$):

$$\text{Precision@}k=\frac{\text{true positives}@k}{(\text{true positives}@k) + (\text{false positives}@k)}$$

$\text{Recall@}k$¶

Recall measures the ability of an algorithm to retrieve the relevant elements early. It is defined as the number of relevant elements found in the top $k$ positions of a list, divided by the total number of relevant elements:

$$\text{Recall@}k=\frac{\text{true positives}@k}{(\text{true positives}@k) + (\text{false negatives}@k)}$$

$F1@k$¶

$F1$ is a well-established measure that combines Precision and Recall into a single scoring formula:

$$F1@k=\frac{2 \cdot \text{Precision@}k \cdot \text{Recall@}k }{\text{Precision@}k + \text{Recall@}k}$$
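The three measures above can be sketched in a few lines of plain Python, using a binary relevance vector in which 1 marks a relevant element (these helper functions are illustrative, not part of PyFLAGR):

```python
# Precision@k, Recall@k and F1@k for a binary relevance vector (1 = relevant).

def precision_at_k(rel, k):
    """Relevant elements in the top k positions, divided by k."""
    return sum(rel[:k]) / k

def recall_at_k(rel, k):
    """Relevant elements in the top k positions, divided by all relevant."""
    return sum(rel[:k]) / sum(rel)

def f1_at_k(rel, k):
    """Harmonic mean of Precision@k and Recall@k."""
    p, r = precision_at_k(rel, k), recall_at_k(rel, k)
    return 0.0 if p + r == 0 else 2 * p * r / (p + r)

# An 8-element list where the 1st, 3rd, 4th and 6th elements are relevant.
rel = [1, 0, 1, 1, 0, 1, 0, 0]
print(round(precision_at_k(rel, 5), 2))  # 0.6
print(round(recall_at_k(rel, 5), 2))     # 0.75
print(round(f1_at_k(rel, 5), 2))         # 0.67
```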

Discounted Cumulative Gain ($DCG@k$)¶

$DCG$ is another measure for evaluating the performance of an algorithm. In contrast to the previous measures, this one can handle non-binary relevance judgments. In other words, the relevance score of an item may be a real value, and not just a relevant/non-relevant label. It is defined by the following formula:

$$DCG@k=\sum_{i=1}^{k}\frac{2^{ {rel}_i } - 1}{\log_2(i + 1)}$$

where ${rel}_i$ is the relevance score of the element at index $i$. For binary problems, we set ${rel}_i=1$ if the $i$-th list element is relevant and 0 otherwise.

Normalized Discounted Cumulative Gain ($nDCG@k$)¶

One disadvantage of $DCG$ is that it is non-decreasing; it either stays the same (if the current element is non-relevant), or it increases (if the current element is relevant). This means that queries that return larger result sets will probably always have higher DCG scores than queries that return small result sets.

The Normalized Discounted Cumulative Gain ($nDCG$) confronts this problem by dividing $DCG$ with the maximum possible DCG at each threshold $k$:

$$nDCG@k=\frac{DCG@k}{IDCG@k}$$

where $IDCG@k$ is the Ideal $DCG@k$. To compute it, we first create an ideal ranking, where the elements are ranked in decreasing relevance order. Then, $IDCG@k$ is simply equal to $DCG@k$ in that ideal ranking, namely:

$$IDCG@k=\sum_{i=1}^{\text{relevant items @}k}\frac{2^{ {rel}_i } - 1}{\log_2(i + 1)}$$
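The $DCG@k$ and $nDCG@k$ definitions above translate directly into plain Python (again, an illustrative sketch rather than PyFLAGR code):

```python
import math

def dcg_at_k(rels, k):
    """DCG@k with the (2^rel - 1) gain; rels lists relevance in rank order."""
    return sum((2 ** r - 1) / math.log2(i + 2) for i, r in enumerate(rels[:k]))

def ndcg_at_k(rels, k):
    """Divide DCG@k by the DCG@k of the ideal (decreasing-relevance) ranking."""
    idcg = dcg_at_k(sorted(rels, reverse=True), k)
    return 0.0 if idcg == 0 else dcg_at_k(rels, k) / idcg

# Binary relevance: the 1st, 3rd, 4th and 6th elements are relevant.
rel = [1, 0, 1, 1, 0, 1, 0, 0]
print(round(dcg_at_k(rel, 5), 2))   # 1.93
print(round(ndcg_at_k(rel, 5), 2))  # 0.75
```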

Average Precision ($AP$)¶

AP is another evaluation metric that quantifies the ability of an algorithm to rank the relevant elements in the highest list positions. It is defined by the following equation:

$$AP=\sum_{k}\left(\text{Recall@}k-\text{Recall@}(k-1)\right)\cdot\text{Precision@}k$$

Mean Average Precision (MAP)¶

Average Precision ($AP$) quantifies the quality of a single ranked list compared with the ground truth. In other words, $AP$ examines a single ranking that is generated in response to a single query.

In contrast, Mean Average Precision evaluates a ranking model over a set of queries $Q$. MAP is simply the mean of the Average Precision values over all queries: we sum the $AP_q$ value of each query $q$ in the dataset and divide the sum by the number of queries.

$$MAP=\frac{1}{|Q|}\sum_{q=1}^{|Q|}{AP}_q$$
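For binary relevance, $AP$ reduces to the mean of the Precision@$k$ values taken at the ranks $k$ of the relevant elements, and MAP averages this over queries. A minimal sketch (illustrative helper functions, not PyFLAGR code):

```python
def average_precision(rel):
    """AP of one binary ranking: mean of Precision@k over the relevant ranks k."""
    hits, precisions = 0, []
    for k, r in enumerate(rel, start=1):
        if r:
            hits += 1
            precisions.append(hits / k)
    return sum(precisions) / len(precisions) if precisions else 0.0

def mean_average_precision(rankings):
    """MAP: the mean of AP over the rankings produced for a set of queries."""
    return sum(average_precision(r) for r in rankings) / len(rankings)

# The 8-element example list: the 1st, 3rd, 4th and 6th elements are relevant.
rel = [1, 0, 1, 1, 0, 1, 0, 0]
print(round(average_precision(rel), 2))  # 0.77
```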

Example¶

Consider a ranked list including 8 elements that has been submitted as a response to a query. From these elements, the 1st, 3rd, 4th, and 6th are relevant to the query. The rest of the elements are considered as not relevant. The first two columns of the following table show the list and the relevance of its elements. The rest of the columns contain the running values of Precision, Recall, $F1$, $DCG$, $IDCG$, $nDCG$ and Average Precision ($AP$) at each list element.

Rank Relevant $\text{Precision}@k$ $\text{Recall}@k$ $F1@k$ $DCG@k$ $IDCG@k$ $nDCG@k$ $AP@k$
1 Yes $1.00$ $0.25$ $0.40$ $1.00$ $1.00$ $1.00$ $1.00$
2 No $0.50$ $0.25$ $0.33$ $1.00$ $1.63$ $0.61$ $1.00$
3 Yes $0.67$ $0.50$ $0.57$ $1.50$ $2.13$ $0.70$ $0.83$
4 Yes $0.75$ $0.75$ $0.75$ $1.93$ $2.56$ $0.75$ $0.81$
5 No $0.60$ $0.75$ $0.67$ $1.93$ $2.56$ $0.75$ $0.81$
6 Yes $0.67$ $1.00$ $0.80$ $2.29$ $2.56$ $0.89$ $0.77$
7 No $0.57$ $1.00$ $0.73$ $2.29$ $2.56$ $0.89$ $0.77$
8 No $0.50$ $1.00$ $0.67$ $2.29$ $2.56$ $0.89$ $0.77$

Example calculations at the 5th element of the list (@5)¶

According to the aforementioned definitions, the following calculations are performed:

$$\text{Precision@}5=\frac{\text{relevant elements found up to position 5}}{\text{retrieved elements up to position 5}}=\frac{3}{5}=0.60$$

$$\text{Recall@}5=\frac{\text{relevant elements found up to position 5}}{\text{all relevant elements}}=\frac{3}{4}=0.75$$

$$F1@5=\frac{2 \cdot \text{Precision@}5 \cdot \text{Recall@}5 }{\text{Precision@}5 + \text{Recall@}5}=\frac{2 \cdot 0.60 \cdot 0.75}{0.60+0.75}=0.67$$

$$DCG@5=\frac{2^1 - 1}{\log_2(1 + 1)}+\frac{2^0 - 1}{\log_2(2 + 1)}+\frac{2^1 - 1}{\log_2(3 + 1)}+\frac{2^1 - 1}{\log_2(4 + 1)}+\frac{2^0 - 1}{\log_2(5 + 1)}=1.93$$

$$IDCG@5=\frac{2^1 - 1}{\log_2(1 + 1)}+\frac{2^1 - 1}{\log_2(2 + 1)}+\frac{2^1 - 1}{\log_2(3 + 1)}+\frac{2^1 - 1}{\log_2(4 + 1)}+\frac{2^0 - 1}{\log_2(5 + 1)}=2.56$$

$$nDCG@5=\frac{DCG@5}{IDCG@5}=\frac{1.93}{2.56}=0.75$$

$$AP@5=\frac{1+0.67+0.75}{3}=0.81$$