(Py)FLAGR¶

The fusion of multiple ranked lists of elements into a single aggregate list is a well-studied research field with numerous applications in Bioinformatics, recommendation systems, collaborative filtering, election systems and metasearch engines.

FLAGR is a high-performance, modular, open-source C++ library for rank aggregation problems. It implements baseline and recent state-of-the-art aggregation algorithms that accept multiple ranked preference lists and generate a single consensus list of elements. Several of these methods apply exploratory analysis techniques and belong to the broad family of unsupervised learning methods.

Installation¶

PyFLAGR is a Python library built on top of the FLAGR library core. It can be easily installed with pip:

pip install pyflagr

After installation, PyFLAGR can be used in standard Python programs and Jupyter notebooks. Representative code examples can be found in this notebook.

Downloads, Documentation, Version and License¶

  • The source code of FLAGR and PyFLAGR is available through the official GitHub repository.
  • The library is fully documented at https://flagr.site/.
  • The current (Py)FLAGR version is 1.0.18.
  • Both libraries are licensed under the Apache License, Version 2.0.

Importing and using PyFLAGR¶

PyFLAGR groups its supported rank aggregation methods into six modules:

  1. Linear: This module contains the CombSUM, CombMNZ, BordaCount and SimpleBordaCount classes. CombSUM and CombMNZ support five normalization methods (see Renda et al., 2003). BordaCount and SimpleBordaCount are wrappers around CombSUM with borda and simple-borda normalization, respectively.
  2. Majoritarian: Includes:
    • CondorcetWinners,
    • CopelandWinners and
    • OutrankingApproach (Farah and Vanderpooten, 2007).
  3. MarkovChains: Implements:
    • the four Markov Chains methods of Dwork et al., 2001 and
    • the MCT variant of DeConde et al., 2006.
  4. Kemeny: Includes KemenyOptimal (Kemeny Optimal Aggregation).
  5. RRA: Includes the RRA class (the Robust Rank Aggregation of Kolde et al., 2012, in two variants).
  6. Weighted: This module implements several self-weighting rank aggregation methods. These methods automatically identify the expert voters and include:
    • The Preference Relations Graph method of Desarkar et al., 2016.
    • The Agglomerative method of Chatterjee et al., 2018.
    • The Iterative, Distance-Based method (DIBRA) of Akritidis et al., 2022.

The following statements demonstrate the imports of all PyFLAGR rank aggregation modules in a typical Jupyter notebook.

In [1]:
# Import the PyFLAGR modules for rank aggregation
import pyflagr.Linear as Linear
import pyflagr.Majoritarian as Majoritarian
import pyflagr.MarkovChains as MarkovChains
import pyflagr.Kemeny as Kemeny
import pyflagr.RRA as RRA
import pyflagr.Weighted as Weighted
In [2]:
# Code snippet for displaying dataframes side by side
from IPython.display import display_html
from itertools import chain, cycle

def display_side_by_side(*args, titles=cycle([''])):
    html_str = ''
    for df, title in zip(args, chain(titles, cycle(['<br>']))):
        html_str += '<th style="text-align:center"><td style="vertical-align:top">'
        html_str += f'<h2 style="text-align: center;">{title}</h2>'
        html_str += df.to_html().replace('table', 'table style="display:inline"')
        html_str += '</td></th>'
    display_html(html_str, raw=True)

General Description¶

All PyFLAGR rank aggregation methods include:

  • a standard class constructor: the hyper-parameters of the rank aggregation algorithm, along with other execution parameters, can be passed through the constructor. All constructor arguments have default values and are therefore optional; every constructor can be called with no arguments at all.
  • an aggregate method that runs the algorithm on the selected input and (optionally) evaluates the generated aggregate list. In all algorithms, the aggregate method accepts the following arguments:
    • input_file (String; required unless input_df is set; default: empty string): A CSV file that contains the input lists to be aggregated.
    • input_df (Pandas DataFrame; required unless input_file is set; default: None): A Pandas DataFrame that contains the input lists to be aggregated. Note: if both input_file and input_df are set, only the former is used; the latter is ignored.
    • rels_file (String, optional; default: empty string): A CSV file that contains the relevance judgments of the involved list elements. If such a file is passed, FLAGR evaluates the generated aggregate list(s) by computing several retrieval effectiveness evaluation measures and stores the results in the eval_df DataFrame. Otherwise, no evaluation takes place and eval_df remains empty. Read more on the evaluation of rank aggregation quality.
    • rels_df (Pandas DataFrame, optional; default: None): A Pandas DataFrame that contains the relevance judgments of the involved list elements; it behaves exactly like rels_file. Note: if both rels_file and rels_df are set, only the former is used; the latter is ignored.
    • output_dir (String, optional; default: an OS-specific temporary directory): The directory where the output files (aggregate lists and evaluation) are stored. If it is not set, the default location is used.
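
As a minimal illustration of this pattern (the CSV path below is a placeholder):

import pyflagr.Linear as Linear

# Every constructor can be called without arguments, since all of its
# inputs fall back to their default values.
method = Linear.CombSUM()

# aggregate returns two DataFrames: the aggregate list and the evaluation.
# Without rels_file/rels_df, no evaluation takes place and df_eval is empty.
df_out, df_eval = method.aggregate(input_file='input_lists.csv')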

Input/Output files¶

A rank aggregation application involves a set of queries $Q=\{q_1,q_2,...,q_N\}$ and a set of rankers $R=\{r_1,r_2,...,r_m\}$. Each query $q\in{Q}$ is submitted to all rankers in $R$, each of which responds with a ranked list of preference items, sorted in decreasing order of importance or relevance. For example, in the context of recommendation systems, a set of users may be asked to enlist their preferences in response to the hypothetical query "which are your favorite games?". A rank aggregation algorithm must then merge all the submitted preference lists, discover any important latent information, and generate a single output list with improved element ordering.

For the requirements of this notebook, we use a sample dataset that was created by employing RASDaGen, a synthetic dataset generator for rank aggregation applications. The dataset includes two files: testdata.csv and testdata_qrels.csv.

The former contains preference lists that were submitted by 50 voters for 20 queries. Each input list contains 30 elements. Therefore, the number of rows in this file is equal to $50 \times 20 \times 30=30000$. The columns of this CSV file must be organized in the following manner:

Query, Voter Name, Item Code, Item Score, Algorithm/Dataset

where

  • Query represents the topic for which the preference list is submitted,
  • Voter Name is the name of the ranker who submitted a preference list for a particular Query,
  • Item Code is a unique name that identifies each element of the preference lists,
  • Item Score is the preference score assigned to an item by a Voter, and
  • Algorithm/Dataset is a user-defined string that represents the origin of a particular preference list.

The input CSV file must not contain a header row. On the other hand, testdata_qrels.csv contains relevance judgments for the preference list elements of the primary input file for each query. It is organized in the following fashion:

Query, 0, Item Code, Relevance

where:

  • Query represents the topic for which the preference list is submitted,
  • 0 is unused; this value must always be 0,
  • Item Code is a unique name that identifies each element of the preference lists, and
  • Relevance is an integer value that represents the relevance of the item with respect to the mentioned Query. Typically, zero values represent irrelevant and incorrect elements; negative values represent spam elements; and positive values represent relevant, correct and informative elements.

Please refer to this article for more details.
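
To make the expected layout concrete, the following sketch builds the two inputs in memory (the query, voter names, item codes, scores and relevance values are invented for illustration) and passes them to an aggregator through the input_df and rels_df arguments described in the General Description:

import pandas as pd
import pyflagr.Linear as Linear

# Input lists: Query, Voter Name, Item Code, Item Score, Algorithm/Dataset.
lists_df = pd.DataFrame([
    ['Q1', 'voter1', 'item_a', 0.9, 'demo'],
    ['Q1', 'voter1', 'item_b', 0.7, 'demo'],
    ['Q1', 'voter2', 'item_b', 0.8, 'demo'],
    ['Q1', 'voter2', 'item_a', 0.6, 'demo'],
    ['Q1', 'voter2', 'item_c', 0.2, 'demo'],
])

# Relevance judgments: Query, 0 (unused), Item Code, Relevance.
qrels_df = pd.DataFrame([
    ['Q1', 0, 'item_a', 1],
    ['Q1', 0, 'item_b', 1],
    ['Q1', 0, 'item_c', 0],
])

df_out, df_eval = Linear.CombSUM().aggregate(input_df=lists_df, rels_df=qrels_df)

Saving lists_df with to_csv(..., header=False, index=False) would produce a file in exactly the format expected by input_file.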

PyFLAGR Code examples¶

The following examples demonstrate the usage of all PyFLAGR rank aggregation methods.

Initially, we specify the two files that comprise our sample dataset: testdata.csv contains the input lists to be aggregated and testdata_qrels.csv stores relevance judgments about the elements of those input lists.

In [3]:
# The input data file with the input lists to be aggregated.
lists = '../testdata/testdata.csv'

# The input data file with the relevance judgments.
qrels = '../testdata/testdata_qrels.csv'

Linear combination methods¶

In linear combination methods, the score of each element is computed by summing its partial scores with respect to its rankings in the individual input preference lists. The Linear module implements two such combination methods, CombSUM and CombMNZ, in accordance with the following paper:

  • Renda E., Straccia U., "Web metasearch: rank vs. score based rank aggregation methods", In Proceedings of the 2003 ACM symposium on Applied computing, pp. 841-846, 2003.

Each method is accompanied by an element rank/score normalization technique, as described in the above paper. These techniques are: Rank normalization, Borda normalization, Score normalization and Z-Score normalization. FLAGR adds a fifth normalization technique, called Simple Borda. In contrast to the traditional Borda normalization, Simple Borda assigns a zero partial score to an element that is not ranked by an input preference list.
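
The following from-scratch sketch illustrates the underlying idea for the simple-borda case (an illustration only, not the PyFLAGR code path):

# CombSUM with simple-borda normalization, from scratch (illustration only).
# Each voter contributes a partial score of (n - rank) to every item it ranks;
# items missing from a list receive no contribution from that voter.
lists = [['a', 'b', 'c'], ['b', 'a', 'd']]
n = max(len(l) for l in lists)

scores = {}
for l in lists:
    for rank, item in enumerate(l):
        scores[item] = scores.get(item, 0) + (n - rank)

aggregate = sorted(scores, key=scores.get, reverse=True)
print(aggregate)  # ['a', 'b', 'c', 'd']  (a and b tie with a score of 5)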

CombSUM¶

Member of pyflagr.Linear.

Documentation: Linear Module.

The CombSUM constructor supports the following parameters:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
  • norm (String, optional; default: borda): The rank or score normalization method:
    • borda: The aggregation is performed by normalizing the element rankings according to the Borda normalization method. Equivalent to the BordaCount class.
    • rank: The aggregation is performed by normalizing the element rankings according to the Rank normalization method.
    • score: The aggregation is performed by normalizing the element scores according to the Score normalization method.
    • z-score: The aggregation is performed by normalizing the element scores according to the Z-Score normalization method.
    • simple-borda: Similar to borda normalization, but no partial score is assigned to an element that is not ranked by a voter.
In [4]:
csum = Linear.CombSUM(norm='rank', eval_pts=5)

# In this case, rels_file has been specified, so PyFLAGR returns two non-blank dataframes:
# * df_out contains the aggregate list produced by the selected algorithm
# * df_eval contains the effectiveness evaluation based on the relevance judgments in the rels_file
df_out, df_eval = csum.aggregate(input_file=lists, rels_file=qrels)

display_side_by_side(df_out.head(20), df_eval, titles=['Aggregate list', 'Evaluation'])

Aggregate list

Query Voter ItemID Rank Score Aggregator
0 1 PyFLAGR Q1-E39 1 13.466667 101
1 1 PyFLAGR Q1-E48 2 12.933333 101
2 1 PyFLAGR Q1-E23 3 11.933333 101
3 1 PyFLAGR Q1-E85 4 11.400000 101
4 1 PyFLAGR Q1-E95 5 11.366667 101
5 1 PyFLAGR Q1-E94 6 11.300000 101
6 1 PyFLAGR Q1-E33 7 11.000000 101
7 1 PyFLAGR Q1-E63 8 10.700000 101
8 1 PyFLAGR Q1-E100 9 10.666667 101
9 1 PyFLAGR Q1-E5 10 10.433333 101
10 1 PyFLAGR Q1-E43 11 10.300000 101
11 1 PyFLAGR Q1-E32 12 10.000000 101
12 1 PyFLAGR Q1-E35 13 9.933333 101
13 1 PyFLAGR Q1-E88 14 9.933333 101
14 1 PyFLAGR Q1-E16 15 9.666667 101
15 1 PyFLAGR Q1-E56 16 9.566667 101
16 1 PyFLAGR Q1-E84 17 9.533333 101
17 1 PyFLAGR Q1-E3 18 9.466667 101
18 1 PyFLAGR Q1-E89 19 9.400000 101
19 1 PyFLAGR Q1-E62 20 9.400000 101

Evaluation

q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 recall_1 recall_2 recall_3 recall_4 recall_5 dcg_cut_1 dcg_cut_2 dcg_cut_3 dcg_cut_4 dcg_cut_5 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5
0 Topic 1 100 48 48 0.534255 1.00 1.000 0.666667 0.50 0.40 0.020833 0.041667 0.041667 0.041667 0.041667 1.00 1.630930 1.630930 1.630930 1.630930 1.00 1.000000 0.765361 0.636682 0.553146
1 Topic 2 100 46 46 0.539673 0.00 0.500 0.666667 0.50 0.40 0.000000 0.021739 0.043478 0.043478 0.043478 0.00 0.630930 1.130930 1.130930 1.130930 0.00 0.386853 0.530721 0.441492 0.383566
2 Topic 3 100 40 40 0.442181 1.00 1.000 0.666667 0.50 0.40 0.025000 0.050000 0.050000 0.050000 0.050000 1.00 1.630930 1.630930 1.630930 1.630930 1.00 1.000000 0.765361 0.636682 0.553146
3 Topic 4 100 40 40 0.427771 0.00 0.000 0.000000 0.25 0.20 0.000000 0.000000 0.000000 0.025000 0.025000 0.00 0.000000 0.000000 0.430677 0.430677 0.00 0.000000 0.000000 0.168128 0.146068
4 Topic 5 100 54 54 0.656236 1.00 1.000 1.000000 1.00 1.00 0.018519 0.037037 0.055556 0.074074 0.092593 1.00 1.630930 2.130930 2.561606 2.948459 1.00 1.000000 1.000000 1.000000 1.000000
5 Topic 6 100 50 50 0.496233 0.00 0.500 0.333333 0.25 0.40 0.000000 0.020000 0.020000 0.020000 0.040000 0.00 0.630930 0.630930 0.630930 1.017783 0.00 0.386853 0.296082 0.246302 0.345191
6 Topic 7 100 48 48 0.413981 0.00 0.000 0.000000 0.00 0.20 0.000000 0.000000 0.000000 0.000000 0.020833 0.00 0.000000 0.000000 0.000000 0.386853 0.00 0.000000 0.000000 0.000000 0.131205
7 Topic 8 100 48 48 0.487902 1.00 0.500 0.666667 0.75 0.60 0.020833 0.020833 0.041667 0.062500 0.062500 1.00 1.000000 1.500000 1.930677 1.930677 1.00 0.613147 0.703918 0.753698 0.654809
8 Topic 9 100 48 48 0.415008 0.00 0.500 0.333333 0.50 0.40 0.000000 0.020833 0.020833 0.041667 0.041667 0.00 0.630930 0.630930 1.061606 1.061606 0.00 0.386853 0.296082 0.414430 0.360055
9 Topic 10 100 50 50 0.480995 0.00 0.500 0.333333 0.50 0.40 0.000000 0.020000 0.020000 0.040000 0.040000 0.00 0.630930 0.630930 1.061606 1.061606 0.00 0.386853 0.296082 0.414430 0.360055
10 Topic 11 100 51 51 0.536177 1.00 0.500 0.333333 0.50 0.60 0.019608 0.019608 0.019608 0.039216 0.058824 1.00 1.000000 1.000000 1.430677 1.817529 1.00 0.613147 0.469279 0.558508 0.616434
11 Topic 12 100 38 38 0.406823 1.00 0.500 0.333333 0.25 0.20 0.026316 0.026316 0.026316 0.026316 0.026316 1.00 1.000000 1.000000 1.000000 1.000000 1.00 0.613147 0.469279 0.390380 0.339160
12 Topic 13 100 43 43 0.487894 1.00 1.000 0.666667 0.50 0.40 0.023256 0.046512 0.046512 0.046512 0.046512 1.00 1.630930 1.630930 1.630930 1.630930 1.00 1.000000 0.765361 0.636682 0.553146
13 Topic 14 100 45 45 0.470907 0.00 0.000 0.000000 0.25 0.20 0.000000 0.000000 0.000000 0.022222 0.022222 0.00 0.000000 0.000000 0.430677 0.430677 0.00 0.000000 0.000000 0.168128 0.146068
14 Topic 15 100 48 48 0.420168 0.00 0.000 0.000000 0.00 0.20 0.000000 0.000000 0.000000 0.000000 0.020833 0.00 0.000000 0.000000 0.000000 0.386853 0.00 0.000000 0.000000 0.000000 0.131205
15 Topic 16 100 52 52 0.506824 0.00 0.000 0.333333 0.50 0.40 0.000000 0.000000 0.019231 0.038462 0.038462 0.00 0.000000 0.500000 0.930677 0.930677 0.00 0.000000 0.234639 0.363318 0.315648
16 Topic 17 100 48 48 0.557906 0.00 0.000 0.333333 0.25 0.40 0.000000 0.000000 0.020833 0.020833 0.041667 0.00 0.000000 0.500000 0.500000 0.886853 0.00 0.000000 0.234639 0.195190 0.300785
17 Topic 18 100 39 39 0.509445 1.00 1.000 0.666667 0.75 0.80 0.025641 0.051282 0.051282 0.076923 0.102564 1.00 1.630930 1.630930 2.061606 2.448459 1.00 1.000000 0.765361 0.804810 0.830420
18 Topic 19 100 45 45 0.426503 0.00 0.000 0.333333 0.50 0.40 0.000000 0.000000 0.022222 0.044444 0.044444 0.00 0.000000 0.500000 0.930677 0.930677 0.00 0.000000 0.234639 0.363318 0.315648
19 Topic 20 100 45 45 0.492781 1.00 1.000 0.666667 0.75 0.80 0.022222 0.044444 0.044444 0.066667 0.088889 1.00 1.630930 1.630930 2.061606 2.448459 1.00 1.000000 0.765361 0.804810 0.830420
20 all 2000 926 926 0.485483 0.45 0.475 0.416667 0.45 0.44 0.010111 0.021014 0.027182 0.038999 0.047423 0.45 0.765465 0.915465 1.152337 1.307078 0.45 0.469343 0.429608 0.449849 0.443309
In [5]:
csum = Linear.CombSUM(norm='score')

# In this case, rels_file has NOT been specified, so PyFLAGR returns two dataframes,
# * df_out contains the aggregate list produced by the selected algorithm
# * df_eval is blank
df_out, df_eval = csum.aggregate(input_file=lists)

display_side_by_side(df_out.head(20), df_eval, titles=['Aggregate list','Evaluation'])

Aggregate list

Query Voter ItemID Rank Score Aggregator
0 1 PyFLAGR Q1-E39 1 13.206937 102
1 1 PyFLAGR Q1-E48 2 12.517291 102
2 1 PyFLAGR Q1-E23 3 11.551781 102
3 1 PyFLAGR Q1-E95 4 11.137948 102
4 1 PyFLAGR Q1-E85 5 11.103479 102
5 1 PyFLAGR Q1-E94 6 10.965562 102
6 1 PyFLAGR Q1-E33 7 10.689677 102
7 1 PyFLAGR Q1-E63 8 10.379323 102
8 1 PyFLAGR Q1-E100 9 10.344844 102
9 1 PyFLAGR Q1-E5 10 10.241416 102
10 1 PyFLAGR Q1-E43 11 10.103458 102
11 1 PyFLAGR Q1-E88 12 9.689687 102
12 1 PyFLAGR Q1-E35 13 9.689687 102
13 1 PyFLAGR Q1-E32 14 9.620729 102
14 1 PyFLAGR Q1-E16 15 9.413802 102
15 1 PyFLAGR Q1-E56 16 9.379333 102
16 1 PyFLAGR Q1-E84 17 9.241396 102
17 1 PyFLAGR Q1-E3 18 9.206927 102
18 1 PyFLAGR Q1-E89 19 9.206917 102
19 1 PyFLAGR Q1-E62 20 9.103500 102

Evaluation

BordaCount and SimpleBordaCount¶

Member of pyflagr.Linear.

Documentation: Linear Module.

BordaCount is equivalent to CombSUM with borda normalization; likewise, SimpleBordaCount is equivalent to CombSUM with simple-borda normalization. Both constructors support the following parameter:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
In [6]:
borda = Linear.BordaCount(eval_pts=7)

df_out, df_eval = borda.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[6]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.48364 0.5 0.475 0.416667 0.425 0.42 ... 1.282464 1.496188 1.629522 0.5 0.480657 0.438268 0.44024 0.434961 0.45275 0.447917

1 rows × 33 columns

In [7]:
sborda = Linear.SimpleBordaCount(eval_pts=7)

df_out, df_eval = sborda.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[7]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.485026 0.55 0.5 0.466667 0.4375 0.44 ... 1.358739 1.608084 1.724751 0.55 0.511315 0.485196 0.462466 0.46083 0.48661 0.474093

1 rows × 33 columns

In [8]:
# Equivalent code for BordaCount: this cell produces the same results as cell [6] above
csum = Linear.CombSUM(norm='borda', eval_pts=7)

df_out, df_eval = csum.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[8]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.48364 0.5 0.475 0.416667 0.425 0.42 ... 1.282464 1.496188 1.629522 0.5 0.480657 0.438268 0.44024 0.434961 0.45275 0.447917

1 rows × 33 columns

CombMNZ¶

Member of pyflagr.Linear.

Documentation: Linear Module.

The CombMNZ constructor supports the following parameters:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
  • norm (String, optional; default: borda): The rank or score normalization method:
    • borda: The aggregation is performed by normalizing the element rankings according to the Borda normalization method.
    • rank: The aggregation is performed by normalizing the element rankings according to the Rank normalization method.
    • score: The aggregation is performed by normalizing the element scores according to the Score normalization method.
    • z-score: The aggregation is performed by normalizing the element scores according to the Z-Score normalization method.
    • simple-borda: Similar to borda normalization, but no partial score is assigned to an element that is not ranked by a voter.
In [9]:
cmnz = Linear.CombMNZ(norm='rank', eval_pts=7)

df_out, df_eval = cmnz.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[9]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.485262 0.5 0.5 0.416667 0.4375 0.41 ... 1.271859 1.503394 1.653394 0.5 0.5 0.44134 0.451202 0.431364 0.454931 0.454479

1 rows × 33 columns

Majoritarian methods¶

These methods are based on the majority criterion which, under several different formulations, identifies the "winning" elements. The module includes the three classes described below: CondorcetWinners, CopelandWinners and OutrankingApproach. Each class implements a different variant of the majority criterion.

CondorcetWinners¶

Member of pyflagr.Majoritarian.

In the Condorcet Winners method, the score of an element $r_i$ is determined by the number of its "victories" against all the other involved elements. A victory for $r_i$ is achieved if the majority of the voters rank $r_i$ higher than another element $r_j$.

Documentation: Majoritarian Module.

The CondorcetWinners constructor supports the following parameters:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
In [10]:
condorcet = Majoritarian.CondorcetWinners(eval_pts=7)

df_out, df_eval = condorcet.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[10]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 916 0.480078 0.5 0.475 0.433333 0.4125 0.43 ... 1.303082 1.534616 1.701283 0.5 0.480657 0.45 0.433187 0.441953 0.464379 0.467642

1 rows × 33 columns

CopelandWinners¶

Member of pyflagr.Majoritarian.

In Copeland Winners, the score of an element $r_i$ is determined by the number of its "victories" against all the other involved elements. A victory for $r_i$ is achieved if the majority of the voters rank $r_i$ higher than another element $r_j$. In contrast to the Condorcet method, Copeland Winners assigns "half" a victory (i.e., a score of 0.5) to each element of a pair $(r_i,r_j)$ in the case of a tie. A tie occurs when exactly half of the voters rank $r_i$ higher than $r_j$ and the other half rank $r_j$ higher than $r_i$.
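
A rough from-scratch sketch of this pairwise logic is shown below (an illustration, not the FLAGR implementation); dropping the tie branch yields the plain Condorcet scoring:

from itertools import combinations

# Pairwise-majority scoring in the spirit of Condorcet/Copeland winners.
# Assumes every item appears in every input list.
rankings = [['a', 'b', 'c'], ['b', 'a', 'c'], ['a', 'c', 'b']]
items = sorted({x for r in rankings for x in r})

score = {x: 0.0 for x in items}
for x, y in combinations(items, 2):
    wins_x = sum(r.index(x) < r.index(y) for r in rankings)
    wins_y = len(rankings) - wins_x
    if wins_x > wins_y:
        score[x] += 1
    elif wins_y > wins_x:
        score[y] += 1
    else:                 # exact tie: Copeland assigns half a victory to each
        score[x] += 0.5
        score[y] += 0.5

print(sorted(score, key=score.get, reverse=True))  # ['a', 'b', 'c']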

Documentation: Majoritarian Module.

The CopelandWinners constructor supports the following parameters:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
In [11]:
copeland = Majoritarian.CopelandWinners(eval_pts=7)

df_out, df_eval = copeland.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[11]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 922 0.481959 0.5 0.45 0.416667 0.4 0.41 ... 1.252192 1.483727 1.66706 0.5 0.461315 0.435196 0.420872 0.424694 0.448979 0.458235

1 rows × 33 columns

OutrankingApproach¶

Member of pyflagr.Majoritarian.

The Outranking Approach of Farah and Vanderpooten is a majoritarian method that identifies the "winning" elements by performing pairwise comparisons of their individual rankings. The method is implemented in accordance with the following paper:

  • Farah, M., Vanderpooten, D., "An outranking approach for rank aggregation in information retrieval", In Proceedings of the 30th ACM Conference on Research and Development in Information Retrieval, pp. 591-598, 2007.

The algorithm is based on four threshold values that introduce different perspectives of the majority criterion: the concordance, discordance, preference, and veto thresholds. The user may pass all of them to FLAGR as hyper-parameters, through the arguments of the OutrankingApproach constructor (see below).

Documentation: Majoritarian Module.

The OutrankingApproach constructor supports the following parameters:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
  • preference (Hyperparameter, Float, optional; default: 0): Preference threshold.
  • veto (Hyperparameter, Float, optional; default: 0.75): Veto threshold.
  • concordance (Hyperparameter, Float, optional; default: 0): Concordance threshold.
  • discordance (Hyperparameter, Float, optional; default: 0.25): Discordance threshold.
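
For instance, all four thresholds can be passed explicitly; the values below are arbitrary and serve only as an illustration:

outrank = Majoritarian.OutrankingApproach(
    preference=0.05,    # preference threshold
    veto=0.70,          # veto threshold
    concordance=0.10,   # concordance threshold
    discordance=0.30,   # discordance threshold
    eval_pts=7)

df_out, df_eval = outrank.aggregate(input_file=lists, rels_file=qrels)
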
In [12]:
outrank = Majoritarian.OutrankingApproach(eval_pts=7)

df_out, df_eval = outrank.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[12]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.481719 0.5 0.425 0.433333 0.4125 0.44 ... 1.309331 1.469624 1.636291 0.5 0.441972 0.443856 0.428076 0.444073 0.444712 0.449778

1 rows × 33 columns

Markov Chain methods¶

The Markov Chain methods constitute a well-established family of rank aggregation methods. They treat the list elements as the states of a system that moves from one state to another according to a particular criterion. Dwork et al. (2001) introduced four such methods in the following article:

  • C. Dwork, R. Kumar, M. Naor, D. Sivakumar, "Rank Aggregation Methods for the Web", In Proceedings of the 10th International Conference on World Wide Web, pp. 613-622, 2001.

In addition, DeConde et al. (2006) introduced MCT, a variant that constructs the transition matrix by considering the proportion of lists that prefer one element over another.

  • R.P. DeConde, S. Hawley, S. Falcon, N. Clegg, B. Knudsen, R. Etzioni, "Combining results of microarray experiments: a rank aggregation approach", Statistical Applications in Genetics and Molecular Biology, vol. 5, no. 1, 2006.
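
To give a feel for the general recipe, the following toy sketch (written from scratch, not taken from FLAGR) builds an MC4-style transition matrix from pairwise majorities, mixes in a uniform component for ergodicity (in the spirit of the ergodic_number hyper-parameter below), and power-iterates to the stationary distribution, which induces the final ranking:

import numpy as np

# MC4-style toy chain: from state i, pick a candidate state j uniformly and
# move there only if a majority of the voters rank j above i; otherwise stay.
rankings = [['a', 'b', 'c'], ['b', 'a', 'c'], ['a', 'c', 'b']]
items = sorted({x for r in rankings for x in r})
n = len(items)

P = np.zeros((n, n))
for i, x in enumerate(items):
    for j, y in enumerate(items):
        if i != j and sum(r.index(y) < r.index(x) for r in rankings) > len(rankings) / 2:
            P[i, j] = 1.0 / n
    P[i, i] = 1.0 - P[i].sum()   # stay put with the remaining probability mass

alpha = 0.15                     # uniform mixing, analogous to ergodic_number
P = (1 - alpha) * P + alpha / n

pi = np.full(n, 1.0 / n)         # power iteration to the stationary distribution
for _ in range(200):             # cf. max_iterations
    pi = pi @ P

print(sorted(items, key=lambda x: pi[items.index(x)], reverse=True))  # ['a', 'b', 'c']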

MC1, MC2, MC3, MC4, and MCT¶

Members of pyflagr.MarkovChains.

Documentation: MarkovChains Module.

The class constructors support the following parameters:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
  • ergodic_number (Hyperparameter, Float, optional; default: 0.15): The ergodic number.
  • max_iterations (Hyperparameter, Integer, optional; default: 200): The maximum number of iterations.
In [13]:
mch = MarkovChains.MC1(eval_pts=7, max_iterations=50)

df_out, df_eval = mch.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[13]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.487571 0.65 0.575 0.5 0.475 0.46 ... 1.467477 1.64558 1.79558 0.65 0.591972 0.535196 0.512466 0.49771 0.497957 0.493563

1 rows × 33 columns

In [14]:
mch = MarkovChains.MC2(eval_pts=7, max_iterations=50)

df_out, df_eval = mch.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[14]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.487571 0.65 0.575 0.5 0.475 0.46 ... 1.467477 1.64558 1.79558 0.65 0.591972 0.535196 0.512466 0.49771 0.497957 0.493563

1 rows × 33 columns

In [15]:
mch = MarkovChains.MC3(eval_pts=7, max_iterations=50)

df_out, df_eval = mch.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[15]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.505721 0.5 0.475 0.566667 0.525 0.52 ... 1.524615 1.73834 1.905006 0.5 0.480657 0.543856 0.51967 0.517089 0.526026 0.523641

1 rows × 33 columns

In [16]:
mch = MarkovChains.MC4(eval_pts=7, max_iterations=50)

df_out, df_eval = mch.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[16]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.481005 0.5 0.5 0.416667 0.4125 0.42 ... 1.286819 1.447112 1.630446 0.5 0.5 0.44134 0.43439 0.436438 0.4379 0.448171

1 rows × 33 columns

In [17]:
mch = MarkovChains.MCT(eval_pts=7, max_iterations=50)

df_out, df_eval = mch.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[17]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.481263 0.45 0.5 0.466667 0.5 0.48 ... 1.410158 1.570452 1.770452 0.45 0.488685 0.467876 0.49009 0.47827 0.475222 0.486655

1 rows × 33 columns

RRA: Robust Rank Aggregation¶

Robust Rank Aggregation (RRA) is mostly used in bioinformatics applications to aggregate gene lists. It is based on a probabilistic model (the beta distribution) that renders the algorithm parameter-free and robust to outliers, noise and errors. The method is implemented in accordance with the following paper:

  • R. Kolde, S. Laur, P. Adler, J. Vilo, "Robust rank aggregation for gene list integration and meta-analysis", Bioinformatics, vol. 28, no. 4, pp. 573-580, 2012.
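
The core probabilistic idea can be sketched in a few lines (an illustration under the stated assumptions, not FLAGR's implementation): under the null hypothesis, an item's normalized ranks across $m$ input lists behave like $m$ uniform samples, so the $k$-th smallest of them follows a $Beta(k, m-k+1)$ distribution; the item is then scored by the minimum of these order-statistic p-values.

from scipy.stats import beta

# Toy RRA-style score: the smaller the score, the more consistently the item
# is ranked near the top across the input lists.
def rra_score(norm_ranks):
    m = len(norm_ranks)
    r = sorted(norm_ranks)   # order statistics of the normalized ranks
    # P(k-th order statistic of m uniforms <= r[k]) = Beta(k+1, m-k).cdf(r[k])
    return min(beta.cdf(r[k], k + 1, m - k) for k in range(m))

# An item ranked near the top in 3 of 4 lists obtains a small (strong) score.
print(rra_score([0.05, 0.10, 0.15, 0.90]))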

Member of pyflagr.RRA.

Documentation: RRA Module.

The RRA constructor supports the following parameters:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
  • exact (Hyperparameter, Boolean, optional; default: False): Determines whether the exact p-value correction algorithm of Stuart will be applied.
In [18]:
robust = RRA.RRA(eval_pts=7, exact=True)

df_out, df_eval = robust.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[18]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 904 0.437941 0.05 0.15 0.183333 0.2625 0.28 ... 1.530184 1.690477 1.857144 0.55 0.588685 0.544412 0.536945 0.518977 0.511542 0.510485

1 rows × 33 columns

Weighted methods¶

The weighted rank aggregation methods employ exploratory analysis techniques to automatically identify the expert voters in an unsupervised fashion. They then assign higher weights to the voters identified as experts, thus boosting the scores of the elements those voters submitted.

FLAGR implements three such methods: Preference Relations Graph, Agglomerative and DIBRA.

PreferenceRelationsGraph¶

This method constructs a preference relations graph whose vertices are the individual elements and whose weighted edges encode the pairwise preference relations between them. It has been implemented in accordance with the following paper:

  • M.S. Desarkar, S. Sarkar, P. Mitra, "Preference relations based unsupervised rank aggregation for metasearch", Expert Systems with Applications, vol. 49, pp. 86-98, 2016.

Member of pyflagr.Weighted.

Documentation: Weighted Module.

The PreferenceRelationsGraph constructor supports the following parameters:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
  • alpha (Hyperparameter, Float, optional; default: 0.1): The $\alpha$ hyper-parameter of the algorithm.
  • beta (Hyperparameter, Float, optional; default: 0.5): The $\beta$ hyper-parameter of the algorithm.
In [19]:
prf_graph = Weighted.PreferenceRelationsGraph(alpha=0.1, beta=0.5, eval_pts=7)

df_out, df_eval = prf_graph.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[19]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.485022 0.55 0.5 0.466667 0.4375 0.44 ... 1.358739 1.608084 1.724751 0.55 0.511315 0.485196 0.462466 0.46083 0.48661 0.474093

1 rows × 33 columns

Agglomerative¶

This method works much like the well-established agglomerative clustering algorithm. Specifically, it repeatedly merges the two most similar input lists into a temporary aggregate list. During list merging, it modifies the weights of the respective voters, thus affecting future merges. It has been implemented in accordance with the following paper:

  • S. Chatterjee, A. Mukhopadhyay, M. Bhattacharyya, "A weighted rank aggregation approach towards crowd opinion analysis", Knowledge-Based Systems, vol. 149, pp. 47-60, 2018.

Member of pyflagr.Weighted.

Documentation: Weighted Module.

The Agglomerative constructor supports the following parameters:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
  • c1 (Hyperparameter, Float, optional; default: 2.5): The $c_1$ hyper-parameter of the algorithm.
  • c2 (Hyperparameter, Float, optional; default: 1.5): The $c_2$ hyper-parameter of the algorithm.
In [20]:
agg = Weighted.Agglomerative(c1=0.1, c2=0.2, eval_pts=7)

df_out, df_eval = agg.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[20]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 456 0.256305 0.4 0.4 0.4 0.425 0.47 ... 1.319165 1.461647 1.694981 0.4 0.4 0.4 0.416813 0.447408 0.442298 0.46591

1 rows × 33 columns

DIBRA: Iterative Distance-Based Aggregation¶

DIBRA first employs a standard non-weighted method to generate an initial aggregate ranking (see the aggregator parameter in the following table for the list of supported non-weighted methods). Subsequently, it iteratively assigns higher weights to the input lists that have smaller distances from the current aggregate list. The process terminates when the voter weights converge and a stable aggregate list is obtained.

The algorithm also includes an optional list pruning mechanism that adjusts the input list lengths according to the respective voter weights. DIBRA has been implemented in accordance with the following paper:

  • L. Akritidis, A. Fevgas, P. Bozanis, Y. Manolopoulos, "An Unsupervised Distance-Based Model for Weighted Rank Aggregation with List Pruning", Expert Systems with Applications, vol. 202, article 117435, 2022.
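
The iterative weighting loop can be illustrated with a small from-scratch sketch; the Borda encoding, cosine similarity and additive update below are simplifying assumptions for illustration, not DIBRA's exact update rule:

import numpy as np

# Toy DIBRA-style loop: lists are encoded as Borda score vectors; voters whose
# lists stay close to the current weighted aggregate earn larger weights.
rankings = [['a', 'b', 'c', 'd'], ['a', 'c', 'b', 'd'], ['d', 'c', 'b', 'a']]
items = sorted({x for r in rankings for x in r})
V = np.array([[len(r) - r.index(x) for x in items] for r in rankings], dtype=float)

w = np.ones(len(rankings))
for _ in range(50):                            # cf. max_iter
    agg = w @ V                                # weighted CombSUM-style aggregate
    sims = V @ agg / (np.linalg.norm(V, axis=1) * np.linalg.norm(agg))
    new_w = 1.0 + sims                         # closer lists earn larger weights
    if np.max(np.abs(new_w - w)) < 0.01:       # cf. tol: weights have converged
        w = new_w
        break
    w = new_w

print(np.round(w, 3))  # the dissenting third voter ends up with the smallest weight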

Member of pyflagr.Weighted.

Documentation: Weighted Module.

The DIBRA constructor supports the following parameters:

  • eval_pts (Integer, optional; default: 10): Determines the elements in the aggregate list on which the evaluation measures (i.e., Precision and nDCG) are computed. For example, for eval_pts=10, FLAGR computes $P@1, P@2, ..., P@10$ and $N@1, N@2, ..., N@10$. Considered only if rels_file or rels_df is set.
  • aggregator (Hyperparameter, String, optional; default: combsum:borda): The baseline aggregation method. An extended weighted variant of the baseline method is applied internally by plugging in the computed voter weights. The list of supported values includes:
    • combsum:borda: CombSUM with Borda rank normalization.
    • combsum:rank: CombSUM with rankings normalization.
    • combsum:score: CombSUM with score min-max normalization.
    • combsum:z-score: CombSUM with score z-normalization.
    • combsum:simple-borda: CombSUM with simple Borda normalization.
    • combmnz:borda: CombMNZ with Borda rank normalization.
    • combmnz:rank: CombMNZ with rankings normalization.
    • combmnz:score: CombMNZ with score min-max normalization.
    • combmnz:z-score: CombMNZ with score z-normalization.
    • combmnz:simple-borda: CombMNZ with simple Borda normalization.
    • condorcet: The Condorcet Winners method.
    • copeland: The Copeland Winners method.
    • outrank: The Outranking Approach.
  • w_norm (Hyperparameter, String, optional; default: minmax): The voter weight normalization method. The list of supported values includes:
    • none: The voter weights will not be normalized.
    • minmax: The voter weights will be normalized with min-max scaling.
    • z: The voter weights will be z-normalized.
  • dist (Hyperparameter, String, optional; default: cosine): The metric used to measure the distance between an input list and the temporary aggregate list. The list of supported values includes:
    • rho: Spearman's $\rho$ correlation coefficient.
    • cosine: The cosine similarity of the lists' vector representations.
    • tau: Kendall's $\tau$ correlation coefficient.
    • footrule: A scaled variant of Spearman's Footrule distance.
  • gamma (Hyperparameter, Float, optional; default: 1.50): The $\gamma$ hyper-parameter that determines the step length of the weight learning process.
  • prune (Hyperparameter, String, optional; default: None): Triggers a weight-dependent list pruning mechanism. The list of supported values includes:
    • None: No pruning takes place (i.e., all list elements are preserved).
    • low: The list pruning method of Akritidis et al., 2022.
    • wire: The item selection method of Akritidis and Bozanis, 2025.
  • num_buckets (Hyperparameter, Integer, optional; default: 3): The number of voter buckets, used in the list pruning method of Akritidis and Bozanis, 2025. Applies only if prune='wire'.
  • d1 (Hyperparameter, Float, optional; default: 0.4): The hyper-parameter $\delta_1$ of the weight-dependent list pruning mechanism. Applies only if prune is not None.
  • d2 (Hyperparameter, Float, optional; default: 0.1): The hyper-parameter $\delta_2$ of the weight-dependent list pruning mechanism. Applies only if prune is not None.
  • tol (Hyperparameter, Float, optional; default: 0.01): Controls the convergence precision. DIBRA stops when the difference between a voter's weight in two successive iterations falls below this threshold.
  • max_iter (Hyperparameter, Integer, optional; default: 50): Controls the maximum number of iterations. FLAGR stops the execution of DIBRA when this number of iterations has been performed, even if the voter weights have not fully converged.
  • pref (Hyperparameter, Float, optional; default: 0): Preference threshold. Applies only if aggregator=outrank.
  • veto (Hyperparameter, Float, optional; default: 0.75): Veto threshold. Applies only if aggregator=outrank.
  • conc (Hyperparameter, Float, optional; default: 0): Concordance threshold. Applies only if aggregator=outrank.
  • disc (Hyperparameter, Float, optional; default: 0.25): Discordance threshold. Applies only if aggregator=outrank.
In [21]:
method_1 = Weighted.DIBRA(aggregator='outrank', eval_pts=7)

df_out, df_eval = method_1.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[21]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 2000 926 926 0.493753 0.55 0.525 0.533333 0.5 0.47 ... 1.448134 1.590617 1.77395 0.55 0.530657 0.535196 0.512466 0.491149 0.481324 0.487617

1 rows × 33 columns

In [22]:
method_2 = Weighted.DIBRA(eval_pts=7, gamma=1.5, prune='low', d1=0.3, d2=0.05)

df_out, df_eval = method_2.aggregate(input_file=lists, rels_file=qrels)
df_eval.tail(1)
Out[22]:
q num_ret num_rel num_rel_ret map P_1 P_2 P_3 P_4 P_5 ... dcg_cut_5 dcg_cut_6 dcg_cut_7 ndcg_cut_1 ndcg_cut_2 ndcg_cut_3 ndcg_cut_4 ndcg_cut_5 ndcg_cut_6 ndcg_cut_7
20 all 1986 926 922 0.502947 0.55 0.55 0.583333 0.5875 0.61 ... 1.751214 1.929318 2.045985 0.55 0.55 0.573464 0.577925 0.593942 0.583816 0.562393

1 rows × 33 columns
