in sourcecode/scoring/post_selection_similarity_old.py [0:0]
def _tuples_to_df(tuples, name="pairRatings"):
    """Aggregate (leftRater, rightRater, tweetId) triples into per-pair counts.

    Exact duplicate triples are dropped first, so each tweetId contributes at
    most once to a given (leftRaterId, rightRaterId) pair.

    Args:
      tuples: iterable of 3-item sequences ``(leftRater, rightRater, tweetId)``.
        May be empty.
      name: label for the output column holding the per-pair count.

    Returns:
      pd.DataFrame with columns ``leftRaterId``, ``rightRaterId`` and ``name``,
      one row per distinct rater pair.  For empty input the frame has those
      three columns and zero rows.

    Raises:
      ValueError: if the (non-empty) input does not transpose into exactly
        three columns, i.e. the items are not 3-item sequences.
    """
    # Transpose once.  An empty input transposes to an empty tuple, which would
    # otherwise make the three-way unpacking below fail with a ValueError.
    columns = tuple(zip(*tuples))
    if not columns:
        return pd.DataFrame(columns=["leftRaterId", "rightRaterId", name])
    leftRater, rightRater, tweetId = columns
    df = pd.DataFrame(
        {
            "leftRaterId": np.array(leftRater),
            "rightRaterId": np.array(rightRater),
            "tweetId": np.array(tweetId),
        }
    )
    # Row count of the raw triples.
    print(len(df))
    # Remove repeated triples so a tweet is not counted twice for one pair.
    df = df.drop_duplicates()
    # Row count after de-duplication.
    print(len(df))
    # Count the remaining tweetId values for every rater pair and expose the
    # count under the caller-supplied column name.
    df = (
        df.groupby(["leftRaterId", "rightRaterId"])
        .count()
        .reset_index(drop=False)
        .rename(columns={"tweetId": name})
    )
    # Number of distinct rater pairs.
    print(len(df))
    return df