def _tuples_to_df()

in sourcecode/scoring/post_selection_similarity_old.py [0:0]


def _tuples_to_df(tuples, name="pairRatings"):
  leftRater, rightRater, tweetId = zip(*tuples)
  df = pd.DataFrame(
    {
      "leftRaterId": np.array(leftRater),
      "rightRaterId": np.array(rightRater),
      "tweetId": np.array(tweetId),
    }
  )
  print(len(df))
  df = df.drop_duplicates()
  print(len(df))
  df = (
    df.groupby(["leftRaterId", "rightRaterId"])
    .count()
    .reset_index(drop=False)
    .rename(columns={"tweetId": name})
  )
  print(len(df))
  return df