argilla-io · davidberenstein1957 · Nov 26, 2023 · Nov 21, 2023 · Nov 21, 2023 · Nov 22, 2023
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -28,6 +28,7 @@ These are the section headers that we use:
 - Fixed error in `ArgillaTrainer`, with numerical labels, using `RatingQuestion` instead of `RankingQuestion` ([#4171](https://github.com/argilla-io/argilla/pull/4171))
 - Fixed error in `ArgillaTrainer`, now we can train for `extractive_question_answering` using a validation sample ([#4204](https://github.com/argilla-io/argilla/pull/4204))
 - Fixed error in `ArgillaTrainer`, when training for `sentence-similarity` it didn't work with a list of values per record ([#4211](https://github.com/argilla-io/argilla/pull/4211))
+- Fixed error in the unification strategy for `RankingQuestion` ([#4295](https://github.com/argilla-io/argilla/pull/4295))
 
 ### Changed
 

diff --git a/src/argilla/client/feedback/unification.py b/src/argilla/client/feedback/unification.py
@@ -45,7 +45,9 @@ class UnifiedValueSchema(ValueSchema):
         >>> value = {"value": "Yes", "strategy": "majority"}
     """
 
-    strategy: Union["RatingQuestionStrategy", "LabelQuestionStrategy", "MultiLabelQuestionStrategy"]
+    strategy: Union[
+        "RatingQuestionStrategy", "LabelQuestionStrategy", "MultiLabelQuestionStrategy", "RankingQuestionStrategy"
+    ]
 
 
 class RatingQuestionStrategyMixin:
@@ -202,13 +204,11 @@ def unify_responses(self, records: List[FeedbackRecord], question: str):
 class RankingQuestionStrategy(RatingQuestionStrategyMixin, Enum):
     """
     Options:
-        - "mean": the mean value of the rankings
         - "majority": the majority value of the rankings
         - "max": the max value of the rankings
         - "min": the min value of the rankings
     """
 
-    MEAN: str = "mean"
     MAJORITY: str = "majority"
     MAX: str = "max"
     MIN: str = "min"
@@ -238,29 +238,36 @@ def _aggregate(self, records: List[FeedbackRecord], question: str):
             # only allow for submitted responses
             responses = [resp for resp in rec.responses if resp.status == "submitted"]
             # get responses with a value that is most frequent
-            ratings = []
+            total_values = []
+            total_ranks = []
             for resp in responses:
                 if question in resp.values:
+                    values = []
+                    ranks = []
                     for value in resp.values[question].value:
-                        ratings.append([value.value, value.rank])
-            if not ratings:
+                        values.append(value.value)
+                        ranks.append(value.rank)
+
+                    total_values.append(tuple(values))
+                    total_ranks.append(tuple(ranks))
+
+            if not total_values:
                 continue
-            df = pd.DataFrame(ratings, columns=["value", "rank"])
+            df = pd.DataFrame({"value": total_values, "rank": total_ranks})
+
             # unified response
-            if self.value == self.MEAN.value:
-                df = df.groupby("value", sort=False).mean().reset_index()
-                df = df.sort_values(by="rank", ascending=True)
-            elif self.value == self.MAX.value:
-                df = df.groupby("value", sort=False).min().reset_index()  # inverse due to higher rank better
-                df = df.sort_values(by="rank", ascending=True)
+            if self.value == self.MAX.value:
+                df = df[df["rank"] == df["rank"].max()]
             elif self.value == self.MIN.value:
-                df = df.groupby("value", sort=False).max().reset_index()  # inverse due to higher rank better
+                df = df[df["rank"] == df["rank"].min()]
             else:
                 raise ValueError("Invalid aggregation method")
-            options = df["value"].tolist()
-            if options:
-                unified_value = options[0]
-                rec._unified_responses[question] = [UnifiedValueSchema(value=unified_value, strategy=self.value)]
+
+            if len(df) > 0:
+                # Extract the first of the possible values (in case there is more than one).
+                unified_rank = [{"rank": item[1], "value": item[0]} for item in zip(*df.iloc[0].to_list())]
+                rec._unified_responses[question] = [UnifiedValueSchema(value=unified_rank, strategy=self.value)]
+
         return records
 
     def _majority(self, records: List[FeedbackRecord], question: str):
@@ -288,21 +295,30 @@ def _majority(self, records: List[FeedbackRecord], question: str):
             # only allow for submitted responses
             responses = [resp for resp in rec.responses if resp.status == "submitted"]
             # get responses with a value that is most frequent
+            ranks = []
             for resp in responses:
                 if question in resp.values:
+                    rank_per_response = []
                     for value in resp.values[question].value:
-                        counter.update([value.value] * value.rank)
+                        rank_per_response.append((value.rank, value.value))
+                    ranks.append(tuple(rank_per_response))
+
+            counter.update(ranks)
             if not counter.values():
                 continue
-            # Find the minimum count
-            min_count = min(counter.values())
-            # Get a list of values with the minimum count
-            least_common_values = [value for value, count in counter.items() if count == min_count]
-            if len(least_common_values) > 1:
-                majority_value = random.choice(least_common_values)
+            # Find the maximum count
+            max_count = max(counter.values())
+            # Get a list of values with the maximum count
+            most_common_values = [value for value, count in counter.items() if count == max_count]
+            if len(most_common_values) > 1:
+                majority_value = random.choice(most_common_values)
             else:
-                majority_value = counter.most_common()[-1][0]
-            rec._unified_responses[question] = [UnifiedValueSchema(value=majority_value, strategy=self.value)]
+                majority_value = counter.most_common()[0][0]
+
+            # Recreate the final ranking
+            majority_rank = [{"rank": item[0], "value": item[1]} for item in majority_value]
+            rec._unified_responses[question] = [UnifiedValueSchema(value=majority_rank, strategy=self.value)]
+
         return records
 
 

diff --git a/tests/integration/client/feedback/test_unification.py b/tests/integration/client/feedback/test_unification.py
@@ -70,10 +70,9 @@ def test_rating_question_strategy(strategy, unified_response):
 @pytest.mark.parametrize(
     "strategy, unified_response",
     [
-        ("mean", [{"value": "yes", "strategy": "mean"}]),
-        ("majority", [{"value": "yes", "strategy": "majority"}]),
-        ("max", [{"value": "no", "strategy": "max"}]),
-        ("min", [{"value": "yes", "strategy": "min"}]),
+        ("majority", [{"value": [{"rank": 2, "value": "yes"}, {"rank": 3, "value": "no"}], "strategy": "majority"}]),
+        ("max", [{"value": [{"rank": 2, "value": "yes"}, {"rank": 3, "value": "no"}], "strategy": "max"}]),
+        ("min", [{"value": [{"rank": 2, "value": "yes"}, {"rank": 1, "value": "no"}], "strategy": "min"}]),
     ],
 )
 def test_ranking_question_strategy(strategy, unified_response):