Add ConsistentXLMModel (facebookresearch#913)

Summary: Pull Request resolved: facebookresearch#913

Add an XLM model that accepts two text columns (and no label columns) as input. The model will evaluate (soft) predictions on the reference text input and treat that as the target distribution for the text in the "tokens" text input. This can be used, for example, when the two text columns are translations of each other (possibly multi-tasked with a regular labeled task).

Reviewed By: rutyrinott
Differential Revision: D16786687
fbshipit-source-id: a62d3ec4c27cc7e891375d38459ba1621e5b9d9d
geof90 · Aug 17, 2019 · 90a00c3 · 90a00c3
1 parent e32c2a5
commit 90a00c3
Show file tree

Hide file tree

Showing 3 changed files with 19 additions and 4 deletions.
diff --git a/pytext/metric_reporters/__init__.py b/pytext/metric_reporters/__init__.py
@@ -9,7 +9,7 @@
 from .compositional_metric_reporter import CompositionalMetricReporter
 from .intent_slot_detection_metric_reporter import IntentSlotMetricReporter
 from .language_model_metric_reporter import LanguageModelMetricReporter
-from .metric_reporter import MetricReporter
+from .metric_reporter import MetricReporter, PureLossMetricReporter
 from .pairwise_ranking_metric_reporter import PairwiseRankingMetricReporter
 from .regression_metric_reporter import RegressionMetricReporter
 from .squad_metric_reporter import SquadMetricReporter
@@ -32,4 +32,5 @@
     "CompositionalMetricReporter",
     "PairwiseRankingMetricReporter",
     "SequenceTaggingMetricReporter",
+    "PureLossMetricReporter",
 ]
diff --git a/pytext/metric_reporters/metric_reporter.py b/pytext/metric_reporters/metric_reporter.py
@@ -11,6 +11,8 @@
 from pytext.utils import cuda
 from pytext.utils.meter import TimeMeter
 
+from .channel import ConsoleChannel
+
 
 class MetricReporter(Component):
     """
@@ -268,3 +270,14 @@ def compare_metric(self, new_metric, old_metric):
         if new == old:
             return False
         return (new < old) == self.lower_is_better
+
+
+class PureLossMetricReporter(MetricReporter):
+    lower_is_better = True
+
+    @classmethod
+    def from_config(cls, config, *args, **kwargs):
+        return cls([ConsoleChannel()], config.pep_format)
+
+    def calculate_metric(self):
+        return self.calculate_loss()
diff --git a/pytext/task/tasks.py b/pytext/task/tasks.py
@@ -28,6 +28,7 @@
     LanguageModelMetricReporter,
     MultiLabelClassificationMetricReporter,
     PairwiseRankingMetricReporter,
+    PureLossMetricReporter,
     RegressionMetricReporter,
     SequenceTaggingMetricReporter,
     SquadMetricReporter,
@@ -153,9 +154,9 @@ def format_prediction(cls, predictions, scores, context, target_meta):
 class DocumentClassificationTask(NewTask):
     class Config(NewTask.Config):
         model: BaseModel.Config = DocModel.Config()
-        metric_reporter: ClassificationMetricReporter.Config = (
-            ClassificationMetricReporter.Config()
-        )
+        metric_reporter: Union[
+            ClassificationMetricReporter.Config, PureLossMetricReporter.Config
+        ] = (ClassificationMetricReporter.Config())
         #   for multi-label classification task,
         #   choose MultiLabelClassificationMetricReporter