minimaxir · MohamedAliRashad · May 22, 2021 · May 28, 2021 · May 28, 2021
diff --git a/README.md b/README.md
@@ -1,5 +1,7 @@
 # aitextgen
 
+[![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/MohamedAliRashad/aitextgen/blob/colab-tutorial/train_aitextgen.ipynb)
+
 A robust Python tool for text-based AI training and generation using [OpenAI's](https://openai.com) [GPT-2](https://openai.com/blog/better-language-models/) and [EleutherAI's](https://www.eleuther.ai) [GPT Neo/GPT-3](https://github.com/EleutherAI/gpt-neo) architecture.
 
 aitextgen is a Python package that leverages [PyTorch](https://pytorch.org), [Hugging Face Transformers](https://github.com/huggingface/transformers) and [pytorch-lightning](https://github.com/PyTorchLightning/pytorch-lightning) with specific optimizations for text generation using GPT-2, plus _many_ added features. It is the successor to [textgenrnn](https://github.com/minimaxir/textgenrnn) and [gpt-2-simple](https://github.com/minimaxir/gpt-2-simple), taking the best of both packages:

diff --git a/aitextgen/aitextgen.py b/aitextgen/aitextgen.py
@@ -72,6 +72,7 @@ class aitextgen:
     tokenizer = None
     vocab_file = os.path.join(STATIC_PATH, "gpt2_vocab.json")
     merges_file = os.path.join(STATIC_PATH, "gpt2_merges.txt")
+    models = ["124M", "355M", "774M", "1558M"]
     bos_token = "<|endoftext|>"
     eos_token = "<|endoftext|>"
     unk_token = "<|endoftext|>"
@@ -123,12 +124,7 @@ def __init__(
             if not os.path.isfile(
                 os.path.join(cache_dir, f"pytorch_model_{tf_gpt2}.bin")
             ):
-                assert tf_gpt2 in [
-                    "124M",
-                    "355M",
-                    "774M",
-                    "1558M",
-                ], "Invalid TensorFlow GPT-2 model size."
+                assert tf_gpt2 in self.models, "Invalid TensorFlow GPT-2 model size."
 
                 logger.info(
                     f"Downloading the {tf_gpt2} GPT-2 TensorFlow weights/config "
@@ -863,3 +859,6 @@ def __repr__(self) -> str:
         num_params_m = int(sum(p.numel() for p in self.model.parameters()) / 10 ** 6)
         model_name = type(self.model.config).__name__.replace("Config", "")
         return f"{model_name} loaded with {num_params_m}M parameters."
+
+    def list_models(self) -> None:  # returns nothing; output goes to stdout
+        print("\n".join(self.models))  # one entry of self.models per line