robinzixuan committed
Commit 64f43b6
1 Parent(s): e20d3f0
Update configuration_opt.py
Files changed: configuration_opt.py +3 -0
configuration_opt.py
CHANGED
@@ -20,6 +20,8 @@ from ...utils import logging
 
 logger = logging.get_logger(__name__)
 
+OPTConfig.register_for_auto_class()
+
 
 class OPTConfig(PretrainedConfig):
     r"""
@@ -51,6 +53,7 @@ class OPTConfig(PretrainedConfig):
             The maximum sequence length that this model might ever be used with. Typically set this to something large
             just in case (e.g., 512 or 1024 or 2048).
         do_layer_norm_before (`bool`, *optional*, defaults to `True`):
+
             Whether to perform layer normalization before the attention block.
         word_embed_proj_dim (`int`, *optional*):
            `word_embed_proj_dim` can be set to down-project word embeddings, *e.g.* `opt-350m`. Defaults to
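The added OPTConfig.register_for_auto_class() call tags the custom config class for AutoConfig, so that a checkpoint saved with this config records an auto_map entry pointing back at configuration_opt.py. A minimal usage sketch follows, assuming the updated file is shipped in a Hub repo next to its weights; the repo id "your-namespace/your-opt-repo" is a hypothetical placeholder, not a repo named in this commit.

from transformers import AutoConfig

# Hypothetical repo id -- replace with the repo that actually hosts this
# configuration_opt.py alongside its checkpoint.
repo_id = "your-namespace/your-opt-repo"

# trust_remote_code=True is required so AutoConfig may import the repo's
# configuration_opt.py and resolve the auto_map entry that
# register_for_auto_class() caused to be written into config.json.
config = AutoConfig.from_pretrained(repo_id, trust_remote_code=True)
print(type(config).__name__)  # the custom OPTConfig class loaded from the repo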