Update configuration_baichuan.py (#4) by wangvince - opened
configuration_baichuan.py
CHANGED
@@ -46,6 +46,7 @@ class BaichuanConfig(PretrainedConfig):
|
|
46 |
bos_token_id=1,
|
47 |
eos_token_id=2,
|
48 |
tie_word_embeddings=False,
|
|
|
49 |
**kwargs,
|
50 |
):
|
51 |
self.vocab_size = vocab_size
|
@@ -58,6 +59,7 @@ class BaichuanConfig(PretrainedConfig):
|
|
58 |
self.initializer_range = initializer_range
|
59 |
self.rms_norm_eps = rms_norm_eps
|
60 |
self.use_cache = use_cache
|
|
|
61 |
super().__init__(
|
62 |
pad_token_id=pad_token_id,
|
63 |
bos_token_id=bos_token_id,
|
|
|
46 |
bos_token_id=1,
|
47 |
eos_token_id=2,
|
48 |
tie_word_embeddings=False,
|
49 |
+
z_loss_weight=0,
|
50 |
**kwargs,
|
51 |
):
|
52 |
self.vocab_size = vocab_size
|
|
|
59 |
self.initializer_range = initializer_range
|
60 |
self.rms_norm_eps = rms_norm_eps
|
61 |
self.use_cache = use_cache
|
62 |
+
self.z_loss_weight = z_loss_weight
|
63 |
super().__init__(
|
64 |
pad_token_id=pad_token_id,
|
65 |
bos_token_id=bos_token_id,
|