Joe99 committed on
Commit
2f2094a
1 Parent(s): 611782c

gpt2cleaner v2

Browse files
Files changed (3) hide show
  1. README.md +1 -17
  2. adapter_config.json +3 -0
  3. adapter_model.safetensors +1 -1
README.md CHANGED
@@ -198,22 +198,6 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
198
  [More Information Needed]
199
 
200
 
201
- ## Training procedure
202
-
203
-
204
- The following `bitsandbytes` quantization config was used during training:
205
- - quant_method: bitsandbytes
206
- - load_in_8bit: False
207
- - load_in_4bit: True
208
- - llm_int8_threshold: 6.0
209
- - llm_int8_skip_modules: None
210
- - llm_int8_enable_fp32_cpu_offload: False
211
- - llm_int8_has_fp16_weight: False
212
- - bnb_4bit_quant_type: nf4
213
- - bnb_4bit_use_double_quant: False
214
- - bnb_4bit_compute_dtype: float16
215
-
216
  ### Framework versions
217
 
218
-
219
- - PEFT 0.6.3.dev0
 
198
  [More Information Needed]
199
 
200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
201
  ### Framework versions
202
 
203
+ - PEFT 0.7.1.dev0
 
adapter_config.json CHANGED
@@ -8,8 +8,11 @@
8
  "init_lora_weights": true,
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
 
11
  "lora_alpha": 16,
12
  "lora_dropout": 0.05,
 
 
13
  "modules_to_save": [
14
  "embed_tokens",
15
  "lm_head"
 
8
  "init_lora_weights": true,
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
11
+ "loftq_config": {},
12
  "lora_alpha": 16,
13
  "lora_dropout": 0.05,
14
+ "megatron_config": null,
15
+ "megatron_core": "megatron.core",
16
  "modules_to_save": [
17
  "embed_tokens",
18
  "lm_head"
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c7068b13c3d20bd7b703c5fb985e4612f74af1f0c79bdb46e48bd8f3a53de01
3
  size 160899440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b272753c4f25e8b3412f529d56f8276a82d59ad0a9436dbf49eba539595e46b0
3
  size 160899440