ayousanz committed on
Commit
3d053ac
1 Parent(s): ee0a539

Upload folder using huggingface_hub

Browse files
Files changed (21) hide show
  1. .gitattributes +5 -0
  2. line-corporation/japanese-large-lm-3.6b-instruction-sft/Constant_251_attr__value +3 -0
  3. line-corporation/japanese-large-lm-3.6b-instruction-sft/Constant_265_attr__value +3 -0
  4. line-corporation/japanese-large-lm-3.6b-instruction-sft/_gpt_neox_layers.0_attention_rotary_emb_Constant_5_attr__value +0 -0
  5. line-corporation/japanese-large-lm-3.6b-instruction-sft/_gpt_neox_layers.0_attention_rotary_emb_Constant_attr__value +0 -0
  6. line-corporation/japanese-large-lm-3.6b-instruction-sft/config.json +30 -0
  7. line-corporation/japanese-large-lm-3.6b-instruction-sft/generation_config.json +7 -0
  8. line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model.onnx +3 -0
  9. line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model.onnx_data +3 -0
  10. line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model_merged.onnx +3 -0
  11. line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model_merged.onnx_data +3 -0
  12. line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model_merged_quantized.onnx +3 -0
  13. line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model_quantized.onnx +3 -0
  14. line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_with_past_model.onnx +3 -0
  15. line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_with_past_model.onnx_data +3 -0
  16. line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_with_past_model_quantized.onnx +3 -0
  17. line-corporation/japanese-large-lm-3.6b-instruction-sft/quantize_config.json +103 -0
  18. line-corporation/japanese-large-lm-3.6b-instruction-sft/special_tokens_map.json +9 -0
  19. line-corporation/japanese-large-lm-3.6b-instruction-sft/spiece.model +3 -0
  20. line-corporation/japanese-large-lm-3.6b-instruction-sft/tokenizer.json +0 -0
  21. line-corporation/japanese-large-lm-3.6b-instruction-sft/tokenizer_config.json +18 -0
.gitattributes CHANGED
@@ -84,3 +84,8 @@ line-corporation/japanese-large-lm-3.6b/Constant_265_attr__value filter=lfs diff
84
  line-corporation/japanese-large-lm-3.6b/onnx/decoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
85
  line-corporation/japanese-large-lm-3.6b/onnx/decoder_model_merged.onnx_data filter=lfs diff=lfs merge=lfs -text
86
  line-corporation/japanese-large-lm-3.6b/onnx/decoder_with_past_model.onnx_data filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
84
  line-corporation/japanese-large-lm-3.6b/onnx/decoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
85
  line-corporation/japanese-large-lm-3.6b/onnx/decoder_model_merged.onnx_data filter=lfs diff=lfs merge=lfs -text
86
  line-corporation/japanese-large-lm-3.6b/onnx/decoder_with_past_model.onnx_data filter=lfs diff=lfs merge=lfs -text
87
+ line-corporation/japanese-large-lm-3.6b-instruction-sft/Constant_251_attr__value filter=lfs diff=lfs merge=lfs -text
88
+ line-corporation/japanese-large-lm-3.6b-instruction-sft/Constant_265_attr__value filter=lfs diff=lfs merge=lfs -text
89
+ line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model.onnx_data filter=lfs diff=lfs merge=lfs -text
90
+ line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model_merged.onnx_data filter=lfs diff=lfs merge=lfs -text
91
+ line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_with_past_model.onnx_data filter=lfs diff=lfs merge=lfs -text
line-corporation/japanese-large-lm-3.6b-instruction-sft/Constant_251_attr__value ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83dd5f1a5a07912d2e7dbb73b75edeb2ce4c1f1d6ec48144a887bd4a4f72325b
3
+ size 4194304
line-corporation/japanese-large-lm-3.6b-instruction-sft/Constant_265_attr__value ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83dd5f1a5a07912d2e7dbb73b75edeb2ce4c1f1d6ec48144a887bd4a4f72325b
3
+ size 4194304
line-corporation/japanese-large-lm-3.6b-instruction-sft/_gpt_neox_layers.0_attention_rotary_emb_Constant_5_attr__value ADDED
Binary file (786 kB). View file
 
line-corporation/japanese-large-lm-3.6b-instruction-sft/_gpt_neox_layers.0_attention_rotary_emb_Constant_attr__value ADDED
Binary file (786 kB). View file
 
line-corporation/japanese-large-lm-3.6b-instruction-sft/config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "line-corporation/japanese-large-lm-3.6b-instruction-sft",
3
+ "architectures": [
4
+ "GPTNeoXForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 2,
8
+ "classifier_dropout": 0.1,
9
+ "end_token_id": 2,
10
+ "eos_token_id": 2,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout": 0.0,
13
+ "hidden_size": 3072,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 12288,
16
+ "layer_norm_eps": 1e-05,
17
+ "max_position_embeddings": 2048,
18
+ "model_type": "gpt_neox",
19
+ "num_attention_heads": 32,
20
+ "num_hidden_layers": 30,
21
+ "pad_token_id": 2,
22
+ "rope_scaling": null,
23
+ "rotary_emb_base": 10000,
24
+ "rotary_pct": 1.0,
25
+ "tie_word_embeddings": true,
26
+ "transformers_version": "4.33.2",
27
+ "use_cache": true,
28
+ "use_parallel_residual": false,
29
+ "vocab_size": 51200
30
+ }
line-corporation/japanese-large-lm-3.6b-instruction-sft/generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 2,
4
+ "eos_token_id": 2,
5
+ "pad_token_id": 2,
6
+ "transformers_version": "4.33.2"
7
+ }
line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:881ddc0179e87aa4caf5ea232fcdfdec1e7e69e3b87299685ca9874c77a5b327
3
+ size 7663132
line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:796c3b148c409ff8bc0e11a465ff047406da57c4b3788ae60394fd87de650b87
3
+ size 14223507456
line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0767fe2f1fbacff44c82b957b2d01739b10eb5f8635658aa321be6f9649ed52c
3
+ size 15338526
line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model_merged.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:796c3b148c409ff8bc0e11a465ff047406da57c4b3788ae60394fd87de650b87
3
+ size 14223507456
line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d38239bd24deffc63511bded47024df7a073af1a0a2ebb9b1ccce0c8d77f7712
3
+ size 3580420639
line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c46a0e04cf13873c3891a78bcd7e4d9406c044de6fd74b1b4d60dae39c9e29d3
3
+ size 3572007330
line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b37bbf91f27a17eee7c54d8202b85d32f3a7084546d383af4af3a6a09a5e4712
3
+ size 7705851
line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_with_past_model.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:796c3b148c409ff8bc0e11a465ff047406da57c4b3788ae60394fd87de650b87
3
+ size 14223507456
line-corporation/japanese-large-lm-3.6b-instruction-sft/onnx/decoder_with_past_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afc3df701553c78d65852172534070ed7703b53f4e029ffac7fc285a63d035aa
3
+ size 3572057146
line-corporation/japanese-large-lm-3.6b-instruction-sft/quantize_config.json ADDED
@@ -0,0 +1,103 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "decoder_model_merged": {
6
+ "op_types": [
7
+ "Div",
8
+ "Mul",
9
+ "GatherElements",
10
+ "Sqrt",
11
+ "Sub",
12
+ "Concat",
13
+ "Erf",
14
+ "Cast",
15
+ "Expand",
16
+ "Pow",
17
+ "Where",
18
+ "Squeeze",
19
+ "Add",
20
+ "Softmax",
21
+ "Tile",
22
+ "Shape",
23
+ "Transpose",
24
+ "If",
25
+ "Reshape",
26
+ "Slice",
27
+ "ConstantOfShape",
28
+ "Neg",
29
+ "Constant",
30
+ "Gather",
31
+ "MatMul",
32
+ "Unsqueeze",
33
+ "ReduceMean",
34
+ "Range"
35
+ ],
36
+ "weight_type": "QInt8"
37
+ },
38
+ "decoder_model": {
39
+ "op_types": [
40
+ "Div",
41
+ "Mul",
42
+ "GatherElements",
43
+ "Sqrt",
44
+ "Sub",
45
+ "Concat",
46
+ "Erf",
47
+ "Cast",
48
+ "Expand",
49
+ "Pow",
50
+ "Where",
51
+ "Squeeze",
52
+ "Add",
53
+ "Softmax",
54
+ "Tile",
55
+ "Shape",
56
+ "Transpose",
57
+ "Reshape",
58
+ "Slice",
59
+ "ConstantOfShape",
60
+ "Neg",
61
+ "Constant",
62
+ "Gather",
63
+ "MatMul",
64
+ "Unsqueeze",
65
+ "ReduceMean",
66
+ "Range"
67
+ ],
68
+ "weight_type": "QInt8"
69
+ },
70
+ "decoder_with_past_model": {
71
+ "op_types": [
72
+ "Div",
73
+ "Mul",
74
+ "GatherElements",
75
+ "Sqrt",
76
+ "Sub",
77
+ "Concat",
78
+ "Erf",
79
+ "Cast",
80
+ "Expand",
81
+ "Pow",
82
+ "Where",
83
+ "Squeeze",
84
+ "Add",
85
+ "Softmax",
86
+ "Tile",
87
+ "Shape",
88
+ "Transpose",
89
+ "Reshape",
90
+ "Slice",
91
+ "ConstantOfShape",
92
+ "Neg",
93
+ "Constant",
94
+ "Gather",
95
+ "MatMul",
96
+ "Unsqueeze",
97
+ "ReduceMean",
98
+ "Range"
99
+ ],
100
+ "weight_type": "QInt8"
101
+ }
102
+ }
103
+ }
line-corporation/japanese-large-lm-3.6b-instruction-sft/special_tokens_map.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<cls>",
4
+ "eos_token": "</s>",
5
+ "mask_token": "<mask>",
6
+ "pad_token": "</s>",
7
+ "sep_token": "<sep>",
8
+ "unk_token": "<unk>"
9
+ }
line-corporation/japanese-large-lm-3.6b-instruction-sft/spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c5c56a739832923347681ed8a03a9cbf5afb6d1fe60089a5b01dd2dd063ab71
3
+ size 1208648
line-corporation/japanese-large-lm-3.6b-instruction-sft/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
line-corporation/japanese-large-lm-3.6b-instruction-sft/tokenizer_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": null,
3
+ "bos_token": "<s>",
4
+ "clean_up_tokenization_spaces": true,
5
+ "cls_token": "<cls>",
6
+ "do_lower_case": false,
7
+ "eos_token": "</s>",
8
+ "extra_ids": 0,
9
+ "keep_accents": true,
10
+ "legacy": true,
11
+ "mask_token": "<mask>",
12
+ "model_max_length": 1000000000000000019884624838656,
13
+ "pad_token": "<pad>",
14
+ "sep_token": "<sep>",
15
+ "sp_model_kwargs": {},
16
+ "tokenizer_class": "T5Tokenizer",
17
+ "unk_token": "<unk>"
18
+ }