doberst committed on
Commit
9bd4806
1 Parent(s): dd5e04b

Upload 11 files

Browse files
README.md CHANGED
@@ -1,3 +1,37 @@
1
- ---
2
- license: llama2
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: llama2
3
+ inference: false
4
+ tags: [green, llmware-rag, p7, ov]
5
+ ---
6
+
7
+ # dragon-llama-2-ov
8
+
9
+ <!-- Provide a quick summary of what the model is/does. -->
10
+
11
+ **dragon-llama-2-ov** is an OpenVINO int4-quantized version of Dragon Llama-2, providing a very fast, very small inference implementation optimized for AI PCs using Intel GPU, CPU, and NPU.
12
+
13
+ [**dragon-llama-2**](https://huggingface.co/llmware/dragon-llama-7b-v0) is a fact-based question-answering model, optimized for complex business documents.
14
+
15
+ Get started right away with [OpenVINO](https://github.com/openvinotoolkit/openvino).
16
+
17
+ Looking for AI PC solutions and demos? Contact us at [llmware](https://www.llmware.ai).
18
+
19
+
20
+ ### Model Description
21
+
22
+ - **Developed by:** llmware
23
+ - **Model type:** llama2
24
+ - **Parameters:** 7 billion
25
+ - **Model Parent:** llmware/dragon-llama-7b-v0
26
+ - **Language(s) (NLP):** English
27
+ - **License:** llama2-community-license
28
+ - **Uses:** Fact-based question-answering
29
+ - **RAG Benchmark Accuracy Score:** 97.25
30
+ - **Quantization:** int4
31
+
32
+
33
+ ## Model Card Contact
34
+
35
+ [llmware on hf](https://www.huggingface.co/llmware)
36
+
37
+ [llmware website](https://www.llmware.ai)
config.json ADDED
@@ -0,0 +1,183 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "llmware/dragon-llama-7b-v0",
3
+ "architectures": [
4
+ "Llama2ForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "dim": 4096,
10
+ "eos_token_id": 2,
11
+ "ffn_dim_multiplier": null,
12
+ "hidden_act": "silu",
13
+ "hidden_size": 4096,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 11008,
16
+ "max_batch_size": 32,
17
+ "max_position_embeddings": 2048,
18
+ "max_seq_len": 2048,
19
+ "mlp_bias": false,
20
+ "model_class": "llama2",
21
+ "model_repo_folder_path": "llama2-7b-base",
22
+ "model_size": "7b",
23
+ "model_type": "llama",
24
+ "multiple_of": 256,
25
+ "n_heads": 32,
26
+ "n_kv_heads": null,
27
+ "n_layers": 32,
28
+ "norm_eps": 1e-05,
29
+ "num_attention_heads": 32,
30
+ "num_hidden_layers": 32,
31
+ "num_key_value_heads": 32,
32
+ "pad_token_id": -1,
33
+ "pretraining_base": "llama2-7b-2t-tokens",
34
+ "pretraining_tp": 1,
35
+ "rms_norm_eps": 1e-06,
36
+ "rope_scaling": null,
37
+ "rope_theta": 10000.0,
38
+ "tie_word_embeddings": false,
39
+ "transformers_version": "4.41.2",
40
+ "use_cache": true,
41
+ "vocab_size": 32000,
42
+ "prompt_wrapper": "human_bot",
43
+ "prompt_format": "<human> {context_passage} \n {question} \n<bot>:",
44
+ "prompt_format_dict": {"main_start": "<human>: ", "main_stop": "\n", "start_llm_response": "<bot>:"},
45
+ "tokenizer_local": "tokenizer_ll2.json",
46
+ "tokenizer_config": {"bos_id": [1], "bos_token": ["<s>"], "eod_id": [2], "eos_token": ["</s>"]},
47
+ "model_parent": "llmware/dragon-llama-7b-v0",
48
+ "description": "Dragon-Llama-2-7B",
49
+ "quantization": "int4",
50
+ "context_window": 4096,
51
+ "model_family": "OVGenModel",
52
+ "parameters": 7.0,
53
+ "test_set": [
54
+ {
55
+ "query": "What is the total amount of the invoice?",
56
+ "answer": "$22,500.00",
57
+ "context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
58
+ "sample_number": 0,
59
+ "tokens": 138,
60
+ "category": "core"
61
+ },
62
+ {
63
+ "query": "What is the invoice number?",
64
+ "answer": "#0001",
65
+ "context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
66
+ "sample_number": 1,
67
+ "tokens": 138,
68
+ "category": "core"
69
+ },
70
+ {
71
+ "query": "What is a list of the items being purchased?",
72
+ "answer": "•Front End Engineering Service;\n•Back End Engineering Service;\n•Quality Assurance Manager",
73
+ "context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
74
+ "sample_number": 2,
75
+ "tokens": 138,
76
+ "category": "core"
77
+ },
78
+ {
79
+ "query": "What is the name of the contact for question?",
80
+ "answer": "Bia Hermes",
81
+ "context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
82
+ "sample_number": 3,
83
+ "tokens": 138,
84
+ "category": "core"
85
+ },
86
+ {
87
+ "query": "What is the PO number?",
88
+ "answer": "#1000",
89
+ "context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
90
+ "sample_number": 4,
91
+ "tokens": 138,
92
+ "category": "core"
93
+ },
94
+ {
95
+ "query": "When is payment due?",
96
+ "answer": "within 30 days of 01/01/2022",
97
+ "context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
98
+ "sample_number": 5,
99
+ "tokens": 138,
100
+ "category": "core"
101
+ },
102
+ {
103
+ "query": "When is payment due?",
104
+ "answer": "May 3, 2022",
105
+ "context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
106
+ "sample_number": 6,
107
+ "tokens": 139,
108
+ "category": "core"
109
+ },
110
+ {
111
+ "query": "What is the subtotal amount?",
112
+ "answer": "4150.00",
113
+ "context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
114
+ "sample_number": 7,
115
+ "tokens": 139,
116
+ "category": "core"
117
+ },
118
+ {
119
+ "query": "What is the total amount?",
120
+ "answer": "4565.00",
121
+ "context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
122
+ "sample_number": 8,
123
+ "tokens": 139,
124
+ "category": "core"
125
+ },
126
+ {
127
+ "query": "What is a list of the purchased items?",
128
+ "answer": "•30 Boxes of Printer Paper;\n•10 Printer Cartridges;\n•5 Laser Printers.",
129
+ "context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
130
+ "sample_number": 9,
131
+ "tokens": 139,
132
+ "category": "core"
133
+ },
134
+ {
135
+ "query": "What is the invoice number?",
136
+ "answer": "234",
137
+ "context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
138
+ "sample_number": 10,
139
+ "tokens": 139,
140
+ "category": "core"
141
+ },
142
+ {
143
+ "query": "What is the name of the two companies?",
144
+ "answer": "ABC Company and Delta Inc.",
145
+ "context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
146
+ "sample_number": 11,
147
+ "tokens": 139,
148
+ "category": "core"
149
+ },
150
+ {
151
+ "query": "How many boxes of paper are being purchased?",
152
+ "answer": "30",
153
+ "context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
154
+ "sample_number": 12,
155
+ "tokens": 139,
156
+ "category": "core"
157
+ },
158
+ {
159
+ "query": "What are the payment terms?",
160
+ "answer": "Due on Receipt",
161
+ "context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
162
+ "sample_number": 13,
163
+ "tokens": 139,
164
+ "category": "core"
165
+ },
166
+ {
167
+ "query": "What is the address of ABC Company?",
168
+ "answer": "8675 River Run Road, Marlington, CT 09392",
169
+ "context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
170
+ "sample_number": 14,
171
+ "tokens": 139,
172
+ "category": "core"
173
+ },
174
+ {
175
+ "query": "What is the date of the invoice?",
176
+ "answer": "March 3, 2022",
177
+ "context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
178
+ "sample_number": 15,
179
+ "tokens": 139,
180
+ "category": "core"
181
+ }]
182
+ }
183
+
openvino_detokenizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9556d0a1f310629e217450ac4198c49f5457f1a69e22ce7c9f8e81fab4d530a7
3
+ size 499723
openvino_detokenizer.xml ADDED
@@ -0,0 +1,97 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0"?>
2
+ <net name="detokenizer" version="11">
3
+ <layers>
4
+ <layer id="0" name="Parameter_176136" type="Parameter" version="opset1">
5
+ <data shape="?,?" element_type="i64" />
6
+ <output>
7
+ <port id="0" precision="I64" names="Parameter_176136">
8
+ <dim>-1</dim>
9
+ <dim>-1</dim>
10
+ </port>
11
+ </output>
12
+ </layer>
13
+ <layer id="1" name="Constant_176116" type="Const" version="opset1">
14
+ <data element_type="u8" shape="499723" offset="0" size="499723" />
15
+ <output>
16
+ <port id="0" precision="U8">
17
+ <dim>499723</dim>
18
+ </port>
19
+ </output>
20
+ </layer>
21
+ <layer id="2" name="Convert_176146" type="Convert" version="opset1">
22
+ <data destination_type="i32" />
23
+ <input>
24
+ <port id="0" precision="I64">
25
+ <dim>-1</dim>
26
+ <dim>-1</dim>
27
+ </port>
28
+ </input>
29
+ <output>
30
+ <port id="1" precision="I32">
31
+ <dim>-1</dim>
32
+ <dim>-1</dim>
33
+ </port>
34
+ </output>
35
+ </layer>
36
+ <layer id="3" name="SentencepieceDetokenizer_176137" type="SentencepieceDetokenizer" version="extension">
37
+ <input>
38
+ <port id="0" precision="U8">
39
+ <dim>499723</dim>
40
+ </port>
41
+ <port id="1" precision="I32">
42
+ <dim>-1</dim>
43
+ <dim>-1</dim>
44
+ </port>
45
+ </input>
46
+ <output>
47
+ <port id="2" precision="I32">
48
+ <dim>-1</dim>
49
+ </port>
50
+ <port id="3" precision="I32">
51
+ <dim>-1</dim>
52
+ </port>
53
+ <port id="4" precision="U8">
54
+ <dim>-1</dim>
55
+ </port>
56
+ </output>
57
+ </layer>
58
+ <layer id="4" name="StringTensorPack_176138" type="StringTensorPack" version="extension">
59
+ <data mode="begins_ends" />
60
+ <input>
61
+ <port id="0" precision="I32">
62
+ <dim>-1</dim>
63
+ </port>
64
+ <port id="1" precision="I32">
65
+ <dim>-1</dim>
66
+ </port>
67
+ <port id="2" precision="U8">
68
+ <dim>-1</dim>
69
+ </port>
70
+ </input>
71
+ <output>
72
+ <port id="3" precision="STRING" names="string_output">
73
+ <dim>-1</dim>
74
+ </port>
75
+ </output>
76
+ </layer>
77
+ <layer id="5" name="Result_176139" type="Result" version="opset1">
78
+ <input>
79
+ <port id="0" precision="STRING">
80
+ <dim>-1</dim>
81
+ </port>
82
+ </input>
83
+ </layer>
84
+ </layers>
85
+ <edges>
86
+ <edge from-layer="0" from-port="0" to-layer="2" to-port="0" />
87
+ <edge from-layer="1" from-port="0" to-layer="3" to-port="0" />
88
+ <edge from-layer="2" from-port="1" to-layer="3" to-port="1" />
89
+ <edge from-layer="3" from-port="2" to-layer="4" to-port="0" />
90
+ <edge from-layer="3" from-port="3" to-layer="4" to-port="1" />
91
+ <edge from-layer="3" from-port="4" to-layer="4" to-port="2" />
92
+ <edge from-layer="4" from-port="3" to-layer="5" to-port="0" />
93
+ </edges>
94
+ <rt_info>
95
+ <eos_token_id value="2" />
96
+ </rt_info>
97
+ </net>
openvino_model.xml ADDED
The diff for this file is too large to render. See raw diff
 
openvino_tokenizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ec38b843ff6c229ec650d242feaad2c9e4fa694c69d5e20a8e68b95a878c7ad
3
+ size 499731
openvino_tokenizer.xml ADDED
@@ -0,0 +1,231 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0"?>
2
+ <net name="tokenizer" version="11">
3
+ <layers>
4
+ <layer id="0" name="string_input" type="Parameter" version="opset1">
5
+ <data shape="?" element_type="string" />
6
+ <output>
7
+ <port id="0" precision="STRING" names="string_input">
8
+ <dim>-1</dim>
9
+ </port>
10
+ </output>
11
+ </layer>
12
+ <layer id="1" name="Constant_176122" type="Const" version="opset1">
13
+ <data element_type="i32" shape="" offset="0" size="4" />
14
+ <output>
15
+ <port id="0" precision="I32" />
16
+ </output>
17
+ </layer>
18
+ <layer id="2" name="Constant_176115" type="Const" version="opset1">
19
+ <data element_type="u8" shape="499723" offset="4" size="499723" />
20
+ <output>
21
+ <port id="0" precision="U8">
22
+ <dim>499723</dim>
23
+ </port>
24
+ </output>
25
+ </layer>
26
+ <layer id="3" name="SentencepieceTokenizer_176118" type="SentencepieceTokenizer" version="extension">
27
+ <data nbest_size="0" alpha="0" add_bos="true" add_eos="false" reverse="false" />
28
+ <input>
29
+ <port id="0" precision="U8">
30
+ <dim>499723</dim>
31
+ </port>
32
+ <port id="1" precision="STRING">
33
+ <dim>-1</dim>
34
+ </port>
35
+ </input>
36
+ <output>
37
+ <port id="2" precision="I64">
38
+ <dim>-1</dim>
39
+ <dim>2</dim>
40
+ </port>
41
+ <port id="3" precision="I32">
42
+ <dim>-1</dim>
43
+ </port>
44
+ <port id="4" precision="I64">
45
+ <dim>2</dim>
46
+ </port>
47
+ </output>
48
+ </layer>
49
+ <layer id="4" name="Broadcast_176123" type="Broadcast" version="opset3">
50
+ <data mode="numpy" />
51
+ <input>
52
+ <port id="0" precision="I32" />
53
+ <port id="1" precision="I64">
54
+ <dim>2</dim>
55
+ </port>
56
+ </input>
57
+ <output>
58
+ <port id="2" precision="I32">
59
+ <dim>-1</dim>
60
+ <dim>-1</dim>
61
+ </port>
62
+ </output>
63
+ </layer>
64
+ <layer id="5" name="Constant_176124" type="Const" version="opset1">
65
+ <data element_type="i32" shape="" offset="499727" size="4" />
66
+ <output>
67
+ <port id="0" precision="I32" />
68
+ </output>
69
+ </layer>
70
+ <layer id="6" name="ShapeOf_176125" type="ShapeOf" version="opset3">
71
+ <data output_type="i64" />
72
+ <input>
73
+ <port id="0" precision="I32">
74
+ <dim>-1</dim>
75
+ </port>
76
+ </input>
77
+ <output>
78
+ <port id="1" precision="I64">
79
+ <dim>1</dim>
80
+ </port>
81
+ </output>
82
+ </layer>
83
+ <layer id="7" name="Broadcast_176126" type="Broadcast" version="opset3">
84
+ <data mode="numpy" />
85
+ <input>
86
+ <port id="0" precision="I32" />
87
+ <port id="1" precision="I64">
88
+ <dim>1</dim>
89
+ </port>
90
+ </input>
91
+ <output>
92
+ <port id="2" precision="I32">
93
+ <dim>-1</dim>
94
+ </port>
95
+ </output>
96
+ </layer>
97
+ <layer id="8" name="ScatterNDUpdate_176130" type="ScatterNDUpdate" version="opset4">
98
+ <input>
99
+ <port id="0" precision="I32">
100
+ <dim>-1</dim>
101
+ <dim>-1</dim>
102
+ </port>
103
+ <port id="1" precision="I64">
104
+ <dim>-1</dim>
105
+ <dim>2</dim>
106
+ </port>
107
+ <port id="2" precision="I32">
108
+ <dim>-1</dim>
109
+ </port>
110
+ </input>
111
+ <output>
112
+ <port id="3" precision="I32">
113
+ <dim>-1</dim>
114
+ <dim>-1</dim>
115
+ </port>
116
+ </output>
117
+ </layer>
118
+ <layer id="9" name="ScatterNDUpdate_176130" type="Convert" version="opset1">
119
+ <data destination_type="i64" />
120
+ <input>
121
+ <port id="0" precision="I32">
122
+ <dim>-1</dim>
123
+ <dim>-1</dim>
124
+ </port>
125
+ </input>
126
+ <output>
127
+ <port id="1" precision="I64" names="attention_mask">
128
+ <dim>-1</dim>
129
+ <dim>-1</dim>
130
+ </port>
131
+ </output>
132
+ </layer>
133
+ <layer id="11" name="Constant_176119" type="Const" version="opset1">
134
+ <data element_type="i32" shape="" offset="0" size="4" />
135
+ <output>
136
+ <port id="0" precision="I32" />
137
+ </output>
138
+ </layer>
139
+ <layer id="12" name="Broadcast_176120" type="Broadcast" version="opset3">
140
+ <data mode="numpy" />
141
+ <input>
142
+ <port id="0" precision="I32" />
143
+ <port id="1" precision="I64">
144
+ <dim>2</dim>
145
+ </port>
146
+ </input>
147
+ <output>
148
+ <port id="2" precision="I32">
149
+ <dim>-1</dim>
150
+ <dim>-1</dim>
151
+ </port>
152
+ </output>
153
+ </layer>
154
+ <layer id="13" name="ScatterNDUpdate_176121" type="ScatterNDUpdate" version="opset4">
155
+ <input>
156
+ <port id="0" precision="I32">
157
+ <dim>-1</dim>
158
+ <dim>-1</dim>
159
+ </port>
160
+ <port id="1" precision="I64">
161
+ <dim>-1</dim>
162
+ <dim>2</dim>
163
+ </port>
164
+ <port id="2" precision="I32">
165
+ <dim>-1</dim>
166
+ </port>
167
+ </input>
168
+ <output>
169
+ <port id="3" precision="I32">
170
+ <dim>-1</dim>
171
+ <dim>-1</dim>
172
+ </port>
173
+ </output>
174
+ </layer>
175
+ <layer id="14" name="ScatterNDUpdate_176121" type="Convert" version="opset1">
176
+ <data destination_type="i64" />
177
+ <input>
178
+ <port id="0" precision="I32">
179
+ <dim>-1</dim>
180
+ <dim>-1</dim>
181
+ </port>
182
+ </input>
183
+ <output>
184
+ <port id="1" precision="I64" names="input_ids">
185
+ <dim>-1</dim>
186
+ <dim>-1</dim>
187
+ </port>
188
+ </output>
189
+ </layer>
190
+ <layer id="15" name="Result_176131" type="Result" version="opset1">
191
+ <input>
192
+ <port id="0" precision="I64">
193
+ <dim>-1</dim>
194
+ <dim>-1</dim>
195
+ </port>
196
+ </input>
197
+ </layer>
198
+ <layer id="10" name="Result_176132" type="Result" version="opset1">
199
+ <input>
200
+ <port id="0" precision="I64">
201
+ <dim>-1</dim>
202
+ <dim>-1</dim>
203
+ </port>
204
+ </input>
205
+ </layer>
206
+ </layers>
207
+ <edges>
208
+ <edge from-layer="0" from-port="0" to-layer="3" to-port="1" />
209
+ <edge from-layer="1" from-port="0" to-layer="4" to-port="0" />
210
+ <edge from-layer="2" from-port="0" to-layer="3" to-port="0" />
211
+ <edge from-layer="3" from-port="4" to-layer="4" to-port="1" />
212
+ <edge from-layer="3" from-port="3" to-layer="6" to-port="0" />
213
+ <edge from-layer="3" from-port="2" to-layer="8" to-port="1" />
214
+ <edge from-layer="3" from-port="4" to-layer="12" to-port="1" />
215
+ <edge from-layer="3" from-port="2" to-layer="13" to-port="1" />
216
+ <edge from-layer="3" from-port="3" to-layer="13" to-port="2" />
217
+ <edge from-layer="4" from-port="2" to-layer="8" to-port="0" />
218
+ <edge from-layer="5" from-port="0" to-layer="7" to-port="0" />
219
+ <edge from-layer="6" from-port="1" to-layer="7" to-port="1" />
220
+ <edge from-layer="7" from-port="2" to-layer="8" to-port="2" />
221
+ <edge from-layer="8" from-port="3" to-layer="9" to-port="0" />
222
+ <edge from-layer="9" from-port="1" to-layer="10" to-port="0" />
223
+ <edge from-layer="11" from-port="0" to-layer="12" to-port="0" />
224
+ <edge from-layer="12" from-port="2" to-layer="13" to-port="0" />
225
+ <edge from-layer="13" from-port="3" to-layer="14" to-port="0" />
226
+ <edge from-layer="14" from-port="1" to-layer="15" to-port="0" />
227
+ </edges>
228
+ <rt_info>
229
+ <eos_token_id value="2" />
230
+ </rt_info>
231
+ </net>
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "unk_token": {
17
+ "content": "<unk>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
3
+ size 499723
tokenizer_config.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "add_prefix_space": true,
5
+ "added_tokens_decoder": {
6
+ "0": {
7
+ "content": "<unk>",
8
+ "lstrip": false,
9
+ "normalized": false,
10
+ "rstrip": false,
11
+ "single_word": false,
12
+ "special": true
13
+ },
14
+ "1": {
15
+ "content": "<s>",
16
+ "lstrip": false,
17
+ "normalized": false,
18
+ "rstrip": false,
19
+ "single_word": false,
20
+ "special": true
21
+ },
22
+ "2": {
23
+ "content": "</s>",
24
+ "lstrip": false,
25
+ "normalized": false,
26
+ "rstrip": false,
27
+ "single_word": false,
28
+ "special": true
29
+ }
30
+ },
31
+ "bos_token": "<s>",
32
+ "clean_up_tokenization_spaces": false,
33
+ "eos_token": "</s>",
34
+ "legacy": true,
35
+ "model_max_length": 1000000000000000019884624838656,
36
+ "pad_token": null,
37
+ "sp_model_kwargs": {},
38
+ "spaces_between_special_tokens": false,
39
+ "tokenizer_class": "LlamaTokenizer",
40
+ "unk_token": "<unk>",
41
+ "use_default_system_prompt": false
42
+ }