Upload 11 files
Browse files- README.md +37 -3
- config.json +183 -0
- openvino_detokenizer.bin +3 -0
- openvino_detokenizer.xml +97 -0
- openvino_model.xml +0 -0
- openvino_tokenizer.bin +3 -0
- openvino_tokenizer.xml +231 -0
- special_tokens_map.json +23 -0
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +42 -0
README.md
CHANGED
@@ -1,3 +1,37 @@
|
|
1 |
-
---
|
2 |
-
license: llama2
|
3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: llama2
|
3 |
+
inference: false
|
4 |
+
tags: [green, llmware-rag, p7, ov]
|
5 |
+
---
|
6 |
+
|
7 |
+
# dragon-llama-2-ov
|
8 |
+
|
9 |
+
<!-- Provide a quick summary of what the model is/does. -->
|
10 |
+
|
11 |
+
**dragon-llama-2-ov** is an OpenVINO int4-quantized version of Dragon Llama-2, providing a very fast, very small inference implementation, optimized for AI PCs using Intel GPU, CPU and NPU.
|
12 |
+
|
13 |
+
[**dragon-llama-2**](https://huggingface.co/llmware/dragon-llama-7b-v0) is a fact-based question-answering model, optimized for complex business documents.
|
14 |
+
|
15 |
+
Get started right away with [OpenVINO](https://github.com/openvinotoolkit/openvino)
|
16 |
+
|
17 |
+
Looking for AI PC solutions and demos? Contact us at [llmware](https://www.llmware.ai)
|
18 |
+
|
19 |
+
|
20 |
+
### Model Description
|
21 |
+
|
22 |
+
- **Developed by:** llmware
|
23 |
+
- **Model type:** llama2
|
24 |
+
- **Parameters:** 7 billion
|
25 |
+
- **Model Parent:** llmware/dragon-llama-7b-v0
|
26 |
+
- **Language(s) (NLP):** English
|
27 |
+
- **License:** llama2-community-license
|
28 |
+
- **Uses:** Fact-based question-answering
|
29 |
+
- **RAG Benchmark Accuracy Score:** 97.25
|
30 |
+
- **Quantization:** int4
|
31 |
+
|
32 |
+
|
33 |
+
## Model Card Contact
|
34 |
+
|
35 |
+
[llmware on hf](https://www.huggingface.co/llmware)
|
36 |
+
|
37 |
+
[llmware website](https://www.llmware.ai)
|
config.json
ADDED
@@ -0,0 +1,183 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "llmware/dragon-llama-7b-v0",
|
3 |
+
"architectures": [
|
4 |
+
"Llama2ForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"dim": 4096,
|
10 |
+
"eos_token_id": 2,
|
11 |
+
"ffn_dim_multiplier": null,
|
12 |
+
"hidden_act": "silu",
|
13 |
+
"hidden_size": 4096,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"intermediate_size": 11008,
|
16 |
+
"max_batch_size": 32,
|
17 |
+
"max_position_embeddings": 2048,
|
18 |
+
"max_seq_len": 2048,
|
19 |
+
"mlp_bias": false,
|
20 |
+
"model_class": "llama2",
|
21 |
+
"model_repo_folder_path": "llama2-7b-base",
|
22 |
+
"model_size": "7b",
|
23 |
+
"model_type": "llama",
|
24 |
+
"multiple_of": 256,
|
25 |
+
"n_heads": 32,
|
26 |
+
"n_kv_heads": null,
|
27 |
+
"n_layers": 32,
|
28 |
+
"norm_eps": 1e-05,
|
29 |
+
"num_attention_heads": 32,
|
30 |
+
"num_hidden_layers": 32,
|
31 |
+
"num_key_value_heads": 32,
|
32 |
+
"pad_token_id": -1,
|
33 |
+
"pretraining_base": "llama2-7b-2t-tokens",
|
34 |
+
"pretraining_tp": 1,
|
35 |
+
"rms_norm_eps": 1e-06,
|
36 |
+
"rope_scaling": null,
|
37 |
+
"rope_theta": 10000.0,
|
38 |
+
"tie_word_embeddings": false,
|
39 |
+
"transformers_version": "4.41.2",
|
40 |
+
"use_cache": true,
|
41 |
+
"vocab_size": 32000,
|
42 |
+
"prompt_wrapper": "human_bot",
|
43 |
+
"prompt_format": "<human> {context_passage} \n {question} \n<bot>:",
|
44 |
+
"prompt_format_dict": {"main_start": "<human>: ", "main_stop": "\n", "start_llm_response": "<bot>:"},
|
45 |
+
"tokenizer_local": "tokenizer_ll2.json",
|
46 |
+
"tokenizer_config": {"bos_id": [1], "bos_token": ["<s>"], "eod_id": [2], "eos_token": ["</s>"]},
|
47 |
+
"model_parent": "llmware/dragon-llama-7b-v0",
|
48 |
+
"description": "Dragon-Llama-2-7B",
|
49 |
+
"quantization": "int4",
|
50 |
+
"context_window": 4096,
|
51 |
+
"model_family": "OVGenModel",
|
52 |
+
"parameters": 7.0,
|
53 |
+
"test_set": [
|
54 |
+
{
|
55 |
+
"query": "What is the total amount of the invoice?",
|
56 |
+
"answer": "$22,500.00",
|
57 |
+
"context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
|
58 |
+
"sample_number": 0,
|
59 |
+
"tokens": 138,
|
60 |
+
"category": "core"
|
61 |
+
},
|
62 |
+
{
|
63 |
+
"query": "What is the invoice number?",
|
64 |
+
"answer": "#0001",
|
65 |
+
"context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
|
66 |
+
"sample_number": 1,
|
67 |
+
"tokens": 138,
|
68 |
+
"category": "core"
|
69 |
+
},
|
70 |
+
{
|
71 |
+
"query": "What is a list of the items being purchased?",
|
72 |
+
"answer": "•Front End Engineering Service;\n•Back End Engineering Service;\n•Quality Assurance Manager",
|
73 |
+
"context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
|
74 |
+
"sample_number": 2,
|
75 |
+
"tokens": 138,
|
76 |
+
"category": "core"
|
77 |
+
},
|
78 |
+
{
|
79 |
+
"query": "What is the name of the contact for question?",
|
80 |
+
"answer": "Bia Hermes",
|
81 |
+
"context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
|
82 |
+
"sample_number": 3,
|
83 |
+
"tokens": 138,
|
84 |
+
"category": "core"
|
85 |
+
},
|
86 |
+
{
|
87 |
+
"query": "What is the PO number?",
|
88 |
+
"answer": "#1000",
|
89 |
+
"context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
|
90 |
+
"sample_number": 4,
|
91 |
+
"tokens": 138,
|
92 |
+
"category": "core"
|
93 |
+
},
|
94 |
+
{
|
95 |
+
"query": "When is payment due?",
|
96 |
+
"answer": "within 30 days of 01/01/2022",
|
97 |
+
"context": "Services Vendor Inc. \n100 Elm Street Pleasantville, NY \nTO Alpha Inc. 5900 1st Street Los Angeles, CA \nDescription Front End Engineering Service $5000.00 \n Back End Engineering Service $7500.00 \n Quality Assurance Manager $10,000.00 \n Total Amount $22,500.00 \nMake all checks payable to Services Vendor Inc. Payment is due within 30 days.If you have any questions concerning this invoice, contact Bia Hermes. THANK YOU FOR YOUR BUSINESS! INVOICE INVOICE # 0001 DATE 01/01/2022 FOR Alpha Project P.O. # 1000",
|
98 |
+
"sample_number": 5,
|
99 |
+
"tokens": 138,
|
100 |
+
"category": "core"
|
101 |
+
},
|
102 |
+
{
|
103 |
+
"query": "When is payment due?",
|
104 |
+
"answer": "May 3, 2022",
|
105 |
+
"context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
|
106 |
+
"sample_number": 6,
|
107 |
+
"tokens": 139,
|
108 |
+
"category": "core"
|
109 |
+
},
|
110 |
+
{
|
111 |
+
"query": "What is the subtotal amount?",
|
112 |
+
"answer": "4150.00",
|
113 |
+
"context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
|
114 |
+
"sample_number": 7,
|
115 |
+
"tokens": 139,
|
116 |
+
"category": "core"
|
117 |
+
},
|
118 |
+
{
|
119 |
+
"query": "What is the total amount?",
|
120 |
+
"answer": "4565.00",
|
121 |
+
"context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
|
122 |
+
"sample_number": 8,
|
123 |
+
"tokens": 139,
|
124 |
+
"category": "core"
|
125 |
+
},
|
126 |
+
{
|
127 |
+
"query": "What is a list of the purchased items?",
|
128 |
+
"answer": "•30 Boxes of Printer Paper;\n•10 Printer Cartridges;\n•5 Laser Printers.",
|
129 |
+
"context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
|
130 |
+
"sample_number": 9,
|
131 |
+
"tokens": 139,
|
132 |
+
"category": "core"
|
133 |
+
},
|
134 |
+
{
|
135 |
+
"query": "What is the invoice number?",
|
136 |
+
"answer": "234",
|
137 |
+
"context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
|
138 |
+
"sample_number": 10,
|
139 |
+
"tokens": 139,
|
140 |
+
"category": "core"
|
141 |
+
},
|
142 |
+
{
|
143 |
+
"query": "What is the name of the two companies?",
|
144 |
+
"answer": "ABC Company and Delta Inc.",
|
145 |
+
"context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
|
146 |
+
"sample_number": 11,
|
147 |
+
"tokens": 139,
|
148 |
+
"category": "core"
|
149 |
+
},
|
150 |
+
{
|
151 |
+
"query": "How many boxes of paper are being purchased?",
|
152 |
+
"answer": "30",
|
153 |
+
"context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
|
154 |
+
"sample_number": 12,
|
155 |
+
"tokens": 139,
|
156 |
+
"category": "core"
|
157 |
+
},
|
158 |
+
{
|
159 |
+
"query": "What are the payment terms?",
|
160 |
+
"answer": "Due on Receipt",
|
161 |
+
"context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
|
162 |
+
"sample_number": 13,
|
163 |
+
"tokens": 139,
|
164 |
+
"category": "core"
|
165 |
+
},
|
166 |
+
{
|
167 |
+
"query": "What is the address of ABC Company?",
|
168 |
+
"answer": "8675 River Run Road, Marlington, CT 09392",
|
169 |
+
"context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
|
170 |
+
"sample_number": 14,
|
171 |
+
"tokens": 139,
|
172 |
+
"category": "core"
|
173 |
+
},
|
174 |
+
{
|
175 |
+
"query": "What is the date of the invoice?",
|
176 |
+
"answer": "March 3, 2022",
|
177 |
+
"context": "Invoice DATE March 3, 2022\tINVOICE NO 234\tABC Company 8675 River Run Road Marlington, CT 09392 INVOICE TO Delta Inc. 8723 Wilton Boulevard Los Angeles, CA HEBE HERACLES\tLASER PRINTER\tPAYMENT TERMS DUE DATE Due on Receipt May 3, 2022 QUANTITY DESCRIPTION UNIT PRICE LINE TOTAL 30 \tBoxes of Printer Paper\t$30\t$900 10\tPrinter Cartridges\t$75 $750 5\tLaser printers\t$500.00 $2500.00 Subtotal 4150.00 Sales Tax 10% Total 4565.00",
|
178 |
+
"sample_number": 15,
|
179 |
+
"tokens": 139,
|
180 |
+
"category": "core"
|
181 |
+
}]
|
182 |
+
}
|
openvino_detokenizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9556d0a1f310629e217450ac4198c49f5457f1a69e22ce7c9f8e81fab4d530a7
|
3 |
+
size 499723
|
openvino_detokenizer.xml
ADDED
@@ -0,0 +1,97 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<?xml version="1.0"?>
|
2 |
+
<net name="detokenizer" version="11">
|
3 |
+
<layers>
|
4 |
+
<layer id="0" name="Parameter_176136" type="Parameter" version="opset1">
|
5 |
+
<data shape="?,?" element_type="i64" />
|
6 |
+
<output>
|
7 |
+
<port id="0" precision="I64" names="Parameter_176136">
|
8 |
+
<dim>-1</dim>
|
9 |
+
<dim>-1</dim>
|
10 |
+
</port>
|
11 |
+
</output>
|
12 |
+
</layer>
|
13 |
+
<layer id="1" name="Constant_176116" type="Const" version="opset1">
|
14 |
+
<data element_type="u8" shape="499723" offset="0" size="499723" />
|
15 |
+
<output>
|
16 |
+
<port id="0" precision="U8">
|
17 |
+
<dim>499723</dim>
|
18 |
+
</port>
|
19 |
+
</output>
|
20 |
+
</layer>
|
21 |
+
<layer id="2" name="Convert_176146" type="Convert" version="opset1">
|
22 |
+
<data destination_type="i32" />
|
23 |
+
<input>
|
24 |
+
<port id="0" precision="I64">
|
25 |
+
<dim>-1</dim>
|
26 |
+
<dim>-1</dim>
|
27 |
+
</port>
|
28 |
+
</input>
|
29 |
+
<output>
|
30 |
+
<port id="1" precision="I32">
|
31 |
+
<dim>-1</dim>
|
32 |
+
<dim>-1</dim>
|
33 |
+
</port>
|
34 |
+
</output>
|
35 |
+
</layer>
|
36 |
+
<layer id="3" name="SentencepieceDetokenizer_176137" type="SentencepieceDetokenizer" version="extension">
|
37 |
+
<input>
|
38 |
+
<port id="0" precision="U8">
|
39 |
+
<dim>499723</dim>
|
40 |
+
</port>
|
41 |
+
<port id="1" precision="I32">
|
42 |
+
<dim>-1</dim>
|
43 |
+
<dim>-1</dim>
|
44 |
+
</port>
|
45 |
+
</input>
|
46 |
+
<output>
|
47 |
+
<port id="2" precision="I32">
|
48 |
+
<dim>-1</dim>
|
49 |
+
</port>
|
50 |
+
<port id="3" precision="I32">
|
51 |
+
<dim>-1</dim>
|
52 |
+
</port>
|
53 |
+
<port id="4" precision="U8">
|
54 |
+
<dim>-1</dim>
|
55 |
+
</port>
|
56 |
+
</output>
|
57 |
+
</layer>
|
58 |
+
<layer id="4" name="StringTensorPack_176138" type="StringTensorPack" version="extension">
|
59 |
+
<data mode="begins_ends" />
|
60 |
+
<input>
|
61 |
+
<port id="0" precision="I32">
|
62 |
+
<dim>-1</dim>
|
63 |
+
</port>
|
64 |
+
<port id="1" precision="I32">
|
65 |
+
<dim>-1</dim>
|
66 |
+
</port>
|
67 |
+
<port id="2" precision="U8">
|
68 |
+
<dim>-1</dim>
|
69 |
+
</port>
|
70 |
+
</input>
|
71 |
+
<output>
|
72 |
+
<port id="3" precision="STRING" names="string_output">
|
73 |
+
<dim>-1</dim>
|
74 |
+
</port>
|
75 |
+
</output>
|
76 |
+
</layer>
|
77 |
+
<layer id="5" name="Result_176139" type="Result" version="opset1">
|
78 |
+
<input>
|
79 |
+
<port id="0" precision="STRING">
|
80 |
+
<dim>-1</dim>
|
81 |
+
</port>
|
82 |
+
</input>
|
83 |
+
</layer>
|
84 |
+
</layers>
|
85 |
+
<edges>
|
86 |
+
<edge from-layer="0" from-port="0" to-layer="2" to-port="0" />
|
87 |
+
<edge from-layer="1" from-port="0" to-layer="3" to-port="0" />
|
88 |
+
<edge from-layer="2" from-port="1" to-layer="3" to-port="1" />
|
89 |
+
<edge from-layer="3" from-port="2" to-layer="4" to-port="0" />
|
90 |
+
<edge from-layer="3" from-port="3" to-layer="4" to-port="1" />
|
91 |
+
<edge from-layer="3" from-port="4" to-layer="4" to-port="2" />
|
92 |
+
<edge from-layer="4" from-port="3" to-layer="5" to-port="0" />
|
93 |
+
</edges>
|
94 |
+
<rt_info>
|
95 |
+
<eos_token_id value="2" />
|
96 |
+
</rt_info>
|
97 |
+
</net>
|
openvino_model.xml
ADDED
The diff for this file is too large to render.
See raw diff
|
|
openvino_tokenizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ec38b843ff6c229ec650d242feaad2c9e4fa694c69d5e20a8e68b95a878c7ad
|
3 |
+
size 499731
|
openvino_tokenizer.xml
ADDED
@@ -0,0 +1,231 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
<?xml version="1.0"?>
|
2 |
+
<net name="tokenizer" version="11">
|
3 |
+
<layers>
|
4 |
+
<layer id="0" name="string_input" type="Parameter" version="opset1">
|
5 |
+
<data shape="?" element_type="string" />
|
6 |
+
<output>
|
7 |
+
<port id="0" precision="STRING" names="string_input">
|
8 |
+
<dim>-1</dim>
|
9 |
+
</port>
|
10 |
+
</output>
|
11 |
+
</layer>
|
12 |
+
<layer id="1" name="Constant_176122" type="Const" version="opset1">
|
13 |
+
<data element_type="i32" shape="" offset="0" size="4" />
|
14 |
+
<output>
|
15 |
+
<port id="0" precision="I32" />
|
16 |
+
</output>
|
17 |
+
</layer>
|
18 |
+
<layer id="2" name="Constant_176115" type="Const" version="opset1">
|
19 |
+
<data element_type="u8" shape="499723" offset="4" size="499723" />
|
20 |
+
<output>
|
21 |
+
<port id="0" precision="U8">
|
22 |
+
<dim>499723</dim>
|
23 |
+
</port>
|
24 |
+
</output>
|
25 |
+
</layer>
|
26 |
+
<layer id="3" name="SentencepieceTokenizer_176118" type="SentencepieceTokenizer" version="extension">
|
27 |
+
<data nbest_size="0" alpha="0" add_bos="true" add_eos="false" reverse="false" />
|
28 |
+
<input>
|
29 |
+
<port id="0" precision="U8">
|
30 |
+
<dim>499723</dim>
|
31 |
+
</port>
|
32 |
+
<port id="1" precision="STRING">
|
33 |
+
<dim>-1</dim>
|
34 |
+
</port>
|
35 |
+
</input>
|
36 |
+
<output>
|
37 |
+
<port id="2" precision="I64">
|
38 |
+
<dim>-1</dim>
|
39 |
+
<dim>2</dim>
|
40 |
+
</port>
|
41 |
+
<port id="3" precision="I32">
|
42 |
+
<dim>-1</dim>
|
43 |
+
</port>
|
44 |
+
<port id="4" precision="I64">
|
45 |
+
<dim>2</dim>
|
46 |
+
</port>
|
47 |
+
</output>
|
48 |
+
</layer>
|
49 |
+
<layer id="4" name="Broadcast_176123" type="Broadcast" version="opset3">
|
50 |
+
<data mode="numpy" />
|
51 |
+
<input>
|
52 |
+
<port id="0" precision="I32" />
|
53 |
+
<port id="1" precision="I64">
|
54 |
+
<dim>2</dim>
|
55 |
+
</port>
|
56 |
+
</input>
|
57 |
+
<output>
|
58 |
+
<port id="2" precision="I32">
|
59 |
+
<dim>-1</dim>
|
60 |
+
<dim>-1</dim>
|
61 |
+
</port>
|
62 |
+
</output>
|
63 |
+
</layer>
|
64 |
+
<layer id="5" name="Constant_176124" type="Const" version="opset1">
|
65 |
+
<data element_type="i32" shape="" offset="499727" size="4" />
|
66 |
+
<output>
|
67 |
+
<port id="0" precision="I32" />
|
68 |
+
</output>
|
69 |
+
</layer>
|
70 |
+
<layer id="6" name="ShapeOf_176125" type="ShapeOf" version="opset3">
|
71 |
+
<data output_type="i64" />
|
72 |
+
<input>
|
73 |
+
<port id="0" precision="I32">
|
74 |
+
<dim>-1</dim>
|
75 |
+
</port>
|
76 |
+
</input>
|
77 |
+
<output>
|
78 |
+
<port id="1" precision="I64">
|
79 |
+
<dim>1</dim>
|
80 |
+
</port>
|
81 |
+
</output>
|
82 |
+
</layer>
|
83 |
+
<layer id="7" name="Broadcast_176126" type="Broadcast" version="opset3">
|
84 |
+
<data mode="numpy" />
|
85 |
+
<input>
|
86 |
+
<port id="0" precision="I32" />
|
87 |
+
<port id="1" precision="I64">
|
88 |
+
<dim>1</dim>
|
89 |
+
</port>
|
90 |
+
</input>
|
91 |
+
<output>
|
92 |
+
<port id="2" precision="I32">
|
93 |
+
<dim>-1</dim>
|
94 |
+
</port>
|
95 |
+
</output>
|
96 |
+
</layer>
|
97 |
+
<layer id="8" name="ScatterNDUpdate_176130" type="ScatterNDUpdate" version="opset4">
|
98 |
+
<input>
|
99 |
+
<port id="0" precision="I32">
|
100 |
+
<dim>-1</dim>
|
101 |
+
<dim>-1</dim>
|
102 |
+
</port>
|
103 |
+
<port id="1" precision="I64">
|
104 |
+
<dim>-1</dim>
|
105 |
+
<dim>2</dim>
|
106 |
+
</port>
|
107 |
+
<port id="2" precision="I32">
|
108 |
+
<dim>-1</dim>
|
109 |
+
</port>
|
110 |
+
</input>
|
111 |
+
<output>
|
112 |
+
<port id="3" precision="I32">
|
113 |
+
<dim>-1</dim>
|
114 |
+
<dim>-1</dim>
|
115 |
+
</port>
|
116 |
+
</output>
|
117 |
+
</layer>
|
118 |
+
<layer id="9" name="ScatterNDUpdate_176130" type="Convert" version="opset1">
|
119 |
+
<data destination_type="i64" />
|
120 |
+
<input>
|
121 |
+
<port id="0" precision="I32">
|
122 |
+
<dim>-1</dim>
|
123 |
+
<dim>-1</dim>
|
124 |
+
</port>
|
125 |
+
</input>
|
126 |
+
<output>
|
127 |
+
<port id="1" precision="I64" names="attention_mask">
|
128 |
+
<dim>-1</dim>
|
129 |
+
<dim>-1</dim>
|
130 |
+
</port>
|
131 |
+
</output>
|
132 |
+
</layer>
|
133 |
+
<layer id="11" name="Constant_176119" type="Const" version="opset1">
|
134 |
+
<data element_type="i32" shape="" offset="0" size="4" />
|
135 |
+
<output>
|
136 |
+
<port id="0" precision="I32" />
|
137 |
+
</output>
|
138 |
+
</layer>
|
139 |
+
<layer id="12" name="Broadcast_176120" type="Broadcast" version="opset3">
|
140 |
+
<data mode="numpy" />
|
141 |
+
<input>
|
142 |
+
<port id="0" precision="I32" />
|
143 |
+
<port id="1" precision="I64">
|
144 |
+
<dim>2</dim>
|
145 |
+
</port>
|
146 |
+
</input>
|
147 |
+
<output>
|
148 |
+
<port id="2" precision="I32">
|
149 |
+
<dim>-1</dim>
|
150 |
+
<dim>-1</dim>
|
151 |
+
</port>
|
152 |
+
</output>
|
153 |
+
</layer>
|
154 |
+
<layer id="13" name="ScatterNDUpdate_176121" type="ScatterNDUpdate" version="opset4">
|
155 |
+
<input>
|
156 |
+
<port id="0" precision="I32">
|
157 |
+
<dim>-1</dim>
|
158 |
+
<dim>-1</dim>
|
159 |
+
</port>
|
160 |
+
<port id="1" precision="I64">
|
161 |
+
<dim>-1</dim>
|
162 |
+
<dim>2</dim>
|
163 |
+
</port>
|
164 |
+
<port id="2" precision="I32">
|
165 |
+
<dim>-1</dim>
|
166 |
+
</port>
|
167 |
+
</input>
|
168 |
+
<output>
|
169 |
+
<port id="3" precision="I32">
|
170 |
+
<dim>-1</dim>
|
171 |
+
<dim>-1</dim>
|
172 |
+
</port>
|
173 |
+
</output>
|
174 |
+
</layer>
|
175 |
+
<layer id="14" name="ScatterNDUpdate_176121" type="Convert" version="opset1">
|
176 |
+
<data destination_type="i64" />
|
177 |
+
<input>
|
178 |
+
<port id="0" precision="I32">
|
179 |
+
<dim>-1</dim>
|
180 |
+
<dim>-1</dim>
|
181 |
+
</port>
|
182 |
+
</input>
|
183 |
+
<output>
|
184 |
+
<port id="1" precision="I64" names="input_ids">
|
185 |
+
<dim>-1</dim>
|
186 |
+
<dim>-1</dim>
|
187 |
+
</port>
|
188 |
+
</output>
|
189 |
+
</layer>
|
190 |
+
<layer id="15" name="Result_176131" type="Result" version="opset1">
|
191 |
+
<input>
|
192 |
+
<port id="0" precision="I64">
|
193 |
+
<dim>-1</dim>
|
194 |
+
<dim>-1</dim>
|
195 |
+
</port>
|
196 |
+
</input>
|
197 |
+
</layer>
|
198 |
+
<layer id="10" name="Result_176132" type="Result" version="opset1">
|
199 |
+
<input>
|
200 |
+
<port id="0" precision="I64">
|
201 |
+
<dim>-1</dim>
|
202 |
+
<dim>-1</dim>
|
203 |
+
</port>
|
204 |
+
</input>
|
205 |
+
</layer>
|
206 |
+
</layers>
|
207 |
+
<edges>
|
208 |
+
<edge from-layer="0" from-port="0" to-layer="3" to-port="1" />
|
209 |
+
<edge from-layer="1" from-port="0" to-layer="4" to-port="0" />
|
210 |
+
<edge from-layer="2" from-port="0" to-layer="3" to-port="0" />
|
211 |
+
<edge from-layer="3" from-port="4" to-layer="4" to-port="1" />
|
212 |
+
<edge from-layer="3" from-port="3" to-layer="6" to-port="0" />
|
213 |
+
<edge from-layer="3" from-port="2" to-layer="8" to-port="1" />
|
214 |
+
<edge from-layer="3" from-port="4" to-layer="12" to-port="1" />
|
215 |
+
<edge from-layer="3" from-port="2" to-layer="13" to-port="1" />
|
216 |
+
<edge from-layer="3" from-port="3" to-layer="13" to-port="2" />
|
217 |
+
<edge from-layer="4" from-port="2" to-layer="8" to-port="0" />
|
218 |
+
<edge from-layer="5" from-port="0" to-layer="7" to-port="0" />
|
219 |
+
<edge from-layer="6" from-port="1" to-layer="7" to-port="1" />
|
220 |
+
<edge from-layer="7" from-port="2" to-layer="8" to-port="2" />
|
221 |
+
<edge from-layer="8" from-port="3" to-layer="9" to-port="0" />
|
222 |
+
<edge from-layer="9" from-port="1" to-layer="10" to-port="0" />
|
223 |
+
<edge from-layer="11" from-port="0" to-layer="12" to-port="0" />
|
224 |
+
<edge from-layer="12" from-port="2" to-layer="13" to-port="0" />
|
225 |
+
<edge from-layer="13" from-port="3" to-layer="14" to-port="0" />
|
226 |
+
<edge from-layer="14" from-port="1" to-layer="15" to-port="0" />
|
227 |
+
</edges>
|
228 |
+
<rt_info>
|
229 |
+
<eos_token_id value="2" />
|
230 |
+
</rt_info>
|
231 |
+
</net>
|
special_tokens_map.json
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "</s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"unk_token": {
|
17 |
+
"content": "<unk>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
}
|
23 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
|
3 |
+
size 499723
|
tokenizer_config.json
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": true,
|
3 |
+
"add_eos_token": false,
|
4 |
+
"add_prefix_space": true,
|
5 |
+
"added_tokens_decoder": {
|
6 |
+
"0": {
|
7 |
+
"content": "<unk>",
|
8 |
+
"lstrip": false,
|
9 |
+
"normalized": false,
|
10 |
+
"rstrip": false,
|
11 |
+
"single_word": false,
|
12 |
+
"special": true
|
13 |
+
},
|
14 |
+
"1": {
|
15 |
+
"content": "<s>",
|
16 |
+
"lstrip": false,
|
17 |
+
"normalized": false,
|
18 |
+
"rstrip": false,
|
19 |
+
"single_word": false,
|
20 |
+
"special": true
|
21 |
+
},
|
22 |
+
"2": {
|
23 |
+
"content": "</s>",
|
24 |
+
"lstrip": false,
|
25 |
+
"normalized": false,
|
26 |
+
"rstrip": false,
|
27 |
+
"single_word": false,
|
28 |
+
"special": true
|
29 |
+
}
|
30 |
+
},
|
31 |
+
"bos_token": "<s>",
|
32 |
+
"clean_up_tokenization_spaces": false,
|
33 |
+
"eos_token": "</s>",
|
34 |
+
"legacy": true,
|
35 |
+
"model_max_length": 1000000000000000019884624838656,
|
36 |
+
"pad_token": null,
|
37 |
+
"sp_model_kwargs": {},
|
38 |
+
"spaces_between_special_tokens": false,
|
39 |
+
"tokenizer_class": "LlamaTokenizer",
|
40 |
+
"unk_token": "<unk>",
|
41 |
+
"use_default_system_prompt": false
|
42 |
+
}
|