Raj-Sanjay-Shah committed on
Commit
8727172
1 Parent(s): cecdebf

Upload 4 files

Browse files
Files changed (2) hide show
  1. config.json +6 -7
  2. tokenizer_config.json +1 -1
config.json CHANGED
@@ -1,20 +1,19 @@
1
  {
2
- "_name_or_path": "/datadrive/finance/electra/out/checkpoint-142000",
3
  "architectures": [
4
- "ElectraForLanguageModelingModel"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
- "embedding_size": 128,
8
  "hidden_act": "gelu",
9
  "hidden_dropout_prob": 0.1,
10
- "hidden_size": 256,
11
  "initializer_range": 0.02,
12
- "intermediate_size": 1024,
13
  "layer_norm_eps": 1e-12,
14
  "max_position_embeddings": 512,
15
  "model_type": "electra",
16
- "num_attention_heads": 4,
17
- "num_hidden_layers": 12,
18
  "pad_token_id": 0,
19
  "position_embedding_type": "absolute",
20
  "summary_activation": "gelu",
 
1
  {
 
2
  "architectures": [
3
+ "ElectraForPreTraining"
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
+ "embedding_size": 1024,
7
  "hidden_act": "gelu",
8
  "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 1024,
10
  "initializer_range": 0.02,
11
+ "intermediate_size": 4096,
12
  "layer_norm_eps": 1e-12,
13
  "max_position_embeddings": 512,
14
  "model_type": "electra",
15
+ "num_attention_heads": 16,
16
+ "num_hidden_layers": 24,
17
  "pad_token_id": 0,
18
  "position_embedding_type": "absolute",
19
  "summary_activation": "gelu",
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"do_lower_case": true, "do_basic_tokenize": true, "never_split": null, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "name_or_path": "/datadrive/finance/electra/out/checkpoint-142000", "train_file": "/home/azureuser/finance/data/train.txt", "special_tokens_map_file": "/datadrive/finance/electra/out/checkpoint-142000/special_tokens_map.json", "tokenizer_file": null}
 
1
+ {"do_lower_case": true, "do_basic_tokenize": true, "never_split": null, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "name_or_path": "/datadrive/finance/electra/out/checkpoint-142000", "special_tokens_map_file": "/datadrive/finance/electra/out/checkpoint-142000/special_tokens_map.json", "tokenizer_file": null}