bastasie committed on
Commit
6293d0c
1 Parent(s): 73c74d4

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +9 -32
config.json CHANGED
@@ -1,38 +1,15 @@
1
  {
2
  "model_type": "CustomModel",
3
- "architecture": "Feedforward Neural Network with Ba-inspired Activation Function",
4
  "input_size": 512,
5
  "hidden_size": 128,
6
  "output_size": 768,
7
- "activation_function": {
8
- "name": "Ba-inspired Activation",
9
- "details": {
10
- "weights_initialization": "Random Normal Distribution",
11
- "a": 0.5,
12
- "epsilon": 1e-6,
13
- "function": "epsilon * torch.cos(np.pi * a * fractional_inspired * torch.log(torch.abs(fractional_inspired) + epsilon))"
14
- }
15
- },
16
- "tokenizer": "bert-base-uncased",
17
- "training_details": {
18
- "optimizer": "AdamW",
19
- "learning_rate": 5e-5,
20
- "loss_function": "CrossEntropyLoss",
21
- "batch_size": 8,
22
- "epochs": 3,
23
- "dataset": "Custom Dataset from JSON Lines File",
24
- "dataset_preprocessing": {
25
- "max_length": 512,
26
- "padding": true,
27
- "truncation": true
28
- }
29
- },
30
- "performance": {
31
- "final_accuracy": "Dependent on specific run and dataset",
32
- "final_loss": "Dependent on specific run and dataset"
33
- },
34
- "usage": {
35
- "inference": "Model can be used for tasks requiring sequence classification. Ensure input size matches model configuration.",
36
- "additional_notes": "Model and tokenizer need to be loaded with Hugging Face's transformers library for usage."
37
- }
38
  }
 
1
  {
2
  "model_type": "CustomModel",
3
+ "architecture": "CustomModel",
4
  "input_size": 512,
5
  "hidden_size": 128,
6
  "output_size": 768,
7
+ "vocab_size": 30522, // Example vocab size, adjust according to your tokenizer's vocabulary
8
+ "layer_norm_epsilon": 1e-12,
9
+ "hidden_dropout_prob": 0.1,
10
+ "num_attention_heads": 12, // Adjust if your model uses attention mechanisms
11
+ "attention_probs_dropout_prob": 0.1,
12
+ "intermediate_size": 3072, // Example size, adjust based on your model's architecture
13
+ "num_hidden_layers": 12, // Adjust based on your model's depth
14
+ "initializer_range": 0.02
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
15
  }