File size: 2,487 Bytes
dedcdce
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
{
  "os":  "Linux-6.8.0-45-generic-x86_64-with-glibc2.39",
  "python":  "3.12.3",
  "startedAt":  "2024-10-07T10:21:12.262430Z",
  "args":  [
    "--model_name_or_path=openai/whisper-large-v3",
    "--dataset_name=mozilla-foundation/common_voice_17_0",
    "--dataset_config_name=eu",
    "--language=basque",
    "--train_split_name=train+validation",
    "--eval_split_name=test",
    "--model_index_name=Whisper Large Basque",
    "--max_steps=10000",
    "--output_dir=./",
    "--per_device_train_batch_size=16",
    "--per_device_eval_batch_size=8",
    "--gradient_accumulation_steps=1",
    "--logging_steps=25",
    "--learning_rate=4.375e-6",
    "--warmup_steps=500",
    "--evaluation_strategy=steps",
    "--eval_steps=500",
    "--save_strategy=steps",
    "--save_steps=1000",
    "--generation_max_length=228",
    "--length_column_name=input_length",
    "--max_duration_in_seconds=30",
    "--text_column_name=sentence",
    "--freeze_feature_encoder=False",
    "--report_to=tensorboard",
    "--metric_for_best_model=wer",
    "--greater_is_better=False",
    "--load_best_model_at_end",
    "--gradient_checkpointing",
    "--fp16",
    "--overwrite_output_dir",
    "--do_train",
    "--do_eval",
    "--predict_with_generate",
    "--do_normalize_eval",
    "--streaming",
    "--push_to_hub",
    "--resume_from_checkpoint=./checkpoint-9000/",
    "--report_to",
    "wandb",
    "--run_name",
    "whisper-large-eu"
  ],
  "program":  "/home/tknika/whisper-large-eu/run_speech_recognition_seq2seq_streaming.py",
  "codePath":  "run_speech_recognition_seq2seq_streaming.py",
  "git":  {
    "remote":  "https://huggingface.co/xezpeleta/whisper-large-eu",
    "commit":  "45227421df6af8836af459c374361e7303a68aea"
  },
  "email":  "[email protected]",
  "root":  "/home/tknika/whisper-large-eu",
  "host":  "tknika",
  "username":  "tknika",
  "executable":  "/home/tknika/whisper-large-eu/.venv/bin/python",
  "codePathLocal":  "run_speech_recognition_seq2seq_streaming.py",
  "cpu_count":  8,
  "cpu_count_logical":  8,
  "gpu":  "[NVIDIA L40-48Q]",
  "gpu_count":  1,
  "disk":  {
    "/":  {
      "total":  "314615791616",
      "used":  "265683288064"
    }
  },
  "memory":  {
    "total":  "33654026240"
  },
  "cpu":  {
    "count":  8,
    "countLogical":  8
  },
  "gpu_nvidia":  [
    {
      "name":  "NVIDIA L40-48Q",
      "memoryTotal":  "51539607552",
      "cudaCores":  18176,
      "architecture":  "Ada"
    }
  ],
  "cudaVersion":  "12.4"
}