Upload trained model
Browse files- additional_decoder_block.pt +3 -0
- classifier.pt +3 -0
- config.json +48 -0
- generation_config.json +12 -0
- log_eval.txt +1 -0
- log_eval_word_level.txt +1 -0
- preprocessor_config.json +14 -0
- runs/Jan28_04-07-30_isl-gpu43/events.out.tfevents.1738066100.isl-gpu43.2836202.0 +3 -0
- runs/Jan28_04-07-30_isl-gpu43/events.out.tfevents.1738066363.isl-gpu43.2836202.1 +3 -0
- training_args.bin +3 -0
- training_args.json +1 -0
additional_decoder_block.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:198def521215c52aeb9e7335bbdb28d48540dcae5c0c174b08049e6e3b52b52a
|
3 |
+
size 37809834
|
classifier.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bebcb2604d12f63ecc15d5bab8cefe508bf150fed8ccf0b36fd5fc8995afcd9b
|
3 |
+
size 4739176
|
config.json
ADDED
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"activation_dropout": 0.0,
|
3 |
+
"activation_function": "gelu",
|
4 |
+
"apply_spec_augment": false,
|
5 |
+
"architectures": [
|
6 |
+
"WhisperWithExtraDecoderAndClassifier"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"begin_suppress_tokens": [
|
10 |
+
220,
|
11 |
+
50256
|
12 |
+
],
|
13 |
+
"bos_token_id": 50256,
|
14 |
+
"classifier_proj_size": 256,
|
15 |
+
"d_model": 384,
|
16 |
+
"decoder_attention_heads": 6,
|
17 |
+
"decoder_ffn_dim": 1536,
|
18 |
+
"decoder_layerdrop": 0.0,
|
19 |
+
"decoder_layers": 4,
|
20 |
+
"decoder_start_token_id": 50257,
|
21 |
+
"dropout": 0.0,
|
22 |
+
"encoder_attention_heads": 6,
|
23 |
+
"encoder_ffn_dim": 1536,
|
24 |
+
"encoder_layerdrop": 0.0,
|
25 |
+
"encoder_layers": 4,
|
26 |
+
"eos_token_id": 50256,
|
27 |
+
"init_std": 0.02,
|
28 |
+
"is_encoder_decoder": true,
|
29 |
+
"mask_feature_length": 10,
|
30 |
+
"mask_feature_min_masks": 0,
|
31 |
+
"mask_feature_prob": 0.0,
|
32 |
+
"mask_time_length": 10,
|
33 |
+
"mask_time_min_masks": 2,
|
34 |
+
"mask_time_prob": 0.05,
|
35 |
+
"max_source_positions": 1500,
|
36 |
+
"max_target_positions": 448,
|
37 |
+
"median_filter_width": 7,
|
38 |
+
"model_type": "whisper",
|
39 |
+
"num_hidden_layers": 4,
|
40 |
+
"num_mel_bins": 80,
|
41 |
+
"pad_token_id": 50256,
|
42 |
+
"scale_embedding": false,
|
43 |
+
"torch_dtype": "float32",
|
44 |
+
"transformers_version": "4.45.2",
|
45 |
+
"use_cache": true,
|
46 |
+
"use_weighted_layer_sum": false,
|
47 |
+
"vocab_size": 51865
|
48 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"begin_suppress_tokens": [
|
4 |
+
220,
|
5 |
+
50256
|
6 |
+
],
|
7 |
+
"bos_token_id": 50256,
|
8 |
+
"decoder_start_token_id": 50257,
|
9 |
+
"eos_token_id": 50256,
|
10 |
+
"pad_token_id": 50256,
|
11 |
+
"transformers_version": "4.45.2"
|
12 |
+
}
|
log_eval.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"eval_accuracy": 0.22032726434662364, "eval_precision": 0.12059765208110992, "eval_recall": 0.8385899814471243, "eval_f1": 0.21087007231163984}{"eval_accuracy": 0.9057692307692308, "eval_precision": 0.6382978723404256, "eval_recall": 0.4838709677419355, "eval_f1": 0.5504587155963303}{"eval_accuracy": 0.9461538461538461, "eval_precision": 0.7931034482758621, "eval_recall": 0.7419354838709677, "eval_f1": 0.7666666666666667}{"eval_accuracy": 0.8826923076923077, "eval_precision": 0.5053763440860215, "eval_recall": 0.7580645161290323, "eval_f1": 0.6064516129032258}{"eval_accuracy": 0.9288461538461539, "eval_precision": 0.7906976744186046, "eval_recall": 0.5483870967741935, "eval_f1": 0.6476190476190476}{"eval_accuracy": 0.9346153846153846, "eval_precision": 0.7258064516129032, "eval_recall": 0.7258064516129032, "eval_f1": 0.7258064516129032}{"eval_accuracy": 0.9403846153846154, "eval_precision": 0.7719298245614035, "eval_recall": 0.7096774193548387, "eval_f1": 0.7394957983193278}{"eval_accuracy": 0.9423076923076923, "eval_precision": 0.7962962962962963, "eval_recall": 0.6935483870967742, "eval_f1": 0.7413793103448276}{"eval_accuracy": 0.9423076923076923, "eval_precision": 0.7962962962962963, "eval_recall": 0.6935483870967742, "eval_f1": 0.7413793103448276}{"eval_accuracy": 0.9280940308826918, "eval_precision": 0.8179271708683473, "eval_recall": 0.5417439703153989, "eval_f1": 0.6517857142857143}
|
log_eval_word_level.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
"Evaluate at WORD LEVEL:"{"eval_accuracy": 0.26597014925373136, "eval_precision": 0.14696370822853036, "eval_recall": 0.8279352226720648, "eval_f1": 0.24961855355508086}"Evaluate at WORD LEVEL:"{"eval_accuracy": 0.9188059701492537, "eval_precision": 0.8245614035087719, "eval_recall": 0.5708502024291497, "eval_f1": 0.6746411483253588}
|
preprocessor_config.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"chunk_length": 30,
|
3 |
+
"feature_extractor_type": "WhisperFeatureExtractor",
|
4 |
+
"feature_size": 80,
|
5 |
+
"hop_length": 160,
|
6 |
+
"n_fft": 400,
|
7 |
+
"n_samples": 480000,
|
8 |
+
"nb_max_frames": 3000,
|
9 |
+
"padding_side": "right",
|
10 |
+
"padding_value": 0.0,
|
11 |
+
"processor_class": "WhisperProcessor",
|
12 |
+
"return_attention_mask": false,
|
13 |
+
"sampling_rate": 16000
|
14 |
+
}
|
runs/Jan28_04-07-30_isl-gpu43/events.out.tfevents.1738066100.isl-gpu43.2836202.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0a272b4a909abd0071fe9e15f5a2f5f00eadbb43b0a6bb9ac2eb15f8e1fb813
|
3 |
+
size 11404
|
runs/Jan28_04-07-30_isl-gpu43/events.out.tfevents.1738066363.isl-gpu43.2836202.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93a0d3afd42012cbe3a5d1eeded3ef60e34a4e5f1c50d3bf90ab1c82e2618f47
|
3 |
+
size 590
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc4eb66cdb79b0b8227f481caccf361dbc590033a281b0b478b3588784c60019
|
3 |
+
size 5496
|
training_args.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "trained_models/whisper-small_expresso_final_before_gpt_2025_01_28__04_07_30", "overwrite_output_dir": true, "do_train": true, "do_eval": true, "do_predict": false, "eval_strategy": "steps", "prediction_loss_only": false, "per_device_train_batch_size": 2, "per_device_eval_batch_size": 4, "per_gpu_train_batch_size": null, "per_gpu_eval_batch_size": null, "gradient_accumulation_steps": 1, "eval_accumulation_steps": null, "eval_delay": 0, "torch_empty_cache_steps": null, "learning_rate": 0.0005, "weight_decay": 0.01, "adam_beta1": 0.9, "adam_beta2": 0.999, "adam_epsilon": 1e-08, "max_grad_norm": 1.0, "num_train_epochs": 2, "max_steps": -1, "lr_scheduler_type": "linear", "lr_scheduler_kwargs": {}, "warmup_ratio": 0.05, "warmup_steps": 0, "log_level": "passive", "log_level_replica": "warning", "log_on_each_node": true, "logging_dir": "trained_models/whisper-small_expresso_final_before_gpt_2025_01_28__04_07_30/runs/Jan28_04-07-30_isl-gpu43", "logging_strategy": "steps", "logging_first_step": false, "logging_steps": 10, "logging_nan_inf_filter": true, "save_strategy": "steps", "save_steps": 100, "save_total_limit": null, "save_safetensors": true, "save_on_each_node": false, "save_only_model": false, "restore_callback_states_from_checkpoint": false, "no_cuda": false, "use_cpu": false, "use_mps_device": false, "seed": 42, "data_seed": null, "jit_mode_eval": false, "use_ipex": false, "bf16": false, "fp16": false, "fp16_opt_level": "O1", "half_precision_backend": "auto", "bf16_full_eval": false, "fp16_full_eval": false, "tf32": null, "local_rank": 0, "ddp_backend": null, "tpu_num_cores": null, "tpu_metrics_debug": false, "debug": [], "dataloader_drop_last": false, "eval_steps": 20, "dataloader_num_workers": 0, "dataloader_prefetch_factor": null, "past_index": -1, "run_name": "trained_models/whisper-small_expresso_final_before_gpt_2025_01_28__04_07_30", "disable_tqdm": false, "remove_unused_columns": true, "label_names": ["labels_head", "whisper_labels", "sentence_index"], "load_best_model_at_end": false, "metric_for_best_model": null, "greater_is_better": null, "ignore_data_skip": false, "fsdp": [], "fsdp_min_num_params": 0, "fsdp_config": {"min_num_params": 0, "xla": false, "xla_fsdp_v2": false, "xla_fsdp_grad_ckpt": false}, "fsdp_transformer_layer_cls_to_wrap": null, "accelerator_config": {"split_batches": false, "dispatch_batches": null, "even_batches": true, "use_seedable_sampler": true, "non_blocking": false, "gradient_accumulation_kwargs": null}, "deepspeed": null, "label_smoothing_factor": 0.0, "optim": "adamw_torch", "optim_args": null, "adafactor": false, "group_by_length": false, "length_column_name": "length", "report_to": ["tensorboard", "wandb"], "ddp_find_unused_parameters": null, "ddp_bucket_cap_mb": null, "ddp_broadcast_buffers": null, "dataloader_pin_memory": true, "dataloader_persistent_workers": false, "skip_memory_metrics": true, "use_legacy_prediction_loop": false, "push_to_hub": false, "resume_from_checkpoint": null, "hub_model_id": null, "hub_strategy": "every_save", "hub_token": "<HUB_TOKEN>", "hub_private_repo": false, "hub_always_push": false, "gradient_checkpointing": false, "gradient_checkpointing_kwargs": null, "include_inputs_for_metrics": false, "eval_do_concat_batches": true, "fp16_backend": "auto", "evaluation_strategy": null, "push_to_hub_model_id": null, "push_to_hub_organization": null, "push_to_hub_token": "<PUSH_TO_HUB_TOKEN>", "mp_parameters": "", "auto_find_batch_size": false, "full_determinism": false, "torchdynamo": null, "ray_scope": "last", "ddp_timeout": 1800, "torch_compile": false, "torch_compile_backend": null, "torch_compile_mode": null, "dispatch_batches": null, "split_batches": null, "include_tokens_per_second": false, "include_num_input_tokens_seen": false, "neftune_noise_alpha": null, "optim_target_modules": null, "batch_eval_metrics": false, "eval_on_start": false, "use_liger_kernel": false, "eval_use_gather_object": false, "sortish_sampler": false, "predict_with_generate": false, "generation_max_length": 96, "generation_num_beams": null, "generation_config": null}
|