05/22/2023 13:20:20 - WARNING - __main__ - Process rank: 0, device: cuda:0, n_gpu: 2, distributed training: True, 16-bits training: True
05/22/2023 13:20:20 - INFO - __main__ - Training/evaluation parameters Seq2SeqTrainingArguments(
_n_gpu=2,
adafactor=False,
adam_beta1=0.9,
adam_beta2=0.999,
adam_epsilon=1e-08,
auto_find_batch_size=False,
bf16=False,
bf16_full_eval=False,
data_seed=None,
dataloader_drop_last=False,
dataloader_num_workers=0,
dataloader_pin_memory=True,
ddp_backend=None,
ddp_bucket_cap_mb=None,
ddp_find_unused_parameters=None,
ddp_timeout=1800,
debug=[],
deepspeed=None,
disable_tqdm=False,
do_eval=True,
do_predict=False,
do_train=True,
eval_accumulation_steps=None,
eval_delay=0,
eval_steps=1000,
evaluation_strategy=steps,
fp16=True,
fp16_backend=auto,
fp16_full_eval=False,
fp16_opt_level=O1,
fsdp=[],
fsdp_config={'fsdp_min_num_params': 0, 'xla': False, 'xla_fsdp_grad_ckpt': False},
fsdp_min_num_params=0,
fsdp_transformer_layer_cls_to_wrap=None,
full_determinism=False,
generation_config=None,
generation_max_length=225,
generation_num_beams=None,
gradient_accumulation_steps=8,
gradient_checkpointing=True,
greater_is_better=False,
group_by_length=False,
half_precision_backend=auto,
hub_model_id=None,
hub_private_repo=False,
hub_strategy=every_save,
hub_token=<HUB_TOKEN>,
ignore_data_skip=False,
include_inputs_for_metrics=False,
jit_mode_eval=False,
label_names=None,
label_smoothing_factor=0.0,
learning_rate=1.75e-05,
length_column_name=input_length,
load_best_model_at_end=True,
local_rank=0,
log_level=passive,
log_level_replica=warning,
log_on_each_node=True,
logging_dir=./runs/May22_13-20-19_crimv3mgpu016,
logging_first_step=False,
logging_nan_inf_filter=True,
logging_steps=25,
logging_strategy=steps,
lr_scheduler_type=linear,
max_grad_norm=1.0,
max_steps=-1,
metric_for_best_model=wer,
mp_parameters=,
no_cuda=False,
num_train_epochs=30.0,
optim=adamw_hf,
optim_args=None,
output_dir=./,
overwrite_output_dir=True,
past_index=-1,
per_device_eval_batch_size=32,
per_device_train_batch_size=32,
predict_with_generate=True,
prediction_loss_only=False,
push_to_hub=True,
push_to_hub_model_id=None,
push_to_hub_organization=None,
push_to_hub_token=<PUSH_TO_HUB_TOKEN>,
ray_scope=last,
remove_unused_columns=True,
report_to=['wandb'],
resume_from_checkpoint=None,
run_name=./,
save_on_each_node=False,
save_safetensors=False,
save_steps=1000,
save_strategy=steps,
save_total_limit=None,
seed=42,
sharded_ddp=[],
skip_memory_metrics=True,
sortish_sampler=False,
tf32=None,
torch_compile=False,
torch_compile_backend=None,
torch_compile_mode=None,
torchdynamo=None,
tpu_metrics_debug=False,
tpu_num_cores=None,
use_ipex=False,
use_legacy_prediction_loop=False,
use_mps_device=False,
warmup_ratio=0.0,
warmup_steps=4000,
weight_decay=0.0,
xpu_backend=None,
)
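For reference, here is a minimal sketch (not the full training script) of how the key arguments above could be reconstructed in code. All values are copied from the log; the comment on `gradient_accumulation_steps` works out the effective batch size (32 per device × 2 GPUs × 8 accumulation steps = 512 examples per optimizer step).

```python
from transformers import Seq2SeqTrainingArguments

training_args = Seq2SeqTrainingArguments(
    output_dir="./",
    do_train=True,
    do_eval=True,
    evaluation_strategy="steps",
    eval_steps=1000,
    save_steps=1000,
    logging_steps=25,
    learning_rate=1.75e-5,
    warmup_steps=4000,
    num_train_epochs=30,
    per_device_train_batch_size=32,
    per_device_eval_batch_size=32,
    gradient_accumulation_steps=8,   # effective train batch: 32 * 2 GPUs * 8 = 512
    gradient_checkpointing=True,
    fp16=True,
    predict_with_generate=True,
    generation_max_length=225,
    metric_for_best_model="wer",
    greater_is_better=False,         # lower WER is better
    load_best_model_at_end=True,
    push_to_hub=True,
    report_to=["wandb"],
)
```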
[INFO|configuration_utils.py:669] 2023-05-22 13:20:37,583 >> loading configuration file config.json from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/config.json
[INFO|configuration_utils.py:725] 2023-05-22 13:20:37,651 >> Model config WhisperConfig {
  "_name_or_path": "openai/whisper-small",
  "activation_dropout": 0.0,
  "activation_function": "gelu",
  "apply_spec_augment": false,
  "architectures": ["WhisperForConditionalGeneration"],
  "attention_dropout": 0.0,
  "begin_suppress_tokens": [220, 50257],
  "bos_token_id": 50257,
  "classifier_proj_size": 256,
  "d_model": 768,
  "decoder_attention_heads": 12,
  "decoder_ffn_dim": 3072,
  "decoder_layerdrop": 0.0,
  "decoder_layers": 12,
  "decoder_start_token_id": 50258,
  "dropout": 0.0,
  "encoder_attention_heads": 12,
  "encoder_ffn_dim": 3072,
  "encoder_layerdrop": 0.0,
  "encoder_layers": 12,
  "eos_token_id": 50257,
  "forced_decoder_ids": [[1, 50259], [2, 50359], [3, 50363]],
  "init_std": 0.02,
  "is_encoder_decoder": true,
  "mask_feature_length": 10,
  "mask_feature_min_masks": 0,
  "mask_feature_prob": 0.0,
  "mask_time_length": 10,
  "mask_time_min_masks": 2,
  "mask_time_prob": 0.05,
  "max_length": 448,
  "max_source_positions": 1500,
  "max_target_positions": 448,
  "model_type": "whisper",
  "num_hidden_layers": 12,
  "num_mel_bins": 80,
  "pad_token_id": 50257,
  "scale_embedding": false,
  "suppress_tokens": [1, 2, 7, 8, 9, 10, 14, 25, 26, 27, 28, 29, 31, 58, 59, 60, 61, 62, 63, 90, 91, 92, 93, 359, 503, 522, 542, 873, 893, 902, 918, 922, 931, 1350, 1853, 1982, 2460, 2627, 3246, 3253, 3268, 3536, 3846, 3961, 4183, 4667, 6585, 6647, 7273, 9061, 9383, 10428, 10929, 11938, 12033, 12331, 12562, 13793, 14157, 14635, 15265, 15618, 16553, 16604, 18362, 18956, 20075, 21675, 22520, 26130, 26161, 26435, 28279, 29464, 31650, 32302, 32470, 36865, 42863, 47425, 49870, 50254, 50258, 50360, 50361, 50362],
  "torch_dtype": "float32",
  "transformers_version": "4.29.0.dev0",
  "use_cache": true,
  "use_weighted_layer_sum": false,
  "vocab_size": 51865
}
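These dimensions (d_model = 768, 12 encoder and 12 decoder layers, 80 mel bins, vocab of 51,865) identify the ~244M-parameter `small` multilingual checkpoint. A quick way to confirm them, assuming Hub access or a warm local cache:

```python
# Sanity-check the logged dimensions against the published config.
from transformers import WhisperConfig

config = WhisperConfig.from_pretrained("openai/whisper-small")
print(config.d_model, config.encoder_layers, config.decoder_layers)  # 768 12 12
print(config.num_mel_bins, config.vocab_size)                        # 80 51865
```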
[INFO|feature_extraction_utils.py:469] 2023-05-22 13:20:37,926 >> loading configuration file preprocessor_config.json from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/preprocessor_config.json
[INFO|feature_extraction_utils.py:511] 2023-05-22 13:20:37,955 >> Feature extractor WhisperFeatureExtractor {
  "chunk_length": 30,
  "feature_extractor_type": "WhisperFeatureExtractor",
  "feature_size": 80,
  "hop_length": 160,
  "n_fft": 400,
  "n_samples": 480000,
  "nb_max_frames": 3000,
  "padding_side": "right",
  "padding_value": 0.0,
  "processor_class": "WhisperProcessor",
  "return_attention_mask": false,
  "sampling_rate": 16000
}
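The derived fields here follow directly from the base audio settings: a 30 s window at 16 kHz is 480,000 samples, and a 160-sample hop yields 3,000 log-mel frames per window. A one-line check:

```python
# Derived feature-extractor fields from the base settings above.
chunk_length = 30        # seconds per padded input window
sampling_rate = 16_000   # Hz
hop_length = 160         # samples between successive STFT frames

n_samples = chunk_length * sampling_rate  # 480000 samples per window
nb_max_frames = n_samples // hop_length   # 3000 log-mel frames per window
print(n_samples, nb_max_frames)
```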
[INFO|tokenization_utils_base.py:1810] 2023-05-22 13:20:38,269 >> loading file vocab.json from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/vocab.json
[INFO|tokenization_utils_base.py:1810] 2023-05-22 13:20:38,269 >> loading file tokenizer.json from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/tokenizer.json
[INFO|tokenization_utils_base.py:1810] 2023-05-22 13:20:38,269 >> loading file merges.txt from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/merges.txt
[INFO|tokenization_utils_base.py:1810] 2023-05-22 13:20:38,269 >> loading file normalizer.json from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/normalizer.json
[INFO|tokenization_utils_base.py:1810] 2023-05-22 13:20:38,269 >> loading file added_tokens.json from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/added_tokens.json
[INFO|tokenization_utils_base.py:1810] 2023-05-22 13:20:38,269 >> loading file special_tokens_map.json from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/special_tokens_map.json
[INFO|tokenization_utils_base.py:1810] 2023-05-22 13:20:38,269 >> loading file tokenizer_config.json from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/tokenizer_config.json
[INFO|modeling_utils.py:2542] 2023-05-22 13:20:38,651 >> loading weights file pytorch_model.bin from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/pytorch_model.bin
[INFO|configuration_utils.py:577] 2023-05-22 13:20:47,050 >> Generate config GenerationConfig {
  "_from_model_config": true,
  "begin_suppress_tokens": [220, 50257],
  "bos_token_id": 50257,
  "decoder_start_token_id": 50258,
  "eos_token_id": 50257,
  "max_length": 448,
  "pad_token_id": 50257,
  "transformers_version": "4.29.0.dev0",
  "use_cache": false
}
[INFO|modeling_utils.py:3211] 2023-05-22 13:20:49,666 >> All model checkpoint weights were used when initializing WhisperForConditionalGeneration.
[INFO|modeling_utils.py:3219] 2023-05-22 13:20:49,666 >> All the weights of WhisperForConditionalGeneration were initialized from the model checkpoint at openai/whisper-small.
If your task is similar to the task the model of the checkpoint was trained on, you can already use WhisperForConditionalGeneration for predictions without further training.
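As the message above notes, the checkpoint is usable for inference as-is. A hedged sketch of zero-shot transcription, where a one-second array of silence stands in for real 16 kHz audio:

```python
import numpy as np
import torch
from transformers import WhisperForConditionalGeneration, WhisperProcessor

processor = WhisperProcessor.from_pretrained("openai/whisper-small")
model = WhisperForConditionalGeneration.from_pretrained("openai/whisper-small")

audio = np.zeros(16_000, dtype=np.float32)  # placeholder: 1 s of silence at 16 kHz
inputs = processor(audio, sampling_rate=16_000, return_tensors="pt")
with torch.no_grad():
    generated_ids = model.generate(input_features=inputs.input_features, max_length=225)
print(processor.batch_decode(generated_ids, skip_special_tokens=True)[0])
```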
[INFO|configuration_utils.py:539] 2023-05-22 13:20:50,330 >> loading configuration file generation_config.json from cache at /home/local/QCRI/dizham/.cache/huggingface/hub/models--openai--whisper-small/snapshots/f6744499d1eba717bcf4d6be735e3d386ffb60ad/generation_config.json
[INFO|configuration_utils.py:577] 2023-05-22 13:20:50,331 >> Generate config GenerationConfig {
  "begin_suppress_tokens": [220, 50257],
  "bos_token_id": 50257,
  "decoder_start_token_id": 50258,
  "eos_token_id": 50257,
  "forced_decoder_ids": [[1, null], [2, 50359]],
  "is_multilingual": true,
  "lang_to_id": {
    "<|af|>": 50327, "<|am|>": 50334, "<|ar|>": 50272, "<|as|>": 50350, "<|az|>": 50304,
    "<|ba|>": 50355, "<|be|>": 50330, "<|bg|>": 50292, "<|bn|>": 50302, "<|bo|>": 50347,
    "<|br|>": 50309, "<|bs|>": 50315, "<|ca|>": 50270, "<|cs|>": 50283, "<|cy|>": 50297,
    "<|da|>": 50285, "<|de|>": 50261, "<|el|>": 50281, "<|en|>": 50259, "<|es|>": 50262,
    "<|et|>": 50307, "<|eu|>": 50310, "<|fa|>": 50300, "<|fi|>": 50277, "<|fo|>": 50338,
    "<|fr|>": 50265, "<|gl|>": 50319, "<|gu|>": 50333, "<|haw|>": 50352, "<|ha|>": 50354,
    "<|he|>": 50279, "<|hi|>": 50276, "<|hr|>": 50291, "<|ht|>": 50339, "<|hu|>": 50286,
    "<|hy|>": 50312, "<|id|>": 50275, "<|is|>": 50311, "<|it|>": 50274, "<|ja|>": 50266,
    "<|jw|>": 50356, "<|ka|>": 50329, "<|kk|>": 50316, "<|km|>": 50323, "<|kn|>": 50306,
    "<|ko|>": 50264, "<|la|>": 50294, "<|lb|>": 50345, "<|ln|>": 50353, "<|lo|>": 50336,
    "<|lt|>": 50293, "<|lv|>": 50301, "<|mg|>": 50349, "<|mi|>": 50295, "<|mk|>": 50308,
    "<|ml|>": 50296, "<|mn|>": 50314, "<|mr|>": 50320, "<|ms|>": 50282, "<|mt|>": 50343,
    "<|my|>": 50346, "<|ne|>": 50313, "<|nl|>": 50271, "<|nn|>": 50342, "<|no|>": 50288,
    "<|oc|>": 50328, "<|pa|>": 50321, "<|pl|>": 50269, "<|ps|>": 50340, "<|pt|>": 50267,
    "<|ro|>": 50284, "<|ru|>": 50263, "<|sa|>": 50344, "<|sd|>": 50332, "<|si|>": 50322,
    "<|sk|>": 50298, "<|sl|>": 50305, "<|sn|>": 50324, "<|so|>": 50326, "<|sq|>": 50317,
    "<|sr|>": 50303, "<|su|>": 50357, "<|sv|>": 50273, "<|sw|>": 50318, "<|ta|>": 50287,
    "<|te|>": 50299, "<|tg|>": 50331, "<|th|>": 50289, "<|tk|>": 50341, "<|tl|>": 50348,
    "<|tr|>": 50268, "<|tt|>": 50351, "<|uk|>": 50280, "<|ur|>": 50290, "<|uz|>": 50337,
    "<|vi|>": 50278, "<|yi|>": 50335, "<|yo|>": 50325, "<|zh|>": 50260
  },
  "max_initial_timestamp_index": 1,
  "max_length": 448,
  "no_timestamps_token_id": 50363,
  "pad_token_id": 50257,
  "return_timestamps": false,
  "suppress_tokens": [1, 2, 7, 8, 9, 10, 14, 25, 26, 27, 28, 29, 31, 58, 59, 60, 61, 62, 63, 90, 91, 92, 93, 359, 503, 522, 542, 873, 893, 902, 918, 922, 931, 1350, 1853, 1982, 2460, 2627, 3246, 3253, 3268, 3536, 3846, 3961, 4183, 4667, 6585, 6647, 7273, 9061, 9383, 10428, 10929, 11938, 12033, 12331, 12562, 13793, 14157, 14635, 15265, 15618, 16553, 16604, 18362, 18956, 20075, 21675, 22520, 26130, 26161, 26435, 28279, 29464, 31650, 32302, 32470, 36865, 42863, 47425, 49870, 50254, 50258, 50358, 50359, 50360, 50361, 50362],
  "task_to_id": {"transcribe": 50359, "translate": 50358},
  "transformers_version": "4.29.0.dev0"
}
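The `lang_to_id` and `task_to_id` maps above are what populate `forced_decoder_ids` at generation time; the `null` in slot 1 means the language token is filled in at run time. For an Arabic transcription run like this one, a sketch of the prompt the processor would force (using the real `get_decoder_prompt_ids` helper):

```python
from transformers import WhisperProcessor

processor = WhisperProcessor.from_pretrained("openai/whisper-small")
prompt_ids = processor.get_decoder_prompt_ids(language="arabic", task="transcribe")
# Expected: [(1, 50272), (2, 50359), (3, 50363)]
#   50272 = <|ar|>, 50359 = <|transcribe|>, 50363 = <|notimestamps|>
print(prompt_ids)
```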
[INFO|feature_extraction_utils.py:369] 2023-05-22 13:20:52,959 >> Feature extractor saved in ./preprocessor_config.json
[INFO|tokenization_utils_base.py:2181] 2023-05-22 13:20:52,962 >> tokenizer config file saved in ./tokenizer_config.json
[INFO|tokenization_utils_base.py:2188] 2023-05-22 13:20:52,965 >> Special tokens file saved in ./special_tokens_map.json
[INFO|configuration_utils.py:458] 2023-05-22 13:20:53,103 >> Configuration saved in ./config.json
[INFO|image_processing_utils.py:307] 2023-05-22 13:20:53,104 >> loading configuration file ./preprocessor_config.json
[INFO|feature_extraction_utils.py:467] 2023-05-22 13:20:53,134 >> loading configuration file ./preprocessor_config.json
[INFO|feature_extraction_utils.py:511] 2023-05-22 13:20:53,135 >> Feature extractor WhisperFeatureExtractor {
  "chunk_length": 30,
  "feature_extractor_type": "WhisperFeatureExtractor",
  "feature_size": 80,
  "hop_length": 160,
  "n_fft": 400,
  "n_samples": 480000,
  "nb_max_frames": 3000,
  "padding_side": "right",
  "padding_value": 0.0,
  "processor_class": "WhisperProcessor",
  "return_attention_mask": false,
  "sampling_rate": 16000
}
[INFO|tokenization_utils_base.py:1808] 2023-05-22 13:20:53,136 >> loading file vocab.json
[INFO|tokenization_utils_base.py:1808] 2023-05-22 13:20:53,136 >> loading file tokenizer.json
[INFO|tokenization_utils_base.py:1808] 2023-05-22 13:20:53,136 >> loading file merges.txt
[INFO|tokenization_utils_base.py:1808] 2023-05-22 13:20:53,136 >> loading file normalizer.json
[INFO|tokenization_utils_base.py:1808] 2023-05-22 13:20:53,136 >> loading file added_tokens.json
[INFO|tokenization_utils_base.py:1808] 2023-05-22 13:20:53,136 >> loading file special_tokens_map.json
[INFO|tokenization_utils_base.py:1808] 2023-05-22 13:20:53,136 >> loading file tokenizer_config.json
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,201 >> Adding <|startoftranscript|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,201 >> Adding <|en|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|zh|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|de|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|es|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|ru|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|ko|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|fr|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|ja|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|pt|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|tr|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|pl|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|ca|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|nl|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|ar|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|sv|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|it|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|id|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|hi|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|fi|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|vi|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|he|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|uk|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|el|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|ms|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|cs|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|ro|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|da|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|hu|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|ta|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|no|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|th|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|ur|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|hr|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|bg|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|lt|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|la|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|mi|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|ml|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|cy|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|sk|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,202 >> Adding <|te|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|fa|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|lv|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|bn|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|sr|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|az|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|sl|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|kn|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|et|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|mk|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|br|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|eu|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|is|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|hy|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|ne|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|mn|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|bs|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|kk|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|sq|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|sw|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|gl|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|mr|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|pa|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|si|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|km|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|sn|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|yo|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|so|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|af|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|oc|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|ka|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|be|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|tg|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|sd|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|gu|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|am|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|yi|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|lo|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|uz|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|fo|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|ht|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,203 >> Adding <|ps|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|tk|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|nn|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|mt|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|sa|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|lb|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|my|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|bo|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|tl|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|mg|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|as|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|tt|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|haw|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|ln|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|ha|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|ba|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|jw|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|su|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|translate|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|transcribe|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|startoflm|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|startofprev|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|nocaptions|> to the vocabulary
[INFO|tokenization_utils.py:426] 2023-05-22 13:20:53,204 >> Adding <|notimestamps|> to the vocabulary
05/22/2023 13:21:02 - WARNING - huggingface_hub.repository - /home/local/QCRI/dizham/kanari/whisper/whisper-small-ar/./ is already a clone of https://huggingface.co/danielizham/whisper-small-ar. Make sure you pull the latest changes with `repo.git_pull()`.
Traceback (most recent call last):
  File "/home/local/QCRI/dizham/miniconda3/envs/whisper/lib/python3.9/site-packages/huggingface_hub/repository.py", line 987, in git_pull
    result = run_subprocess(command, self.local_dir)
  File "/home/local/QCRI/dizham/miniconda3/envs/whisper/lib/python3.9/site-packages/huggingface_hub/utils/_subprocess.py", line 83, in run_subprocess
    return subprocess.run(
  File "/home/local/QCRI/dizham/miniconda3/envs/whisper/lib/python3.9/subprocess.py", line 528, in run
    raise CalledProcessError(retcode, process.args,
subprocess.CalledProcessError: Command '['git', 'pull']' returned non-zero exit status 128.

During handling of the above exception, another exception occurred:

Traceback (most recent call last):
  File "/home/local/QCRI/dizham/kanari/whisper/whisper-small-ar/run_speech_recognition_seq2seq_streaming.py", line 629, in <module>
    main()
  File "/home/local/QCRI/dizham/kanari/whisper/whisper-small-ar/run_speech_recognition_seq2seq_streaming.py", line 560, in main
    trainer = Seq2SeqTrainer(
  File "/home/local/QCRI/dizham/miniconda3/envs/whisper/lib/python3.9/site-packages/transformers/trainer_seq2seq.py", line 56, in __init__
    super().__init__(
  File "/home/local/QCRI/dizham/miniconda3/envs/whisper/lib/python3.9/site-packages/transformers/trainer.py", line 551, in __init__
    self.init_git_repo(at_init=True)
  File "/home/local/QCRI/dizham/miniconda3/envs/whisper/lib/python3.9/site-packages/transformers/trainer.py", line 3516, in init_git_repo
    self.repo.git_pull()
  File "/home/local/QCRI/dizham/miniconda3/envs/whisper/lib/python3.9/site-packages/huggingface_hub/repository.py", line 990, in git_pull
    raise EnvironmentError(exc.stderr)
OSError: error: cannot pull with rebase: You have unstaged changes.
error: please commit or stash them.
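The root cause: with `push_to_hub=True`, `Trainer.init_git_repo` runs a rebasing `git pull` inside `output_dir` (`./`), and that fails because the working tree has unstaged edits. One possible remedy (an assumption, not something the log shows) is to commit or stash those edits before relaunching; a minimal Python sketch:

```python
# Hypothetical cleanup before re-running training: stash (or commit) the
# unstaged changes in the output directory so the rebasing pull can succeed.
import subprocess

repo_dir = "/home/local/QCRI/dizham/kanari/whisper/whisper-small-ar"
subprocess.run(["git", "status", "--short"], cwd=repo_dir, check=True)  # inspect what changed
subprocess.run(["git", "stash"], cwd=repo_dir, check=True)              # or: git add -A && git commit -m "wip"
```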