|
2024-09-09 11:53:51.396276: I tensorflow/core/util/port.cc:153] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`. |
|
2024-09-09 11:53:51.414891: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:485] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered |
|
2024-09-09 11:53:51.436268: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:8454] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered |
|
2024-09-09 11:53:51.442683: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1452] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered |
|
2024-09-09 11:53:51.458047: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations. |
|
To enable the following instructions: AVX2 AVX512F AVX512_VNNI FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags. |
|
2024-09-09 11:53:52.683988: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT |
|
/usr/local/lib/python3.10/dist-packages/transformers/training_args.py:1525: FutureWarning: `evaluation_strategy` is deprecated and will be removed in version 4.46 of π€ Transformers. Use `eval_strategy` instead |
|
warnings.warn( |
|
09/09/2024 11:53:54 - WARNING - __main__ - Process rank: 0, device: cuda:0, n_gpu: 1distributed training: True, 16-bits training: False |
|
09/09/2024 11:53:54 - INFO - __main__ - Training/evaluation parameters TrainingArguments( |
|
_n_gpu=1, |
|
accelerator_config={'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None, 'use_configured_state': False}, |
|
adafactor=False, |
|
adam_beta1=0.9, |
|
adam_beta2=0.999, |
|
adam_epsilon=1e-08, |
|
auto_find_batch_size=False, |
|
batch_eval_metrics=False, |
|
bf16=False, |
|
bf16_full_eval=False, |
|
data_seed=None, |
|
dataloader_drop_last=False, |
|
dataloader_num_workers=0, |
|
dataloader_persistent_workers=False, |
|
dataloader_pin_memory=True, |
|
dataloader_prefetch_factor=None, |
|
ddp_backend=None, |
|
ddp_broadcast_buffers=None, |
|
ddp_bucket_cap_mb=None, |
|
ddp_find_unused_parameters=None, |
|
ddp_timeout=1800, |
|
debug=[], |
|
deepspeed=None, |
|
disable_tqdm=False, |
|
dispatch_batches=None, |
|
do_eval=True, |
|
do_predict=True, |
|
do_train=True, |
|
eval_accumulation_steps=None, |
|
eval_delay=0, |
|
eval_do_concat_batches=True, |
|
eval_on_start=False, |
|
eval_steps=None, |
|
eval_strategy=epoch, |
|
eval_use_gather_object=False, |
|
evaluation_strategy=epoch, |
|
fp16=False, |
|
fp16_backend=auto, |
|
fp16_full_eval=False, |
|
fp16_opt_level=O1, |
|
fsdp=[], |
|
fsdp_config={'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, |
|
fsdp_min_num_params=0, |
|
fsdp_transformer_layer_cls_to_wrap=None, |
|
full_determinism=False, |
|
gradient_accumulation_steps=2, |
|
gradient_checkpointing=False, |
|
gradient_checkpointing_kwargs=None, |
|
greater_is_better=True, |
|
group_by_length=False, |
|
half_precision_backend=auto, |
|
hub_always_push=False, |
|
hub_model_id=None, |
|
hub_private_repo=False, |
|
hub_strategy=every_save, |
|
hub_token=<HUB_TOKEN>, |
|
ignore_data_skip=False, |
|
include_inputs_for_metrics=False, |
|
include_num_input_tokens_seen=False, |
|
include_tokens_per_second=False, |
|
jit_mode_eval=False, |
|
label_names=None, |
|
label_smoothing_factor=0.0, |
|
learning_rate=5e-05, |
|
length_column_name=length, |
|
load_best_model_at_end=True, |
|
local_rank=0, |
|
log_level=passive, |
|
log_level_replica=warning, |
|
log_on_each_node=True, |
|
logging_dir=/content/dissertation/scripts/ner/output/tb, |
|
logging_first_step=False, |
|
logging_nan_inf_filter=True, |
|
logging_steps=500, |
|
logging_strategy=steps, |
|
lr_scheduler_kwargs={}, |
|
lr_scheduler_type=linear, |
|
max_grad_norm=1.0, |
|
max_steps=-1, |
|
metric_for_best_model=f1, |
|
mp_parameters=, |
|
neftune_noise_alpha=None, |
|
no_cuda=False, |
|
num_train_epochs=10.0, |
|
optim=adamw_torch, |
|
optim_args=None, |
|
optim_target_modules=None, |
|
output_dir=/content/dissertation/scripts/ner/output, |
|
overwrite_output_dir=True, |
|
past_index=-1, |
|
per_device_eval_batch_size=8, |
|
per_device_train_batch_size=32, |
|
prediction_loss_only=False, |
|
push_to_hub=True, |
|
push_to_hub_model_id=None, |
|
push_to_hub_organization=None, |
|
push_to_hub_token=<PUSH_TO_HUB_TOKEN>, |
|
ray_scope=last, |
|
remove_unused_columns=True, |
|
report_to=['tensorboard'], |
|
restore_callback_states_from_checkpoint=False, |
|
resume_from_checkpoint=None, |
|
run_name=/content/dissertation/scripts/ner/output, |
|
save_on_each_node=False, |
|
save_only_model=False, |
|
save_safetensors=True, |
|
save_steps=500, |
|
save_strategy=epoch, |
|
save_total_limit=None, |
|
seed=42, |
|
skip_memory_metrics=True, |
|
split_batches=None, |
|
tf32=None, |
|
torch_compile=False, |
|
torch_compile_backend=None, |
|
torch_compile_mode=None, |
|
torch_empty_cache_steps=None, |
|
torchdynamo=None, |
|
tpu_metrics_debug=False, |
|
tpu_num_cores=None, |
|
use_cpu=False, |
|
use_ipex=False, |
|
use_legacy_prediction_loop=False, |
|
use_mps_device=False, |
|
warmup_ratio=0.0, |
|
warmup_steps=0, |
|
weight_decay=0.0, |
|
) |
|
Downloading builder script: 0%| | 0.00/3.91k [00:00<?, ?B/s]
Downloading builder script: 100%|ββββββββββ| 3.91k/3.91k [00:00<00:00, 16.3kB/s]
Downloading builder script: 100%|ββββββββββ| 3.91k/3.91k [00:00<00:00, 16.3kB/s] |
|
Downloading data: 0%| | 0.00/16.7M [00:00<?, ?B/s]
Downloading data: 63%|βββββββ | 10.5M/16.7M [00:01<00:00, 8.91MB/s]
Downloading data: 100%|ββββββββββ| 16.7M/16.7M [00:01<00:00, 10.8MB/s]
Downloading data: 100%|ββββββββββ| 16.7M/16.7M [00:01<00:00, 10.3MB/s] |
|
Downloading data: 0%| | 0.00/2.93M [00:00<?, ?B/s]
Downloading data: 100%|ββββββββββ| 2.93M/2.93M [00:00<00:00, 3.11MB/s]
Downloading data: 100%|ββββββββββ| 2.93M/2.93M [00:00<00:00, 3.10MB/s] |
|
Downloading data: 0%| | 0.00/4.78M [00:00<?, ?B/s]
Downloading data: 100%|ββββββββββ| 4.78M/4.78M [00:00<00:00, 8.75MB/s]
Downloading data: 100%|ββββββββββ| 4.78M/4.78M [00:00<00:00, 8.68MB/s] |
|
Generating train split: 0 examples [00:00, ? examples/s]
Generating train split: 537 examples [00:00, 5349.78 examples/s]
Generating train split: 1338 examples [00:00, 5336.76 examples/s]
Generating train split: 1909 examples [00:00, 5477.50 examples/s]
Generating train split: 2673 examples [00:00, 5295.71 examples/s]
Generating train split: 3214 examples [00:00, 5326.77 examples/s]
Generating train split: 3802 examples [00:00, 5490.78 examples/s]
Generating train split: 4648 examples [00:00, 5544.17 examples/s]
Generating train split: 5441 examples [00:01, 5446.84 examples/s]
Generating train split: 6000 examples [00:01, 5423.79 examples/s]
Generating train split: 6638 examples [00:01, 5671.92 examples/s]
Generating train split: 7486 examples [00:01, 5659.27 examples/s]
Generating train split: 8305 examples [00:01, 5558.03 examples/s]
Generating train split: 8896 examples [00:01, 5641.52 examples/s]
Generating train split: 9716 examples [00:01, 5576.75 examples/s]
Generating train split: 10314 examples [00:01, 5538.16 examples/s]
Generating train split: 10920 examples [00:01, 5664.12 examples/s]
Generating train split: 11728 examples [00:02, 5559.92 examples/s]
Generating train split: 12300 examples [00:02, 5487.24 examples/s]
Generating train split: 12899 examples [00:02, 5616.31 examples/s]
Generating train split: 13013 examples [00:02, 5514.63 examples/s] |
|
Generating validation split: 0 examples [00:00, ? examples/s]
Generating validation split: 656 examples [00:00, 6542.30 examples/s]
Generating validation split: 1537 examples [00:00, 6076.82 examples/s]
Generating validation split: 2406 examples [00:00, 5933.67 examples/s]
Generating validation split: 2519 examples [00:00, 5905.73 examples/s] |
|
Generating test split: 0 examples [00:00, ? examples/s]
Generating test split: 650 examples [00:00, 6476.60 examples/s]
Generating test split: 1528 examples [00:00, 6042.87 examples/s]
Generating test split: 2370 examples [00:00, 5828.00 examples/s]
Generating test split: 2999 examples [00:00, 5972.57 examples/s]
Generating test split: 3867 examples [00:00, 5889.51 examples/s]
Generating test split: 4047 examples [00:00, 5842.24 examples/s] |
|
[INFO|configuration_utils.py:733] 2024-09-09 11:54:06,987 >> loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--PlanTL-GOB-ES--bsc-bio-ehr-es/snapshots/1e543adb2d21f19d85a89305eebdbd64ab656b99/config.json |
|
[INFO|configuration_utils.py:800] 2024-09-09 11:54:06,991 >> Model config RobertaConfig { |
|
"_name_or_path": "PlanTL-GOB-ES/bsc-bio-ehr-es", |
|
"architectures": [ |
|
"RobertaForMaskedLM" |
|
], |
|
"attention_probs_dropout_prob": 0.1, |
|
"bos_token_id": 0, |
|
"classifier_dropout": null, |
|
"eos_token_id": 2, |
|
"finetuning_task": "ner", |
|
"gradient_checkpointing": false, |
|
"hidden_act": "gelu", |
|
"hidden_dropout_prob": 0.1, |
|
"hidden_size": 768, |
|
"id2label": { |
|
"0": "O", |
|
"1": "B-SINTOMA", |
|
"2": "I-SINTOMA" |
|
}, |
|
"initializer_range": 0.02, |
|
"intermediate_size": 3072, |
|
"label2id": { |
|
"B-SINTOMA": 1, |
|
"I-SINTOMA": 2, |
|
"O": 0 |
|
}, |
|
"layer_norm_eps": 1e-05, |
|
"max_position_embeddings": 514, |
|
"model_type": "roberta", |
|
"num_attention_heads": 12, |
|
"num_hidden_layers": 12, |
|
"pad_token_id": 1, |
|
"position_embedding_type": "absolute", |
|
"transformers_version": "4.44.2", |
|
"type_vocab_size": 1, |
|
"use_cache": true, |
|
"vocab_size": 50262 |
|
} |
|
|
|
[INFO|configuration_utils.py:733] 2024-09-09 11:54:07,264 >> loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--PlanTL-GOB-ES--bsc-bio-ehr-es/snapshots/1e543adb2d21f19d85a89305eebdbd64ab656b99/config.json |
|
[INFO|configuration_utils.py:800] 2024-09-09 11:54:07,265 >> Model config RobertaConfig { |
|
"_name_or_path": "PlanTL-GOB-ES/bsc-bio-ehr-es", |
|
"architectures": [ |
|
"RobertaForMaskedLM" |
|
], |
|
"attention_probs_dropout_prob": 0.1, |
|
"bos_token_id": 0, |
|
"classifier_dropout": null, |
|
"eos_token_id": 2, |
|
"gradient_checkpointing": false, |
|
"hidden_act": "gelu", |
|
"hidden_dropout_prob": 0.1, |
|
"hidden_size": 768, |
|
"initializer_range": 0.02, |
|
"intermediate_size": 3072, |
|
"layer_norm_eps": 1e-05, |
|
"max_position_embeddings": 514, |
|
"model_type": "roberta", |
|
"num_attention_heads": 12, |
|
"num_hidden_layers": 12, |
|
"pad_token_id": 1, |
|
"position_embedding_type": "absolute", |
|
"transformers_version": "4.44.2", |
|
"type_vocab_size": 1, |
|
"use_cache": true, |
|
"vocab_size": 50262 |
|
} |
|
|
|
[INFO|tokenization_utils_base.py:2269] 2024-09-09 11:54:07,275 >> loading file vocab.json from cache at /root/.cache/huggingface/hub/models--PlanTL-GOB-ES--bsc-bio-ehr-es/snapshots/1e543adb2d21f19d85a89305eebdbd64ab656b99/vocab.json |
|
[INFO|tokenization_utils_base.py:2269] 2024-09-09 11:54:07,275 >> loading file merges.txt from cache at /root/.cache/huggingface/hub/models--PlanTL-GOB-ES--bsc-bio-ehr-es/snapshots/1e543adb2d21f19d85a89305eebdbd64ab656b99/merges.txt |
|
[INFO|tokenization_utils_base.py:2269] 2024-09-09 11:54:07,275 >> loading file tokenizer.json from cache at None |
|
[INFO|tokenization_utils_base.py:2269] 2024-09-09 11:54:07,275 >> loading file added_tokens.json from cache at None |
|
[INFO|tokenization_utils_base.py:2269] 2024-09-09 11:54:07,275 >> loading file special_tokens_map.json from cache at /root/.cache/huggingface/hub/models--PlanTL-GOB-ES--bsc-bio-ehr-es/snapshots/1e543adb2d21f19d85a89305eebdbd64ab656b99/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2269] 2024-09-09 11:54:07,275 >> loading file tokenizer_config.json from cache at /root/.cache/huggingface/hub/models--PlanTL-GOB-ES--bsc-bio-ehr-es/snapshots/1e543adb2d21f19d85a89305eebdbd64ab656b99/tokenizer_config.json |
|
[INFO|configuration_utils.py:733] 2024-09-09 11:54:07,275 >> loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--PlanTL-GOB-ES--bsc-bio-ehr-es/snapshots/1e543adb2d21f19d85a89305eebdbd64ab656b99/config.json |
|
[INFO|configuration_utils.py:800] 2024-09-09 11:54:07,276 >> Model config RobertaConfig { |
|
"_name_or_path": "PlanTL-GOB-ES/bsc-bio-ehr-es", |
|
"architectures": [ |
|
"RobertaForMaskedLM" |
|
], |
|
"attention_probs_dropout_prob": 0.1, |
|
"bos_token_id": 0, |
|
"classifier_dropout": null, |
|
"eos_token_id": 2, |
|
"gradient_checkpointing": false, |
|
"hidden_act": "gelu", |
|
"hidden_dropout_prob": 0.1, |
|
"hidden_size": 768, |
|
"initializer_range": 0.02, |
|
"intermediate_size": 3072, |
|
"layer_norm_eps": 1e-05, |
|
"max_position_embeddings": 514, |
|
"model_type": "roberta", |
|
"num_attention_heads": 12, |
|
"num_hidden_layers": 12, |
|
"pad_token_id": 1, |
|
"position_embedding_type": "absolute", |
|
"transformers_version": "4.44.2", |
|
"type_vocab_size": 1, |
|
"use_cache": true, |
|
"vocab_size": 50262 |
|
} |
|
|
|
/usr/local/lib/python3.10/dist-packages/transformers/tokenization_utils_base.py:1601: FutureWarning: `clean_up_tokenization_spaces` was not set. It will be set to `True` by default. This behavior will be depracted in transformers v4.45, and will be then set to `False` by default. For more details check this issue: https://github.com/huggingface/transformers/issues/31884 |
|
warnings.warn( |
|
[INFO|configuration_utils.py:733] 2024-09-09 11:54:07,353 >> loading configuration file config.json from cache at /root/.cache/huggingface/hub/models--PlanTL-GOB-ES--bsc-bio-ehr-es/snapshots/1e543adb2d21f19d85a89305eebdbd64ab656b99/config.json |
|
[INFO|configuration_utils.py:800] 2024-09-09 11:54:07,354 >> Model config RobertaConfig { |
|
"_name_or_path": "PlanTL-GOB-ES/bsc-bio-ehr-es", |
|
"architectures": [ |
|
"RobertaForMaskedLM" |
|
], |
|
"attention_probs_dropout_prob": 0.1, |
|
"bos_token_id": 0, |
|
"classifier_dropout": null, |
|
"eos_token_id": 2, |
|
"gradient_checkpointing": false, |
|
"hidden_act": "gelu", |
|
"hidden_dropout_prob": 0.1, |
|
"hidden_size": 768, |
|
"initializer_range": 0.02, |
|
"intermediate_size": 3072, |
|
"layer_norm_eps": 1e-05, |
|
"max_position_embeddings": 514, |
|
"model_type": "roberta", |
|
"num_attention_heads": 12, |
|
"num_hidden_layers": 12, |
|
"pad_token_id": 1, |
|
"position_embedding_type": "absolute", |
|
"transformers_version": "4.44.2", |
|
"type_vocab_size": 1, |
|
"use_cache": true, |
|
"vocab_size": 50262 |
|
} |
|
|
|
[INFO|modeling_utils.py:3678] 2024-09-09 11:54:07,676 >> loading weights file pytorch_model.bin from cache at /root/.cache/huggingface/hub/models--PlanTL-GOB-ES--bsc-bio-ehr-es/snapshots/1e543adb2d21f19d85a89305eebdbd64ab656b99/pytorch_model.bin |
|
[INFO|modeling_utils.py:4497] 2024-09-09 11:54:07,755 >> Some weights of the model checkpoint at PlanTL-GOB-ES/bsc-bio-ehr-es were not used when initializing RobertaForTokenClassification: ['lm_head.bias', 'lm_head.decoder.bias', 'lm_head.decoder.weight', 'lm_head.dense.bias', 'lm_head.dense.weight', 'lm_head.layer_norm.bias', 'lm_head.layer_norm.weight'] |
|
- This IS expected if you are initializing RobertaForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model). |
|
- This IS NOT expected if you are initializing RobertaForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model). |
|
[WARNING|modeling_utils.py:4509] 2024-09-09 11:54:07,755 >> Some weights of RobertaForTokenClassification were not initialized from the model checkpoint at PlanTL-GOB-ES/bsc-bio-ehr-es and are newly initialized: ['classifier.bias', 'classifier.weight'] |
|
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference. |
|
Map: 0%| | 0/13013 [00:00<?, ? examples/s]
Map: 8%|β | 1000/13013 [00:00<00:03, 3034.27 examples/s]
Map: 15%|ββ | 2000/13013 [00:00<00:02, 4988.47 examples/s]
Map: 23%|βββ | 3000/13013 [00:00<00:01, 6230.88 examples/s]
Map: 31%|βββ | 4000/13013 [00:00<00:01, 7209.92 examples/s]
Map: 38%|ββββ | 5000/13013 [00:00<00:01, 7950.65 examples/s]
Map: 46%|βββββ | 6000/13013 [00:00<00:00, 8369.02 examples/s]
Map: 54%|ββββββ | 7000/13013 [00:00<00:00, 8728.71 examples/s]
Map: 61%|βββββββ | 8000/13013 [00:01<00:00, 8875.35 examples/s]
Map: 69%|βββββββ | 9000/13013 [00:01<00:00, 8980.49 examples/s]
Map: 77%|ββββββββ | 10000/13013 [00:01<00:00, 9061.70 examples/s]
Map: 85%|βββββββββ | 11000/13013 [00:01<00:00, 9201.45 examples/s]
Map: 92%|ββββββββββ| 12000/13013 [00:01<00:00, 9048.92 examples/s]
Map: 100%|ββββββββββ| 13000/13013 [00:01<00:00, 9107.40 examples/s]
Map: 100%|ββββββββββ| 13013/13013 [00:01<00:00, 7923.23 examples/s] |
|
Map: 0%| | 0/2519 [00:00<?, ? examples/s]
Map: 79%|ββββββββ | 2000/2519 [00:00<00:00, 9881.73 examples/s]
Map: 100%|ββββββββββ| 2519/2519 [00:00<00:00, 9693.41 examples/s] |
|
Map: 0%| | 0/4047 [00:00<?, ? examples/s]
Map: 25%|βββ | 1000/4047 [00:00<00:00, 9961.79 examples/s]
Map: 49%|βββββ | 2000/4047 [00:00<00:00, 9145.74 examples/s]
Map: 74%|ββββββββ | 3000/4047 [00:00<00:00, 9474.04 examples/s]
Map: 99%|ββββββββββ| 4000/4047 [00:00<00:00, 9541.57 examples/s]
Map: 100%|ββββββββββ| 4047/4047 [00:00<00:00, 9380.54 examples/s] |
|
/content/dissertation/scripts/ner/run_ner_train.py:397: FutureWarning: load_metric is deprecated and will be removed in the next major version of datasets. Use 'evaluate.load' instead, from the new library π€ Evaluate: https://huggingface.co/docs/evaluate |
|
metric = load_metric("seqeval", trust_remote_code=True) |
|
[INFO|trainer.py:811] 2024-09-09 11:54:12,226 >> The following columns in the training set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:2134] 2024-09-09 11:54:12,775 >> ***** Running training ***** |
|
[INFO|trainer.py:2135] 2024-09-09 11:54:12,776 >> Num examples = 13,013 |
|
[INFO|trainer.py:2136] 2024-09-09 11:54:12,776 >> Num Epochs = 10 |
|
[INFO|trainer.py:2137] 2024-09-09 11:54:12,776 >> Instantaneous batch size per device = 32 |
|
[INFO|trainer.py:2140] 2024-09-09 11:54:12,776 >> Total train batch size (w. parallel, distributed & accumulation) = 64 |
|
[INFO|trainer.py:2141] 2024-09-09 11:54:12,776 >> Gradient Accumulation steps = 2 |
|
[INFO|trainer.py:2142] 2024-09-09 11:54:12,776 >> Total optimization steps = 2,030 |
|
[INFO|trainer.py:2143] 2024-09-09 11:54:12,776 >> Number of trainable parameters = 124,055,043 |
|
0%| | 0/2030 [00:00<?, ?it/s]
0%| | 1/2030 [00:01<43:23, 1.28s/it]
0%| | 2/2030 [00:01<27:30, 1.23it/s]
0%| | 3/2030 [00:02<22:20, 1.51it/s]
0%| | 4/2030 [00:02<20:58, 1.61it/s]
0%| | 5/2030 [00:03<18:15, 1.85it/s]
0%| | 6/2030 [00:03<16:47, 2.01it/s]
0%| | 7/2030 [00:04<16:12, 2.08it/s]
0%| | 8/2030 [00:04<16:25, 2.05it/s]
0%| | 9/2030 [00:05<15:51, 2.12it/s]
0%| | 10/2030 [00:05<16:55, 1.99it/s]
1%| | 11/2030 [00:05<15:19, 2.20it/s]
1%| | 12/2030 [00:06<17:18, 1.94it/s]
1%| | 13/2030 [00:07<16:43, 2.01it/s]
1%| | 14/2030 [00:07<18:38, 1.80it/s]
1%| | 15/2030 [00:08<16:34, 2.03it/s]
1%| | 16/2030 [00:08<17:35, 1.91it/s]
1%| | 17/2030 [00:09<16:44, 2.00it/s]
1%| | 18/2030 [00:09<18:13, 1.84it/s]
1%| | 19/2030 [00:10<23:35, 1.42it/s]
1%| | 20/2030 [00:11<22:07, 1.51it/s]
1%| | 21/2030 [00:11<19:46, 1.69it/s]
1%| | 22/2030 [00:12<17:22, 1.93it/s]
1%| | 23/2030 [00:12<19:14, 1.74it/s]
1%| | 24/2030 [00:13<18:36, 1.80it/s]
1%| | 25/2030 [00:13<17:01, 1.96it/s]
1%|β | 26/2030 [00:14<16:28, 2.03it/s]
1%|β | 27/2030 [00:14<16:55, 1.97it/s]
1%|β | 28/2030 [00:15<18:05, 1.84it/s]
1%|β | 29/2030 [00:15<16:38, 2.00it/s]
1%|β | 30/2030 [00:16<16:25, 2.03it/s]
2%|β | 31/2030 [00:16<16:14, 2.05it/s]
2%|β | 32/2030 [00:17<16:03, 2.07it/s]
2%|β | 33/2030 [00:17<17:38, 1.89it/s]
2%|β | 34/2030 [00:18<16:22, 2.03it/s]
2%|β | 35/2030 [00:18<15:07, 2.20it/s]
2%|β | 36/2030 [00:19<14:36, 2.28it/s]
2%|β | 37/2030 [00:19<15:03, 2.21it/s]
2%|β | 38/2030 [00:19<14:25, 2.30it/s]
2%|β | 39/2030 [00:20<15:44, 2.11it/s]
2%|β | 40/2030 [00:20<14:43, 2.25it/s]
2%|β | 41/2030 [00:21<14:17, 2.32it/s]
2%|β | 42/2030 [00:21<14:54, 2.22it/s]
2%|β | 43/2030 [00:22<14:50, 2.23it/s]
2%|β | 44/2030 [00:22<15:11, 2.18it/s]
2%|β | 45/2030 [00:23<15:19, 2.16it/s]
2%|β | 46/2030 [00:23<14:40, 2.25it/s]
2%|β | 47/2030 [00:24<15:29, 2.13it/s]
2%|β | 48/2030 [00:24<14:57, 2.21it/s]
2%|β | 49/2030 [00:24<15:07, 2.18it/s]
2%|β | 50/2030 [00:25<15:57, 2.07it/s]
3%|β | 51/2030 [00:25<15:31, 2.12it/s]
3%|β | 52/2030 [00:26<15:21, 2.15it/s]
3%|β | 53/2030 [00:26<14:55, 2.21it/s]
3%|β | 54/2030 [00:27<13:40, 2.41it/s]
3%|β | 55/2030 [00:27<13:39, 2.41it/s]
3%|β | 56/2030 [00:28<14:39, 2.25it/s]
3%|β | 57/2030 [00:28<14:34, 2.26it/s]
3%|β | 58/2030 [00:28<14:11, 2.32it/s]
3%|β | 59/2030 [00:29<14:11, 2.31it/s]
3%|β | 60/2030 [00:30<16:39, 1.97it/s]
3%|β | 61/2030 [00:30<14:58, 2.19it/s]
3%|β | 62/2030 [00:30<13:48, 2.38it/s]
3%|β | 63/2030 [00:31<13:58, 2.35it/s]
3%|β | 64/2030 [00:31<14:10, 2.31it/s]
3%|β | 65/2030 [00:32<14:04, 2.33it/s]
3%|β | 66/2030 [00:32<13:33, 2.41it/s]
3%|β | 67/2030 [00:32<13:57, 2.34it/s]
3%|β | 68/2030 [00:33<13:23, 2.44it/s]
3%|β | 69/2030 [00:33<12:56, 2.53it/s]
3%|β | 70/2030 [00:34<14:55, 2.19it/s]
3%|β | 71/2030 [00:34<14:42, 2.22it/s]
4%|β | 72/2030 [00:35<14:08, 2.31it/s]
4%|β | 73/2030 [00:35<13:54, 2.34it/s]
4%|β | 74/2030 [00:35<13:32, 2.41it/s]
4%|β | 75/2030 [00:36<13:34, 2.40it/s]
4%|β | 76/2030 [00:36<13:41, 2.38it/s]
4%|β | 77/2030 [00:37<14:07, 2.30it/s]
4%|β | 78/2030 [00:37<14:33, 2.24it/s]
4%|β | 79/2030 [00:38<14:16, 2.28it/s]
4%|β | 80/2030 [00:38<14:14, 2.28it/s]
4%|β | 81/2030 [00:38<13:49, 2.35it/s]
4%|β | 82/2030 [00:39<14:52, 2.18it/s]
4%|β | 83/2030 [00:39<13:50, 2.34it/s]
4%|β | 84/2030 [00:40<15:49, 2.05it/s]
4%|β | 85/2030 [00:40<15:30, 2.09it/s]
4%|β | 86/2030 [00:41<15:10, 2.14it/s]
4%|β | 87/2030 [00:41<15:02, 2.15it/s]
4%|β | 88/2030 [00:42<15:54, 2.04it/s]
4%|β | 89/2030 [00:42<15:01, 2.15it/s]
4%|β | 90/2030 [00:43<14:36, 2.21it/s]
4%|β | 91/2030 [00:43<13:44, 2.35it/s]
5%|β | 92/2030 [00:43<14:17, 2.26it/s]
5%|β | 93/2030 [00:44<17:39, 1.83it/s]
5%|β | 94/2030 [00:45<16:23, 1.97it/s]
5%|β | 95/2030 [00:45<15:11, 2.12it/s]
5%|β | 96/2030 [00:46<14:51, 2.17it/s]
5%|β | 97/2030 [00:46<14:32, 2.21it/s]
5%|β | 98/2030 [00:46<14:14, 2.26it/s]
5%|β | 99/2030 [00:47<14:50, 2.17it/s]
5%|β | 100/2030 [00:47<13:48, 2.33it/s]
5%|β | 101/2030 [00:48<13:31, 2.38it/s]
5%|β | 102/2030 [00:48<13:42, 2.34it/s]
5%|β | 103/2030 [00:48<12:47, 2.51it/s]
5%|β | 104/2030 [00:49<14:29, 2.22it/s]
5%|β | 105/2030 [00:49<14:31, 2.21it/s]
5%|β | 106/2030 [00:50<14:53, 2.15it/s]
5%|β | 107/2030 [00:50<14:26, 2.22it/s]
5%|β | 108/2030 [00:51<13:20, 2.40it/s]
5%|β | 109/2030 [00:51<14:11, 2.25it/s]
5%|β | 110/2030 [00:52<14:00, 2.28it/s]
5%|β | 111/2030 [00:52<13:40, 2.34it/s]
6%|β | 112/2030 [00:52<13:15, 2.41it/s]
6%|β | 113/2030 [00:53<14:36, 2.19it/s]
6%|β | 114/2030 [00:53<15:33, 2.05it/s]
6%|β | 115/2030 [00:54<15:08, 2.11it/s]
6%|β | 116/2030 [00:54<14:34, 2.19it/s]
6%|β | 117/2030 [00:55<14:45, 2.16it/s]
6%|β | 118/2030 [00:55<14:07, 2.26it/s]
6%|β | 119/2030 [00:56<14:05, 2.26it/s]
6%|β | 120/2030 [00:56<13:44, 2.32it/s]
6%|β | 121/2030 [00:57<14:00, 2.27it/s]
6%|β | 122/2030 [00:57<13:23, 2.37it/s]
6%|β | 123/2030 [00:57<12:58, 2.45it/s]
6%|β | 124/2030 [00:58<15:07, 2.10it/s]
6%|β | 125/2030 [00:58<15:02, 2.11it/s]
6%|β | 126/2030 [00:59<15:04, 2.11it/s]
6%|β | 127/2030 [00:59<14:34, 2.18it/s]
6%|β | 128/2030 [01:00<14:47, 2.14it/s]
6%|β | 129/2030 [01:00<13:53, 2.28it/s]
6%|β | 130/2030 [01:01<16:03, 1.97it/s]
6%|β | 131/2030 [01:01<16:28, 1.92it/s]
7%|β | 132/2030 [01:02<15:23, 2.06it/s]
7%|β | 133/2030 [01:03<18:04, 1.75it/s]
7%|β | 134/2030 [01:03<17:08, 1.84it/s]
7%|β | 135/2030 [01:03<16:13, 1.95it/s]
7%|β | 136/2030 [01:04<15:14, 2.07it/s]
7%|β | 137/2030 [01:04<13:58, 2.26it/s]
7%|β | 138/2030 [01:05<13:47, 2.29it/s]
7%|β | 139/2030 [01:05<13:46, 2.29it/s]
7%|β | 140/2030 [01:06<17:13, 1.83it/s]
7%|β | 141/2030 [01:06<15:44, 2.00it/s]
7%|β | 142/2030 [01:07<18:04, 1.74it/s]
7%|β | 143/2030 [01:07<16:32, 1.90it/s]
7%|β | 144/2030 [01:08<17:46, 1.77it/s]
7%|β | 145/2030 [01:08<15:39, 2.01it/s]
7%|β | 146/2030 [01:09<15:15, 2.06it/s]
7%|β | 147/2030 [01:09<14:20, 2.19it/s]
7%|β | 148/2030 [01:10<13:42, 2.29it/s]
7%|β | 149/2030 [01:10<13:13, 2.37it/s]
7%|β | 150/2030 [01:11<14:12, 2.21it/s]
7%|β | 151/2030 [01:11<15:01, 2.08it/s]
7%|β | 152/2030 [01:12<14:34, 2.15it/s]
8%|β | 153/2030 [01:12<13:22, 2.34it/s]
8%|β | 154/2030 [01:12<14:04, 2.22it/s]
8%|β | 155/2030 [01:13<13:31, 2.31it/s]
8%|β | 156/2030 [01:13<14:24, 2.17it/s]
8%|β | 157/2030 [01:14<14:18, 2.18it/s]
8%|β | 158/2030 [01:14<15:19, 2.04it/s]
8%|β | 159/2030 [01:15<14:23, 2.17it/s]
8%|β | 160/2030 [01:15<13:47, 2.26it/s]
8%|β | 161/2030 [01:16<13:50, 2.25it/s]
8%|β | 162/2030 [01:16<14:12, 2.19it/s]
8%|β | 163/2030 [01:17<13:53, 2.24it/s]
8%|β | 164/2030 [01:17<13:45, 2.26it/s]
8%|β | 165/2030 [01:17<13:39, 2.28it/s]
8%|β | 166/2030 [01:18<15:08, 2.05it/s]
8%|β | 167/2030 [01:18<14:35, 2.13it/s]
8%|β | 168/2030 [01:19<14:27, 2.15it/s]
8%|β | 169/2030 [01:19<13:34, 2.29it/s]
8%|β | 170/2030 [01:20<14:37, 2.12it/s]
8%|β | 171/2030 [01:20<13:29, 2.30it/s]
8%|β | 172/2030 [01:21<16:15, 1.90it/s]
9%|β | 173/2030 [01:21<15:03, 2.06it/s]
9%|β | 174/2030 [01:22<13:56, 2.22it/s]
9%|β | 175/2030 [01:22<13:27, 2.30it/s]
9%|β | 176/2030 [01:22<12:39, 2.44it/s]
9%|β | 177/2030 [01:23<14:01, 2.20it/s]
9%|β | 178/2030 [01:23<12:55, 2.39it/s]
9%|β | 179/2030 [01:24<12:19, 2.50it/s]
9%|β | 180/2030 [01:24<12:59, 2.37it/s]
9%|β | 181/2030 [01:24<12:19, 2.50it/s]
9%|β | 182/2030 [01:25<12:00, 2.56it/s]
9%|β | 183/2030 [01:25<12:02, 2.56it/s]
9%|β | 184/2030 [01:26<12:22, 2.49it/s]
9%|β | 185/2030 [01:26<12:37, 2.44it/s]
9%|β | 186/2030 [01:26<12:00, 2.56it/s]
9%|β | 187/2030 [01:27<12:49, 2.39it/s]
9%|β | 188/2030 [01:27<13:38, 2.25it/s]
9%|β | 189/2030 [01:28<13:21, 2.30it/s]
9%|β | 190/2030 [01:29<16:36, 1.85it/s]
9%|β | 191/2030 [01:29<16:06, 1.90it/s]
9%|β | 192/2030 [01:29<14:24, 2.13it/s]
10%|β | 193/2030 [01:30<16:50, 1.82it/s]
10%|β | 194/2030 [01:31<15:12, 2.01it/s]
10%|β | 195/2030 [01:31<15:09, 2.02it/s]
10%|β | 196/2030 [01:31<14:00, 2.18it/s]
10%|β | 197/2030 [01:32<16:28, 1.85it/s]
10%|β | 198/2030 [01:33<18:54, 1.62it/s]
10%|β | 199/2030 [01:33<17:25, 1.75it/s]
10%|β | 200/2030 [01:34<16:29, 1.85it/s]
10%|β | 201/2030 [01:34<15:25, 1.98it/s]
10%|β | 202/2030 [01:35<14:43, 2.07it/s]
10%|β | 203/2030 [01:35<14:58, 2.03it/s][INFO|trainer.py:811] 2024-09-09 11:55:48,641 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 11:55:48,644 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 11:55:48,644 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 11:55:48,644 >> Batch size = 8 |
|
|
|
0%| | 0/315 [00:00<?, ?it/s][A |
|
3%|β | 8/315 [00:00<00:04, 76.12it/s][A |
|
5%|β | 16/315 [00:00<00:04, 74.05it/s][A |
|
8%|β | 24/315 [00:00<00:03, 75.18it/s][A |
|
10%|β | 32/315 [00:00<00:03, 70.92it/s][A |
|
13%|ββ | 40/315 [00:00<00:03, 73.74it/s][A |
|
15%|ββ | 48/315 [00:00<00:03, 74.41it/s][A |
|
18%|ββ | 56/315 [00:00<00:03, 73.32it/s][A |
|
20%|ββ | 64/315 [00:00<00:03, 71.03it/s][A |
|
23%|βββ | 72/315 [00:00<00:03, 73.04it/s][A |
|
25%|βββ | 80/315 [00:01<00:03, 69.62it/s][A |
|
28%|βββ | 88/315 [00:01<00:03, 67.05it/s][A |
|
30%|βββ | 96/315 [00:01<00:03, 70.09it/s][A |
|
33%|ββββ | 104/315 [00:01<00:03, 67.36it/s][A |
|
36%|ββββ | 112/315 [00:01<00:02, 69.60it/s][A |
|
38%|ββββ | 120/315 [00:01<00:02, 69.30it/s][A |
|
40%|ββββ | 127/315 [00:01<00:02, 68.58it/s][A |
|
43%|βββββ | 134/315 [00:01<00:02, 67.97it/s][A |
|
45%|βββββ | 141/315 [00:02<00:02, 68.37it/s][A |
|
47%|βββββ | 149/315 [00:02<00:02, 70.96it/s][A |
|
50%|βββββ | 158/315 [00:02<00:02, 74.16it/s][A |
|
53%|ββββββ | 166/315 [00:02<00:02, 72.11it/s][A |
|
55%|ββββββ | 174/315 [00:02<00:01, 71.61it/s][A |
|
58%|ββββββ | 182/315 [00:02<00:01, 68.73it/s][A |
|
60%|ββββββ | 189/315 [00:02<00:01, 68.38it/s][A |
|
62%|βββββββ | 196/315 [00:02<00:01, 67.76it/s][A |
|
64%|βββββββ | 203/315 [00:02<00:01, 64.44it/s][A |
|
67%|βββββββ | 210/315 [00:03<00:01, 64.84it/s][A |
|
69%|βββββββ | 218/315 [00:03<00:01, 68.36it/s][A |
|
72%|ββββββββ | 226/315 [00:03<00:01, 70.84it/s][A |
|
75%|ββββββββ | 235/315 [00:03<00:01, 73.77it/s][A |
|
77%|ββββββββ | 243/315 [00:03<00:01, 70.62it/s][A |
|
80%|ββββββββ | 251/315 [00:03<00:00, 70.66it/s][A |
|
82%|βββββββββ | 259/315 [00:03<00:00, 69.14it/s][A |
|
85%|βββββββββ | 267/315 [00:03<00:00, 70.28it/s][A |
|
88%|βββββββββ | 276/315 [00:03<00:00, 73.48it/s][A |
|
90%|βββββββββ | 284/315 [00:04<00:00, 73.87it/s][A |
|
93%|ββββββββββ| 292/315 [00:04<00:00, 71.52it/s][A |
|
95%|ββββββββββ| 300/315 [00:04<00:00, 71.25it/s][A |
|
98%|ββββββββββ| 308/315 [00:04<00:00, 71.82it/s][A
|
|
[A
10%|β | 203/2030 [01:41<14:58, 2.03it/s] |
|
100%|ββββββββββ| 315/315 [00:05<00:00, 71.82it/s][A |
|
[A[INFO|trainer.py:3503] 2024-09-09 11:55:54,552 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-203 |
|
[INFO|configuration_utils.py:472] 2024-09-09 11:55:54,553 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-203/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 11:55:55,568 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-203/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 11:55:55,569 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-203/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 11:55:55,569 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-203/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 11:56:00,182 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 11:56:00,183 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
10%|β | 204/2030 [01:47<1:59:40, 3.93s/it]
10%|β | 205/2030 [01:48<1:28:45, 2.92s/it]
10%|β | 206/2030 [01:48<1:06:21, 2.18s/it]
10%|β | 207/2030 [01:49<50:53, 1.67s/it]
10%|β | 208/2030 [01:49<39:22, 1.30s/it]
10%|β | 209/2030 [01:49<30:44, 1.01s/it]
10%|β | 210/2030 [01:50<25:37, 1.18it/s]
10%|β | 211/2030 [01:51<24:14, 1.25it/s]
10%|β | 212/2030 [01:51<21:03, 1.44it/s]
10%|β | 213/2030 [01:51<18:36, 1.63it/s]
11%|β | 214/2030 [01:52<17:59, 1.68it/s]
11%|β | 215/2030 [01:52<16:37, 1.82it/s]
11%|β | 216/2030 [01:53<15:39, 1.93it/s]
11%|β | 217/2030 [01:54<19:55, 1.52it/s]
11%|β | 218/2030 [01:54<17:23, 1.74it/s]
11%|β | 219/2030 [01:55<16:28, 1.83it/s]
11%|β | 220/2030 [01:55<17:39, 1.71it/s]
11%|β | 221/2030 [01:56<15:31, 1.94it/s]
11%|β | 222/2030 [01:56<14:36, 2.06it/s]
11%|β | 223/2030 [01:57<14:18, 2.11it/s]
11%|β | 224/2030 [01:57<16:05, 1.87it/s]
11%|β | 225/2030 [01:58<15:11, 1.98it/s]
11%|β | 226/2030 [01:58<14:18, 2.10it/s]
11%|β | 227/2030 [01:59<14:05, 2.13it/s]
11%|β | 228/2030 [01:59<13:34, 2.21it/s]
11%|ββ | 229/2030 [01:59<12:44, 2.36it/s]
11%|ββ | 230/2030 [02:00<12:42, 2.36it/s]
11%|ββ | 231/2030 [02:00<12:22, 2.42it/s]
11%|ββ | 232/2030 [02:01<12:16, 2.44it/s]
11%|ββ | 233/2030 [02:01<12:45, 2.35it/s]
12%|ββ | 234/2030 [02:02<14:11, 2.11it/s]
12%|ββ | 235/2030 [02:02<13:37, 2.20it/s]
12%|ββ | 236/2030 [02:02<13:13, 2.26it/s]
12%|ββ | 237/2030 [02:03<13:48, 2.16it/s]
12%|ββ | 238/2030 [02:03<13:05, 2.28it/s]
12%|ββ | 239/2030 [02:04<12:34, 2.37it/s]
12%|ββ | 240/2030 [02:04<12:38, 2.36it/s]
12%|ββ | 241/2030 [02:05<12:12, 2.44it/s]
12%|ββ | 242/2030 [02:05<12:03, 2.47it/s]
12%|ββ | 243/2030 [02:05<13:09, 2.26it/s]
12%|ββ | 244/2030 [02:06<13:57, 2.13it/s]
12%|ββ | 245/2030 [02:06<12:28, 2.39it/s]
12%|ββ | 246/2030 [02:07<11:47, 2.52it/s]
12%|ββ | 247/2030 [02:07<12:04, 2.46it/s]
12%|ββ | 248/2030 [02:07<11:32, 2.57it/s]
12%|ββ | 249/2030 [02:08<12:22, 2.40it/s]
12%|ββ | 250/2030 [02:08<12:07, 2.45it/s]
12%|ββ | 251/2030 [02:09<11:40, 2.54it/s]
12%|ββ | 252/2030 [02:09<14:13, 2.08it/s]
12%|ββ | 253/2030 [02:10<15:51, 1.87it/s]
13%|ββ | 254/2030 [02:10<14:48, 2.00it/s]
13%|ββ | 255/2030 [02:11<16:12, 1.83it/s]
13%|ββ | 256/2030 [02:12<15:55, 1.86it/s]
13%|ββ | 257/2030 [02:12<15:12, 1.94it/s]
13%|ββ | 258/2030 [02:13<16:09, 1.83it/s]
13%|ββ | 259/2030 [02:13<14:20, 2.06it/s]
13%|ββ | 260/2030 [02:13<13:31, 2.18it/s]
13%|ββ | 261/2030 [02:14<16:16, 1.81it/s]
13%|ββ | 262/2030 [02:15<14:54, 1.98it/s]
13%|ββ | 263/2030 [02:15<14:32, 2.03it/s]
13%|ββ | 264/2030 [02:16<15:26, 1.91it/s]
13%|ββ | 265/2030 [02:16<14:04, 2.09it/s]
13%|ββ | 266/2030 [02:16<13:00, 2.26it/s]
13%|ββ | 267/2030 [02:17<12:11, 2.41it/s]
13%|ββ | 268/2030 [02:17<12:46, 2.30it/s]
13%|ββ | 269/2030 [02:18<11:57, 2.46it/s]
13%|ββ | 270/2030 [02:18<12:20, 2.38it/s]
13%|ββ | 271/2030 [02:19<12:47, 2.29it/s]
13%|ββ | 272/2030 [02:19<13:52, 2.11it/s]
13%|ββ | 273/2030 [02:20<13:54, 2.11it/s]
13%|ββ | 274/2030 [02:20<12:44, 2.30it/s]
14%|ββ | 275/2030 [02:20<12:38, 2.31it/s]
14%|ββ | 276/2030 [02:21<12:42, 2.30it/s]
14%|ββ | 277/2030 [02:21<12:34, 2.32it/s]
14%|ββ | 278/2030 [02:22<12:30, 2.33it/s]
14%|ββ | 279/2030 [02:22<12:28, 2.34it/s]
14%|ββ | 280/2030 [02:22<11:52, 2.46it/s]
14%|ββ | 281/2030 [02:23<12:37, 2.31it/s]
14%|ββ | 282/2030 [02:23<12:16, 2.37it/s]
14%|ββ | 283/2030 [02:24<12:33, 2.32it/s]
14%|ββ | 284/2030 [02:24<13:13, 2.20it/s]
14%|ββ | 285/2030 [02:25<13:08, 2.21it/s]
14%|ββ | 286/2030 [02:25<13:09, 2.21it/s]
14%|ββ | 287/2030 [02:26<12:27, 2.33it/s]
14%|ββ | 288/2030 [02:26<13:57, 2.08it/s]
14%|ββ | 289/2030 [02:27<13:51, 2.09it/s]
14%|ββ | 290/2030 [02:27<15:16, 1.90it/s]
14%|ββ | 291/2030 [02:28<14:18, 2.02it/s]
14%|ββ | 292/2030 [02:28<15:12, 1.91it/s]
14%|ββ | 293/2030 [02:29<14:05, 2.05it/s]
14%|ββ | 294/2030 [02:29<15:37, 1.85it/s]
15%|ββ | 295/2030 [02:30<13:51, 2.09it/s]
15%|ββ | 296/2030 [02:30<13:08, 2.20it/s]
15%|ββ | 297/2030 [02:31<13:30, 2.14it/s]
15%|ββ | 298/2030 [02:31<13:08, 2.20it/s]
15%|ββ | 299/2030 [02:31<13:26, 2.15it/s]
15%|ββ | 300/2030 [02:32<14:33, 1.98it/s]
15%|ββ | 301/2030 [02:32<14:07, 2.04it/s]
15%|ββ | 302/2030 [02:33<13:49, 2.08it/s]
15%|ββ | 303/2030 [02:33<12:42, 2.26it/s]
15%|ββ | 304/2030 [02:34<11:59, 2.40it/s]
15%|ββ | 305/2030 [02:34<14:03, 2.04it/s]
15%|ββ | 306/2030 [02:35<13:33, 2.12it/s]
15%|ββ | 307/2030 [02:35<13:04, 2.20it/s]
15%|ββ | 308/2030 [02:36<13:12, 2.17it/s]
15%|ββ | 309/2030 [02:36<12:55, 2.22it/s]
15%|ββ | 310/2030 [02:37<13:23, 2.14it/s]
15%|ββ | 311/2030 [02:37<12:53, 2.22it/s]
15%|ββ | 312/2030 [02:37<12:41, 2.25it/s]
15%|ββ | 313/2030 [02:38<13:26, 2.13it/s]
15%|ββ | 314/2030 [02:38<13:53, 2.06it/s]
16%|ββ | 315/2030 [02:39<13:04, 2.19it/s]
16%|ββ | 316/2030 [02:39<13:44, 2.08it/s]
16%|ββ | 317/2030 [02:40<14:44, 1.94it/s]
16%|ββ | 318/2030 [02:40<14:00, 2.04it/s]
16%|ββ | 319/2030 [02:41<13:12, 2.16it/s]
16%|ββ | 320/2030 [02:41<13:30, 2.11it/s]
16%|ββ | 321/2030 [02:42<13:18, 2.14it/s]
16%|ββ | 322/2030 [02:42<14:01, 2.03it/s]
16%|ββ | 323/2030 [02:43<13:30, 2.11it/s]
16%|ββ | 324/2030 [02:43<13:54, 2.04it/s]
16%|ββ | 325/2030 [02:44<12:44, 2.23it/s]
16%|ββ | 326/2030 [02:44<12:54, 2.20it/s]
16%|ββ | 327/2030 [02:45<14:11, 2.00it/s]
16%|ββ | 328/2030 [02:45<13:37, 2.08it/s]
16%|ββ | 329/2030 [02:45<12:07, 2.34it/s]
16%|ββ | 330/2030 [02:46<11:46, 2.41it/s]
16%|ββ | 331/2030 [02:46<11:52, 2.38it/s]
16%|ββ | 332/2030 [02:47<12:06, 2.34it/s]
16%|ββ | 333/2030 [02:47<12:21, 2.29it/s]
16%|ββ | 334/2030 [02:48<12:17, 2.30it/s]
17%|ββ | 335/2030 [02:48<15:27, 1.83it/s]
17%|ββ | 336/2030 [02:49<14:13, 1.98it/s]
17%|ββ | 337/2030 [02:49<14:16, 1.98it/s]
17%|ββ | 338/2030 [02:50<13:03, 2.16it/s]
17%|ββ | 339/2030 [02:50<12:44, 2.21it/s]
17%|ββ | 340/2030 [02:51<17:41, 1.59it/s]
17%|ββ | 341/2030 [02:52<18:04, 1.56it/s]
17%|ββ | 342/2030 [02:52<16:49, 1.67it/s]
17%|ββ | 343/2030 [02:53<15:23, 1.83it/s]
17%|ββ | 344/2030 [02:53<13:53, 2.02it/s]
17%|ββ | 345/2030 [02:54<15:18, 1.83it/s]
17%|ββ | 346/2030 [02:54<14:12, 1.98it/s]
17%|ββ | 347/2030 [02:55<13:19, 2.11it/s]
17%|ββ | 348/2030 [02:55<13:30, 2.08it/s]
17%|ββ | 349/2030 [02:56<14:05, 1.99it/s]
17%|ββ | 350/2030 [02:56<13:39, 2.05it/s]
17%|ββ | 351/2030 [02:57<13:26, 2.08it/s]
17%|ββ | 352/2030 [02:57<13:56, 2.01it/s]
17%|ββ | 353/2030 [02:58<16:18, 1.71it/s]
17%|ββ | 354/2030 [02:58<15:13, 1.84it/s]
17%|ββ | 355/2030 [02:59<14:56, 1.87it/s]
18%|ββ | 356/2030 [02:59<14:51, 1.88it/s]
18%|ββ | 357/2030 [03:00<14:00, 1.99it/s]
18%|ββ | 358/2030 [03:00<14:26, 1.93it/s]
18%|ββ | 359/2030 [03:01<13:47, 2.02it/s]
18%|ββ | 360/2030 [03:01<12:53, 2.16it/s]
18%|ββ | 361/2030 [03:02<13:00, 2.14it/s]
18%|ββ | 362/2030 [03:02<12:09, 2.29it/s]
18%|ββ | 363/2030 [03:02<11:28, 2.42it/s]
18%|ββ | 364/2030 [03:03<11:51, 2.34it/s]
18%|ββ | 365/2030 [03:03<12:11, 2.28it/s]
18%|ββ | 366/2030 [03:04<12:25, 2.23it/s]
18%|ββ | 367/2030 [03:04<11:17, 2.45it/s]
18%|ββ | 368/2030 [03:05<17:17, 1.60it/s]
18%|ββ | 369/2030 [03:06<16:18, 1.70it/s]
18%|ββ | 370/2030 [03:06<16:17, 1.70it/s]
18%|ββ | 371/2030 [03:07<15:54, 1.74it/s]
18%|ββ | 372/2030 [03:07<15:53, 1.74it/s]
18%|ββ | 373/2030 [03:08<13:59, 1.97it/s]
18%|ββ | 374/2030 [03:08<13:06, 2.11it/s]
18%|ββ | 375/2030 [03:09<12:35, 2.19it/s]
19%|ββ | 376/2030 [03:09<13:07, 2.10it/s]
19%|ββ | 377/2030 [03:09<12:02, 2.29it/s]
19%|ββ | 378/2030 [03:10<12:18, 2.24it/s]
19%|ββ | 379/2030 [03:10<11:32, 2.39it/s]
19%|ββ | 380/2030 [03:11<12:03, 2.28it/s]
19%|ββ | 381/2030 [03:11<12:14, 2.24it/s]
19%|ββ | 382/2030 [03:12<11:44, 2.34it/s]
19%|ββ | 383/2030 [03:12<11:36, 2.36it/s]
19%|ββ | 384/2030 [03:12<10:45, 2.55it/s]
19%|ββ | 385/2030 [03:13<10:56, 2.51it/s]
19%|ββ | 386/2030 [03:13<11:08, 2.46it/s]
19%|ββ | 387/2030 [03:14<11:13, 2.44it/s]
19%|ββ | 388/2030 [03:14<11:16, 2.43it/s]
19%|ββ | 389/2030 [03:14<11:19, 2.42it/s]
19%|ββ | 390/2030 [03:15<11:05, 2.46it/s]
19%|ββ | 391/2030 [03:15<12:47, 2.13it/s]
19%|ββ | 392/2030 [03:16<15:14, 1.79it/s]
19%|ββ | 393/2030 [03:17<15:13, 1.79it/s]
19%|ββ | 394/2030 [03:17<15:02, 1.81it/s]
19%|ββ | 395/2030 [03:18<15:13, 1.79it/s]
20%|ββ | 396/2030 [03:19<16:49, 1.62it/s]
20%|ββ | 397/2030 [03:19<15:15, 1.78it/s]
20%|ββ | 398/2030 [03:20<14:13, 1.91it/s]
20%|ββ | 399/2030 [03:20<15:23, 1.77it/s]
20%|ββ | 400/2030 [03:21<14:32, 1.87it/s]
20%|ββ | 401/2030 [03:21<13:48, 1.97it/s]
20%|ββ | 402/2030 [03:21<12:29, 2.17it/s]
20%|ββ | 403/2030 [03:22<12:24, 2.18it/s]
20%|ββ | 404/2030 [03:22<12:28, 2.17it/s]
20%|ββ | 405/2030 [03:23<11:54, 2.27it/s]
20%|ββ | 406/2030 [03:23<12:50, 2.11it/s]
20%|ββ | 407/2030 [03:24<12:00, 2.25it/s][INFO|trainer.py:811] 2024-09-09 11:57:36,964 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 11:57:36,967 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 11:57:36,967 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 11:57:36,967 >> Batch size = 8 |
|
{'eval_loss': 0.15010379254817963, 'eval_precision': 0.5959855892949047, 'eval_recall': 0.6338259441707718, 'eval_f1': 0.6143236074270556, 'eval_accuracy': 0.9467740383072925, 'eval_runtime': 5.907, 'eval_samples_per_second': 426.445, 'eval_steps_per_second': 53.327, 'epoch': 1.0} |
|
|
|
0%| | 0/315 [00:00<?, ?it/s][A |
|
3%|β | 8/315 [00:00<00:03, 77.84it/s][A |
|
5%|β | 16/315 [00:00<00:03, 75.71it/s][A |
|
8%|β | 24/315 [00:00<00:03, 77.33it/s][A |
|
10%|β | 32/315 [00:00<00:03, 72.67it/s][A |
|
13%|ββ | 41/315 [00:00<00:03, 76.17it/s][A |
|
16%|ββ | 49/315 [00:00<00:03, 75.16it/s][A |
|
18%|ββ | 57/315 [00:00<00:03, 75.30it/s][A |
|
21%|ββ | 65/315 [00:00<00:03, 72.75it/s][A |
|
23%|βββ | 73/315 [00:00<00:03, 74.74it/s][A |
|
26%|βββ | 81/315 [00:01<00:03, 70.68it/s][A |
|
28%|βββ | 89/315 [00:01<00:03, 67.87it/s][A |
|
31%|βββ | 97/315 [00:01<00:03, 67.64it/s][A |
|
33%|ββββ | 105/315 [00:01<00:03, 68.83it/s][A |
|
36%|ββββ | 113/315 [00:01<00:02, 70.42it/s][A |
|
38%|ββββ | 121/315 [00:01<00:02, 68.78it/s][A |
|
41%|ββββ | 129/315 [00:01<00:02, 69.95it/s][A |
|
43%|βββββ | 137/315 [00:01<00:02, 69.66it/s][A |
|
46%|βββββ | 144/315 [00:02<00:02, 69.18it/s][A |
|
49%|βββββ | 153/315 [00:02<00:02, 73.28it/s][A |
|
51%|βββββ | 161/315 [00:02<00:02, 72.02it/s][A |
|
54%|ββββββ | 169/315 [00:02<00:02, 71.40it/s][A |
|
56%|ββββββ | 177/315 [00:02<00:01, 71.35it/s][A |
|
59%|ββββββ | 185/315 [00:02<00:01, 69.35it/s][A |
|
61%|ββββββ | 192/315 [00:02<00:01, 69.15it/s][A |
|
63%|βββββββ | 199/315 [00:02<00:01, 66.50it/s][A |
|
65%|βββββββ | 206/315 [00:02<00:01, 65.14it/s][A |
|
68%|βββββββ | 214/315 [00:03<00:01, 68.76it/s][A |
|
70%|βββββββ | 222/315 [00:03<00:01, 70.60it/s][A |
|
73%|ββββββββ | 231/315 [00:03<00:01, 73.67it/s][A |
|
76%|ββββββββ | 239/315 [00:03<00:01, 74.84it/s][A |
|
78%|ββββββββ | 247/315 [00:03<00:00, 70.52it/s][A |
|
81%|ββββββββ | 255/315 [00:03<00:00, 68.93it/s][A |
|
83%|βββββββββ | 263/315 [00:03<00:00, 70.74it/s][A |
|
86%|βββββββββ | 271/315 [00:03<00:00, 72.69it/s][A |
|
89%|βββββββββ | 280/315 [00:03<00:00, 75.36it/s][A |
|
91%|ββββββββββ| 288/315 [00:04<00:00, 72.64it/s][A |
|
94%|ββββββββββ| 296/315 [00:04<00:00, 70.98it/s][A |
|
97%|ββββββββββ| 304/315 [00:04<00:00, 72.03it/s][A |
|
99%|ββββββββββ| 312/315 [00:04<00:00, 71.91it/s][A
|
|
[A
20%|ββ | 407/2030 [03:30<12:00, 2.25it/s] |
|
100%|ββββββββββ| 315/315 [00:05<00:00, 71.91it/s][A |
|
[A[INFO|trainer.py:3503] 2024-09-09 11:57:42,861 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-407 |
|
[INFO|configuration_utils.py:472] 2024-09-09 11:57:42,863 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-407/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 11:57:43,887 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-407/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 11:57:43,888 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-407/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 11:57:43,888 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-407/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 11:57:48,014 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 11:57:48,015 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
20%|ββ | 408/2030 [03:35<1:42:07, 3.78s/it]
20%|ββ | 409/2030 [03:36<1:14:36, 2.76s/it]
20%|ββ | 410/2030 [03:36<55:53, 2.07s/it]
20%|ββ | 411/2030 [03:37<43:27, 1.61s/it]
20%|ββ | 412/2030 [03:37<33:47, 1.25s/it]
20%|ββ | 413/2030 [03:37<27:05, 1.01s/it]
20%|ββ | 414/2030 [03:38<21:49, 1.23it/s]
20%|ββ | 415/2030 [03:38<18:01, 1.49it/s]
20%|ββ | 416/2030 [03:39<17:07, 1.57it/s]
21%|ββ | 417/2030 [03:39<14:44, 1.82it/s]
21%|ββ | 418/2030 [03:39<13:20, 2.01it/s]
21%|ββ | 419/2030 [03:40<12:25, 2.16it/s]
21%|ββ | 420/2030 [03:40<11:35, 2.31it/s]
21%|ββ | 421/2030 [03:41<11:46, 2.28it/s]
21%|ββ | 422/2030 [03:41<11:29, 2.33it/s]
21%|ββ | 423/2030 [03:41<10:51, 2.47it/s]
21%|ββ | 424/2030 [03:42<11:17, 2.37it/s]
21%|ββ | 425/2030 [03:42<10:51, 2.46it/s]
21%|ββ | 426/2030 [03:43<10:09, 2.63it/s]
21%|ββ | 427/2030 [03:43<11:34, 2.31it/s]
21%|ββ | 428/2030 [03:43<11:15, 2.37it/s]
21%|ββ | 429/2030 [03:44<11:04, 2.41it/s]
21%|ββ | 430/2030 [03:44<11:52, 2.24it/s]
21%|ββ | 431/2030 [03:45<12:22, 2.15it/s]
21%|βββ | 432/2030 [03:45<12:04, 2.21it/s]
21%|βββ | 433/2030 [03:46<12:06, 2.20it/s]
21%|βββ | 434/2030 [03:46<11:49, 2.25it/s]
21%|βββ | 435/2030 [03:47<11:40, 2.28it/s]
21%|βββ | 436/2030 [03:47<11:38, 2.28it/s]
22%|βββ | 437/2030 [03:48<11:43, 2.26it/s]
22%|βββ | 438/2030 [03:48<11:49, 2.24it/s]
22%|βββ | 439/2030 [03:48<11:21, 2.33it/s]
22%|βββ | 440/2030 [03:49<11:26, 2.32it/s]
22%|βββ | 441/2030 [03:49<11:26, 2.32it/s]
22%|βββ | 442/2030 [03:50<11:27, 2.31it/s]
22%|βββ | 443/2030 [03:50<10:59, 2.41it/s]
22%|βββ | 444/2030 [03:51<11:59, 2.20it/s]
22%|βββ | 445/2030 [03:51<11:41, 2.26it/s]
22%|βββ | 446/2030 [03:52<12:32, 2.10it/s]
22%|βββ | 447/2030 [03:52<13:39, 1.93it/s]
22%|βββ | 448/2030 [03:53<12:16, 2.15it/s]
22%|βββ | 449/2030 [03:53<12:03, 2.19it/s]
22%|βββ | 450/2030 [03:53<12:04, 2.18it/s]
22%|βββ | 451/2030 [03:54<12:47, 2.06it/s]
22%|βββ | 452/2030 [03:55<14:24, 1.83it/s]
22%|βββ | 453/2030 [03:55<15:25, 1.70it/s]
22%|βββ | 454/2030 [03:56<14:59, 1.75it/s]
22%|βββ | 455/2030 [03:56<13:25, 1.96it/s]
22%|βββ | 456/2030 [03:57<13:25, 1.95it/s]
23%|βββ | 457/2030 [03:57<13:00, 2.02it/s]
23%|βββ | 458/2030 [03:58<13:08, 1.99it/s]
23%|βββ | 459/2030 [03:58<13:54, 1.88it/s]
23%|βββ | 460/2030 [03:59<13:24, 1.95it/s]
23%|βββ | 461/2030 [03:59<13:11, 1.98it/s]
23%|βββ | 462/2030 [04:00<12:12, 2.14it/s]
23%|βββ | 463/2030 [04:00<13:31, 1.93it/s]
23%|βββ | 464/2030 [04:01<12:23, 2.11it/s]
23%|βββ | 465/2030 [04:01<11:55, 2.19it/s]
23%|βββ | 466/2030 [04:02<11:24, 2.29it/s]
23%|βββ | 467/2030 [04:02<11:04, 2.35it/s]
23%|βββ | 468/2030 [04:02<11:07, 2.34it/s]
23%|βββ | 469/2030 [04:03<15:26, 1.68it/s]
23%|βββ | 470/2030 [04:04<14:11, 1.83it/s]
23%|βββ | 471/2030 [04:04<12:33, 2.07it/s]
23%|βββ | 472/2030 [04:05<13:26, 1.93it/s]
23%|βββ | 473/2030 [04:05<12:45, 2.03it/s]
23%|βββ | 474/2030 [04:05<11:48, 2.20it/s]
23%|βββ | 475/2030 [04:06<13:34, 1.91it/s]
23%|βββ | 476/2030 [04:07<12:11, 2.12it/s]
23%|βββ | 477/2030 [04:07<12:14, 2.11it/s]
24%|βββ | 478/2030 [04:08<12:59, 1.99it/s]
24%|βββ | 479/2030 [04:08<12:50, 2.01it/s]
24%|βββ | 480/2030 [04:08<12:15, 2.11it/s]
24%|βββ | 481/2030 [04:09<11:12, 2.30it/s]
24%|βββ | 482/2030 [04:09<10:51, 2.38it/s]
24%|βββ | 483/2030 [04:10<10:58, 2.35it/s]
24%|βββ | 484/2030 [04:10<10:34, 2.43it/s]
24%|βββ | 485/2030 [04:10<10:57, 2.35it/s]
24%|βββ | 486/2030 [04:11<11:17, 2.28it/s]
24%|βββ | 487/2030 [04:11<10:37, 2.42it/s]
24%|βββ | 488/2030 [04:12<10:35, 2.43it/s]
24%|βββ | 489/2030 [04:12<12:24, 2.07it/s]
24%|βββ | 490/2030 [04:13<13:26, 1.91it/s]
24%|βββ | 491/2030 [04:13<12:28, 2.06it/s]
24%|βββ | 492/2030 [04:14<12:05, 2.12it/s]
24%|βββ | 493/2030 [04:14<11:17, 2.27it/s]
24%|βββ | 494/2030 [04:15<11:15, 2.27it/s]
24%|βββ | 495/2030 [04:15<10:57, 2.33it/s]
24%|βββ | 496/2030 [04:15<11:16, 2.27it/s]
24%|βββ | 497/2030 [04:16<11:11, 2.28it/s]
25%|βββ | 498/2030 [04:17<12:23, 2.06it/s]
25%|βββ | 499/2030 [04:17<10:59, 2.32it/s]
25%|βββ | 500/2030 [04:18<13:30, 1.89it/s]
25%|βββ | 500/2030 [04:18<13:30, 1.89it/s]
25%|βββ | 501/2030 [04:18<12:28, 2.04it/s]
25%|βββ | 502/2030 [04:18<12:10, 2.09it/s]
25%|βββ | 503/2030 [04:19<11:13, 2.27it/s]
25%|βββ | 504/2030 [04:19<10:48, 2.35it/s]
25%|βββ | 505/2030 [04:20<10:15, 2.48it/s]
25%|βββ | 506/2030 [04:20<10:00, 2.54it/s]
25%|βββ | 507/2030 [04:20<11:06, 2.28it/s]
25%|βββ | 508/2030 [04:21<11:14, 2.26it/s]
25%|βββ | 509/2030 [04:21<11:39, 2.18it/s]
25%|βββ | 510/2030 [04:22<11:35, 2.18it/s]
25%|βββ | 511/2030 [04:22<11:52, 2.13it/s]
25%|βββ | 512/2030 [04:23<10:57, 2.31it/s]
25%|βββ | 513/2030 [04:23<11:41, 2.16it/s]
25%|βββ | 514/2030 [04:24<10:46, 2.34it/s]
25%|βββ | 515/2030 [04:24<10:03, 2.51it/s]
25%|βββ | 516/2030 [04:24<10:01, 2.52it/s]
25%|βββ | 517/2030 [04:25<10:02, 2.51it/s]
26%|βββ | 518/2030 [04:25<09:28, 2.66it/s]
26%|βββ | 519/2030 [04:25<09:36, 2.62it/s]
26%|βββ | 520/2030 [04:26<10:16, 2.45it/s]
26%|βββ | 521/2030 [04:26<10:18, 2.44it/s]
26%|βββ | 522/2030 [04:27<11:24, 2.20it/s]
26%|βββ | 523/2030 [04:27<12:07, 2.07it/s]
26%|βββ | 524/2030 [04:28<11:26, 2.19it/s]
26%|βββ | 525/2030 [04:28<10:51, 2.31it/s]
26%|βββ | 526/2030 [04:29<12:02, 2.08it/s]
26%|βββ | 527/2030 [04:29<11:56, 2.10it/s]
26%|βββ | 528/2030 [04:30<11:10, 2.24it/s]
26%|βββ | 529/2030 [04:30<11:17, 2.22it/s]
26%|βββ | 530/2030 [04:31<11:18, 2.21it/s]
26%|βββ | 531/2030 [04:31<11:00, 2.27it/s]
26%|βββ | 532/2030 [04:31<10:29, 2.38it/s]
26%|βββ | 533/2030 [04:32<10:29, 2.38it/s]
26%|βββ | 534/2030 [04:32<09:53, 2.52it/s]
26%|βββ | 535/2030 [04:32<10:05, 2.47it/s]
26%|βββ | 536/2030 [04:33<09:42, 2.56it/s]
26%|βββ | 537/2030 [04:33<10:24, 2.39it/s]
27%|βββ | 538/2030 [04:34<10:46, 2.31it/s]
27%|βββ | 539/2030 [04:34<10:34, 2.35it/s]
27%|βββ | 540/2030 [04:35<10:10, 2.44it/s]
27%|βββ | 541/2030 [04:35<10:55, 2.27it/s]
27%|βββ | 542/2030 [04:35<10:28, 2.37it/s]
27%|βββ | 543/2030 [04:36<09:55, 2.50it/s]
27%|βββ | 544/2030 [04:37<12:06, 2.05it/s]
27%|βββ | 545/2030 [04:37<11:51, 2.09it/s]
27%|βββ | 546/2030 [04:37<11:59, 2.06it/s]
27%|βββ | 547/2030 [04:38<11:23, 2.17it/s]
27%|βββ | 548/2030 [04:38<11:56, 2.07it/s]
27%|βββ | 549/2030 [04:39<11:42, 2.11it/s]
27%|βββ | 550/2030 [04:39<11:10, 2.21it/s]
27%|βββ | 551/2030 [04:40<12:14, 2.01it/s]
27%|βββ | 552/2030 [04:40<11:45, 2.09it/s]
27%|βββ | 553/2030 [04:41<10:46, 2.29it/s]
27%|βββ | 554/2030 [04:41<10:22, 2.37it/s]
27%|βββ | 555/2030 [04:42<13:25, 1.83it/s]
27%|βββ | 556/2030 [04:42<12:29, 1.97it/s]
27%|βββ | 557/2030 [04:43<11:54, 2.06it/s]
27%|βββ | 558/2030 [04:43<11:29, 2.14it/s]
28%|βββ | 559/2030 [04:44<12:41, 1.93it/s]
28%|βββ | 560/2030 [04:44<11:43, 2.09it/s]
28%|βββ | 561/2030 [04:45<12:54, 1.90it/s]
28%|βββ | 562/2030 [04:45<13:00, 1.88it/s]
28%|βββ | 563/2030 [04:46<13:09, 1.86it/s]
28%|βββ | 564/2030 [04:46<13:16, 1.84it/s]
28%|βββ | 565/2030 [04:47<12:09, 2.01it/s]
28%|βββ | 566/2030 [04:47<11:21, 2.15it/s]
28%|βββ | 567/2030 [04:48<11:22, 2.14it/s]
28%|βββ | 568/2030 [04:48<11:05, 2.20it/s]
28%|βββ | 569/2030 [04:49<11:16, 2.16it/s]
28%|βββ | 570/2030 [04:49<11:09, 2.18it/s]
28%|βββ | 571/2030 [04:49<10:46, 2.26it/s]
28%|βββ | 572/2030 [04:50<10:59, 2.21it/s]
28%|βββ | 573/2030 [04:50<10:29, 2.31it/s]
28%|βββ | 574/2030 [04:51<10:08, 2.39it/s]
28%|βββ | 575/2030 [04:51<10:14, 2.37it/s]
28%|βββ | 576/2030 [04:52<09:59, 2.42it/s]
28%|βββ | 577/2030 [04:52<12:18, 1.97it/s]
28%|βββ | 578/2030 [04:53<12:25, 1.95it/s]
29%|βββ | 579/2030 [04:53<11:44, 2.06it/s]
29%|βββ | 580/2030 [04:54<12:14, 1.97it/s]
29%|βββ | 581/2030 [04:54<11:54, 2.03it/s]
29%|βββ | 582/2030 [04:55<12:50, 1.88it/s]
29%|βββ | 583/2030 [04:55<12:13, 1.97it/s]
29%|βββ | 584/2030 [04:56<11:23, 2.11it/s]
29%|βββ | 585/2030 [04:56<11:37, 2.07it/s]
29%|βββ | 586/2030 [04:57<11:00, 2.19it/s]
29%|βββ | 587/2030 [04:57<10:51, 2.21it/s]
29%|βββ | 588/2030 [04:58<11:13, 2.14it/s]
29%|βββ | 589/2030 [04:58<11:11, 2.15it/s]
29%|βββ | 590/2030 [04:58<10:27, 2.30it/s]
29%|βββ | 591/2030 [04:59<10:22, 2.31it/s]
29%|βββ | 592/2030 [05:00<13:37, 1.76it/s]
29%|βββ | 593/2030 [05:00<12:36, 1.90it/s]
29%|βββ | 594/2030 [05:01<14:48, 1.62it/s]
29%|βββ | 595/2030 [05:01<13:04, 1.83it/s]
29%|βββ | 596/2030 [05:02<12:20, 1.94it/s]
29%|βββ | 597/2030 [05:03<14:06, 1.69it/s]
29%|βββ | 598/2030 [05:03<13:25, 1.78it/s]
30%|βββ | 599/2030 [05:04<13:41, 1.74it/s]
30%|βββ | 600/2030 [05:04<12:55, 1.84it/s]
30%|βββ | 601/2030 [05:05<12:45, 1.87it/s]
30%|βββ | 602/2030 [05:05<11:08, 2.14it/s]
30%|βββ | 603/2030 [05:05<11:30, 2.07it/s]
30%|βββ | 604/2030 [05:06<11:35, 2.05it/s]
30%|βββ | 605/2030 [05:06<10:59, 2.16it/s]
30%|βββ | 606/2030 [05:07<10:20, 2.29it/s]
30%|βββ | 607/2030 [05:07<09:23, 2.53it/s]
30%|βββ | 608/2030 [05:08<10:06, 2.35it/s]
30%|βββ | 609/2030 [05:08<10:17, 2.30it/s]
30%|βββ | 610/2030 [05:08<10:16, 2.30it/s][INFO|trainer.py:811] 2024-09-09 11:59:21,842 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 11:59:21,844 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 11:59:21,844 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 11:59:21,844 >> Batch size = 8 |
|
{'eval_loss': 0.17612887918949127, 'eval_precision': 0.6529351184346035, 'eval_recall': 0.6940339354132458, 'eval_f1': 0.6728575218890952, 'eval_accuracy': 0.949244441592608, 'eval_runtime': 5.8933, 'eval_samples_per_second': 427.436, 'eval_steps_per_second': 53.451, 'epoch': 2.0} |
|
{'loss': 0.1312, 'grad_norm': 0.6181371212005615, 'learning_rate': 3.768472906403941e-05, 'epoch': 2.46} |
|
|
|
0%| | 0/315 [00:00<?, ?it/s][A |
|
3%|β | 8/315 [00:00<00:04, 75.43it/s][A |
|
5%|β | 16/315 [00:00<00:04, 74.71it/s][A |
|
8%|β | 24/315 [00:00<00:03, 77.03it/s][A |
|
10%|β | 32/315 [00:00<00:03, 72.48it/s][A |
|
13%|ββ | 41/315 [00:00<00:03, 76.53it/s][A |
|
16%|ββ | 49/315 [00:00<00:03, 75.55it/s][A |
|
18%|ββ | 57/315 [00:00<00:03, 75.61it/s][A |
|
21%|ββ | 65/315 [00:00<00:03, 72.63it/s][A |
|
23%|βββ | 73/315 [00:00<00:03, 74.66it/s][A |
|
26%|βββ | 81/315 [00:01<00:03, 70.82it/s][A |
|
28%|βββ | 89/315 [00:01<00:03, 67.78it/s][A |
|
31%|βββ | 97/315 [00:01<00:03, 67.59it/s][A |
|
33%|ββββ | 105/315 [00:01<00:03, 68.67it/s][A |
|
36%|ββββ | 113/315 [00:01<00:02, 70.25it/s][A |
|
38%|ββββ | 121/315 [00:01<00:02, 68.82it/s][A |
|
41%|ββββ | 129/315 [00:01<00:02, 69.76it/s][A |
|
43%|βββββ | 137/315 [00:01<00:02, 69.32it/s][A |
|
46%|βββββ | 144/315 [00:02<00:02, 69.42it/s][A |
|
49%|βββββ | 153/315 [00:02<00:02, 73.74it/s][A |
|
51%|βββββ | 161/315 [00:02<00:02, 72.59it/s][A |
|
54%|ββββββ | 169/315 [00:02<00:02, 72.05it/s][A |
|
56%|ββββββ | 177/315 [00:02<00:01, 71.73it/s][A |
|
59%|ββββββ | 185/315 [00:02<00:01, 69.31it/s][A |
|
61%|ββββββ | 192/315 [00:02<00:01, 68.97it/s][A |
|
63%|βββββββ | 199/315 [00:02<00:01, 66.09it/s][A |
|
65%|βββββββ | 206/315 [00:02<00:01, 64.71it/s][A |
|
68%|βββββββ | 214/315 [00:03<00:01, 68.59it/s][A |
|
70%|βββββββ | 222/315 [00:03<00:01, 70.27it/s][A |
|
73%|ββββββββ | 231/315 [00:03<00:01, 73.41it/s][A |
|
76%|ββββββββ | 239/315 [00:03<00:01, 74.85it/s][A |
|
78%|ββββββββ | 247/315 [00:03<00:00, 70.13it/s][A |
|
81%|ββββββββ | 255/315 [00:03<00:00, 68.73it/s][A |
|
83%|βββββββββ | 263/315 [00:03<00:00, 70.54it/s][A |
|
86%|βββββββββ | 271/315 [00:03<00:00, 72.43it/s][A |
|
89%|βββββββββ | 280/315 [00:03<00:00, 75.55it/s][A |
|
91%|ββββββββββ| 288/315 [00:04<00:00, 72.63it/s][A |
|
94%|ββββββββββ| 296/315 [00:04<00:00, 71.32it/s][A |
|
97%|ββββββββββ| 304/315 [00:04<00:00, 72.46it/s][A |
|
99%|ββββββββββ| 312/315 [00:04<00:00, 72.19it/s][A
|
|
[A
30%|βββ | 610/2030 [05:14<10:16, 2.30it/s] |
|
100%|ββββββββββ| 315/315 [00:05<00:00, 72.19it/s][A |
|
[A[INFO|trainer.py:3503] 2024-09-09 11:59:27,690 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-610 |
|
[INFO|configuration_utils.py:472] 2024-09-09 11:59:27,692 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-610/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 11:59:28,717 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-610/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 11:59:28,718 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-610/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 11:59:28,718 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-610/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 11:59:31,818 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 11:59:31,819 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
30%|βββ | 611/2030 [05:19<1:20:23, 3.40s/it]
30%|βββ | 612/2030 [05:19<59:41, 2.53s/it]
30%|βββ | 613/2030 [05:20<47:12, 2.00s/it]
30%|βββ | 614/2030 [05:20<35:37, 1.51s/it]
30%|βββ | 615/2030 [05:21<27:24, 1.16s/it]
30%|βββ | 616/2030 [05:21<23:10, 1.02it/s]
30%|βββ | 617/2030 [05:22<19:02, 1.24it/s]
30%|βββ | 618/2030 [05:22<17:57, 1.31it/s]
30%|βββ | 619/2030 [05:23<15:09, 1.55it/s]
31%|βββ | 620/2030 [05:23<13:12, 1.78it/s]
31%|βββ | 621/2030 [05:23<11:55, 1.97it/s]
31%|βββ | 622/2030 [05:24<11:43, 2.00it/s]
31%|βββ | 623/2030 [05:24<10:55, 2.15it/s]
31%|βββ | 624/2030 [05:25<11:36, 2.02it/s]
31%|βββ | 625/2030 [05:26<13:00, 1.80it/s]
31%|βββ | 626/2030 [05:26<12:31, 1.87it/s]
31%|βββ | 627/2030 [05:26<11:20, 2.06it/s]
31%|βββ | 628/2030 [05:27<10:13, 2.28it/s]
31%|βββ | 629/2030 [05:27<10:31, 2.22it/s]
31%|βββ | 630/2030 [05:28<10:39, 2.19it/s]
31%|βββ | 631/2030 [05:29<12:59, 1.79it/s]
31%|βββ | 632/2030 [05:29<12:03, 1.93it/s]
31%|βββ | 633/2030 [05:29<11:21, 2.05it/s]
31%|βββ | 634/2030 [05:30<11:31, 2.02it/s]
31%|ββββ | 635/2030 [05:30<11:03, 2.10it/s]
31%|ββββ | 636/2030 [05:31<10:53, 2.13it/s]
31%|ββββ | 637/2030 [05:31<10:19, 2.25it/s]
31%|ββββ | 638/2030 [05:32<09:58, 2.33it/s]
31%|ββββ | 639/2030 [05:32<10:21, 2.24it/s]
32%|ββββ | 640/2030 [05:32<09:53, 2.34it/s]
32%|ββββ | 641/2030 [05:33<09:42, 2.38it/s]
32%|ββββ | 642/2030 [05:33<10:11, 2.27it/s]
32%|ββββ | 643/2030 [05:34<10:48, 2.14it/s]
32%|ββββ | 644/2030 [05:34<10:16, 2.25it/s]
32%|ββββ | 645/2030 [05:35<09:57, 2.32it/s]
32%|ββββ | 646/2030 [05:35<09:37, 2.40it/s]
32%|ββββ | 647/2030 [05:35<10:13, 2.26it/s]
32%|ββββ | 648/2030 [05:36<09:30, 2.42it/s]
32%|ββββ | 649/2030 [05:36<09:54, 2.32it/s]
32%|ββββ | 650/2030 [05:37<10:46, 2.14it/s]
32%|ββββ | 651/2030 [05:37<09:52, 2.33it/s]
32%|ββββ | 652/2030 [05:38<10:02, 2.29it/s]
32%|ββββ | 653/2030 [05:38<09:50, 2.33it/s]
32%|ββββ | 654/2030 [05:39<10:09, 2.26it/s]
32%|ββββ | 655/2030 [05:39<11:45, 1.95it/s]
32%|ββββ | 656/2030 [05:40<11:24, 2.01it/s]
32%|ββββ | 657/2030 [05:40<11:31, 1.99it/s]
32%|ββββ | 658/2030 [05:41<11:21, 2.01it/s]
32%|ββββ | 659/2030 [05:41<11:08, 2.05it/s]
33%|ββββ | 660/2030 [05:42<11:03, 2.07it/s]
33%|ββββ | 661/2030 [05:42<11:14, 2.03it/s]
33%|ββββ | 662/2030 [05:43<10:51, 2.10it/s]
33%|ββββ | 663/2030 [05:43<11:08, 2.05it/s]
33%|ββββ | 664/2030 [05:43<10:24, 2.19it/s]
33%|ββββ | 665/2030 [05:44<10:40, 2.13it/s]
33%|ββββ | 666/2030 [05:44<09:49, 2.31it/s]
33%|ββββ | 667/2030 [05:45<09:04, 2.51it/s]
33%|ββββ | 668/2030 [05:45<09:51, 2.30it/s]
33%|ββββ | 669/2030 [05:46<10:02, 2.26it/s]
33%|ββββ | 670/2030 [05:46<10:05, 2.25it/s]
33%|ββββ | 671/2030 [05:46<09:36, 2.36it/s]
33%|ββββ | 672/2030 [05:47<09:17, 2.43it/s]
33%|ββββ | 673/2030 [05:47<09:15, 2.44it/s]
33%|ββββ | 674/2030 [05:48<11:19, 2.00it/s]
33%|ββββ | 675/2030 [05:48<10:49, 2.09it/s]
33%|ββββ | 676/2030 [05:49<09:53, 2.28it/s]
33%|ββββ | 677/2030 [05:49<09:54, 2.27it/s]
33%|ββββ | 678/2030 [05:50<10:02, 2.24it/s]
33%|ββββ | 679/2030 [05:50<09:58, 2.26it/s]
33%|ββββ | 680/2030 [05:51<10:56, 2.06it/s]
34%|ββββ | 681/2030 [05:51<10:20, 2.18it/s]
34%|ββββ | 682/2030 [05:51<09:39, 2.33it/s]
34%|ββββ | 683/2030 [05:52<09:30, 2.36it/s]
34%|ββββ | 684/2030 [05:52<09:44, 2.30it/s]
34%|ββββ | 685/2030 [05:53<10:04, 2.22it/s]
34%|ββββ | 686/2030 [05:53<09:32, 2.35it/s]
34%|ββββ | 687/2030 [05:53<08:54, 2.51it/s]
34%|ββββ | 688/2030 [05:54<08:44, 2.56it/s]
34%|ββββ | 689/2030 [05:54<09:17, 2.41it/s]
34%|ββββ | 690/2030 [05:55<10:05, 2.21it/s]
34%|ββββ | 691/2030 [05:55<09:26, 2.36it/s]
34%|ββββ | 692/2030 [05:56<09:09, 2.44it/s]
34%|ββββ | 693/2030 [05:56<08:54, 2.50it/s]
34%|ββββ | 694/2030 [05:56<08:48, 2.53it/s]
34%|ββββ | 695/2030 [05:57<09:44, 2.28it/s]
34%|ββββ | 696/2030 [05:57<09:04, 2.45it/s]
34%|ββββ | 697/2030 [05:58<08:55, 2.49it/s]
34%|ββββ | 698/2030 [05:58<09:18, 2.39it/s]
34%|ββββ | 699/2030 [05:59<09:39, 2.30it/s]
34%|ββββ | 700/2030 [05:59<09:36, 2.31it/s]
35%|ββββ | 701/2030 [05:59<09:42, 2.28it/s]
35%|ββββ | 702/2030 [06:00<10:37, 2.08it/s]
35%|ββββ | 703/2030 [06:00<10:19, 2.14it/s]
35%|ββββ | 704/2030 [06:01<10:02, 2.20it/s]
35%|ββββ | 705/2030 [06:01<10:05, 2.19it/s]
35%|ββββ | 706/2030 [06:02<09:31, 2.32it/s]
35%|ββββ | 707/2030 [06:02<09:23, 2.35it/s]
35%|ββββ | 708/2030 [06:03<11:26, 1.93it/s]
35%|ββββ | 709/2030 [06:03<10:21, 2.13it/s]
35%|ββββ | 710/2030 [06:04<10:09, 2.17it/s]
35%|ββββ | 711/2030 [06:04<09:53, 2.22it/s]
35%|ββββ | 712/2030 [06:05<09:55, 2.21it/s]
35%|ββββ | 713/2030 [06:05<09:29, 2.31it/s]
35%|ββββ | 714/2030 [06:05<09:21, 2.35it/s]
35%|ββββ | 715/2030 [06:06<09:37, 2.28it/s]
35%|ββββ | 716/2030 [06:06<10:07, 2.16it/s]
35%|ββββ | 717/2030 [06:07<10:00, 2.19it/s]
35%|ββββ | 718/2030 [06:07<10:00, 2.18it/s]
35%|ββββ | 719/2030 [06:08<09:28, 2.31it/s]
35%|ββββ | 720/2030 [06:08<09:34, 2.28it/s]
36%|ββββ | 721/2030 [06:08<09:35, 2.27it/s]
36%|ββββ | 722/2030 [06:09<09:20, 2.34it/s]
36%|ββββ | 723/2030 [06:09<09:34, 2.27it/s]
36%|ββββ | 724/2030 [06:10<09:50, 2.21it/s]
36%|ββββ | 725/2030 [06:10<09:40, 2.25it/s]
36%|ββββ | 726/2030 [06:11<10:50, 2.00it/s]
36%|ββββ | 727/2030 [06:11<10:34, 2.05it/s]
36%|ββββ | 728/2030 [06:12<10:37, 2.04it/s]
36%|ββββ | 729/2030 [06:12<11:24, 1.90it/s]
36%|ββββ | 730/2030 [06:13<10:46, 2.01it/s]
36%|ββββ | 731/2030 [06:13<09:33, 2.26it/s]
36%|ββββ | 732/2030 [06:14<09:51, 2.20it/s]
36%|ββββ | 733/2030 [06:14<09:28, 2.28it/s]
36%|ββββ | 734/2030 [06:14<09:03, 2.39it/s]
36%|ββββ | 735/2030 [06:15<09:01, 2.39it/s]
36%|ββββ | 736/2030 [06:15<09:52, 2.18it/s]
36%|ββββ | 737/2030 [06:16<09:22, 2.30it/s]
36%|ββββ | 738/2030 [06:16<09:01, 2.39it/s]
36%|ββββ | 739/2030 [06:17<10:37, 2.02it/s]
36%|ββββ | 740/2030 [06:17<09:53, 2.17it/s]
37%|ββββ | 741/2030 [06:18<10:43, 2.00it/s]
37%|ββββ | 742/2030 [06:18<10:12, 2.10it/s]
37%|ββββ | 743/2030 [06:19<09:54, 2.17it/s]
37%|ββββ | 744/2030 [06:19<11:18, 1.89it/s]
37%|ββββ | 745/2030 [06:20<10:36, 2.02it/s]
37%|ββββ | 746/2030 [06:20<10:41, 2.00it/s]
37%|ββββ | 747/2030 [06:21<09:54, 2.16it/s]
37%|ββββ | 748/2030 [06:21<10:14, 2.09it/s]
37%|ββββ | 749/2030 [06:22<10:33, 2.02it/s]
37%|ββββ | 750/2030 [06:22<12:06, 1.76it/s]
37%|ββββ | 751/2030 [06:23<13:29, 1.58it/s]
37%|ββββ | 752/2030 [06:24<11:41, 1.82it/s]
37%|ββββ | 753/2030 [06:24<10:44, 1.98it/s]
37%|ββββ | 754/2030 [06:24<10:23, 2.05it/s]
37%|ββββ | 755/2030 [06:25<10:32, 2.01it/s]
37%|ββββ | 756/2030 [06:25<09:49, 2.16it/s]
37%|ββββ | 757/2030 [06:26<10:56, 1.94it/s]
37%|ββββ | 758/2030 [06:27<12:07, 1.75it/s]
37%|ββββ | 759/2030 [06:27<11:04, 1.91it/s]
37%|ββββ | 760/2030 [06:28<10:38, 1.99it/s]
37%|ββββ | 761/2030 [06:28<10:25, 2.03it/s]
38%|ββββ | 762/2030 [06:29<10:49, 1.95it/s]
38%|ββββ | 763/2030 [06:29<10:38, 1.99it/s]
38%|ββββ | 764/2030 [06:30<13:47, 1.53it/s]
38%|ββββ | 765/2030 [06:30<12:01, 1.75it/s]
38%|ββββ | 766/2030 [06:31<13:41, 1.54it/s]
38%|ββββ | 767/2030 [06:32<12:02, 1.75it/s]
38%|ββββ | 768/2030 [06:32<11:20, 1.85it/s]
38%|ββββ | 769/2030 [06:33<10:40, 1.97it/s]
38%|ββββ | 770/2030 [06:33<11:08, 1.88it/s]
38%|ββββ | 771/2030 [06:34<12:15, 1.71it/s]
38%|ββββ | 772/2030 [06:35<13:18, 1.58it/s]
38%|ββββ | 773/2030 [06:35<12:46, 1.64it/s]
38%|ββββ | 774/2030 [06:36<11:37, 1.80it/s]
38%|ββββ | 775/2030 [06:36<10:36, 1.97it/s]
38%|ββββ | 776/2030 [06:37<10:48, 1.93it/s]
38%|ββββ | 777/2030 [06:37<10:44, 1.94it/s]
38%|ββββ | 778/2030 [06:37<09:53, 2.11it/s]
38%|ββββ | 779/2030 [06:38<09:28, 2.20it/s]
38%|ββββ | 780/2030 [06:38<09:19, 2.24it/s]
38%|ββββ | 781/2030 [06:39<09:01, 2.31it/s]
39%|ββββ | 782/2030 [06:39<08:33, 2.43it/s]
39%|ββββ | 783/2030 [06:39<08:23, 2.48it/s]
39%|ββββ | 784/2030 [06:40<08:30, 2.44it/s]
39%|ββββ | 785/2030 [06:40<08:40, 2.39it/s]
39%|ββββ | 786/2030 [06:41<09:17, 2.23it/s]
39%|ββββ | 787/2030 [06:41<09:55, 2.09it/s]
39%|ββββ | 788/2030 [06:42<09:34, 2.16it/s]
39%|ββββ | 789/2030 [06:42<08:42, 2.37it/s]
39%|ββββ | 790/2030 [06:43<11:16, 1.83it/s]
39%|ββββ | 791/2030 [06:43<10:59, 1.88it/s]
39%|ββββ | 792/2030 [06:44<10:00, 2.06it/s]
39%|ββββ | 793/2030 [06:44<09:41, 2.13it/s]
39%|ββββ | 794/2030 [06:45<09:27, 2.18it/s]
39%|ββββ | 795/2030 [06:45<08:47, 2.34it/s]
39%|ββββ | 796/2030 [06:46<10:28, 1.96it/s]
39%|ββββ | 797/2030 [06:46<09:59, 2.06it/s]
39%|ββββ | 798/2030 [06:46<09:08, 2.25it/s]
39%|ββββ | 799/2030 [06:47<09:00, 2.28it/s]
39%|ββββ | 800/2030 [06:48<10:56, 1.87it/s]
39%|ββββ | 801/2030 [06:48<09:51, 2.08it/s]
40%|ββββ | 802/2030 [06:48<08:58, 2.28it/s]
40%|ββββ | 803/2030 [06:49<08:25, 2.43it/s]
40%|ββββ | 804/2030 [06:49<08:16, 2.47it/s]
40%|ββββ | 805/2030 [06:50<08:21, 2.44it/s]
40%|ββββ | 806/2030 [06:50<08:53, 2.29it/s]
40%|ββββ | 807/2030 [06:50<08:45, 2.33it/s]
40%|ββββ | 808/2030 [06:51<08:34, 2.37it/s]
40%|ββββ | 809/2030 [06:51<08:30, 2.39it/s]
40%|ββββ | 810/2030 [06:52<08:47, 2.31it/s]
40%|ββββ | 811/2030 [06:52<08:38, 2.35it/s]
40%|ββββ | 812/2030 [06:53<09:45, 2.08it/s]
40%|ββββ | 813/2030 [06:53<10:56, 1.85it/s]
40%|ββββ | 814/2030 [06:54<10:10, 1.99it/s][INFO|trainer.py:811] 2024-09-09 12:01:07,104 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 12:01:07,106 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 12:01:07,106 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 12:01:07,106 >> Batch size = 8 |
|
{'eval_loss': 0.1995203047990799, 'eval_precision': 0.6322393822393823, 'eval_recall': 0.7170224411603722, 'eval_f1': 0.671967171069505, 'eval_accuracy': 0.9469665372645898, 'eval_runtime': 5.8448, 'eval_samples_per_second': 430.983, 'eval_steps_per_second': 53.894, 'epoch': 3.0} |
|
|
|
0%| | 0/315 [00:00<?, ?it/s][A |
|
3%|β | 8/315 [00:00<00:03, 78.87it/s][A |
|
5%|β | 16/315 [00:00<00:03, 75.25it/s][A |
|
8%|β | 24/315 [00:00<00:03, 77.25it/s][A |
|
10%|β | 32/315 [00:00<00:03, 72.82it/s][A |
|
13%|ββ | 41/315 [00:00<00:03, 77.32it/s][A |
|
16%|ββ | 49/315 [00:00<00:03, 76.36it/s][A |
|
18%|ββ | 57/315 [00:00<00:03, 76.57it/s][A |
|
21%|ββ | 65/315 [00:00<00:03, 73.55it/s][A |
|
23%|βββ | 74/315 [00:00<00:03, 75.77it/s][A |
|
26%|βββ | 82/315 [00:01<00:03, 71.09it/s][A |
|
29%|βββ | 90/315 [00:01<00:03, 68.40it/s][A |
|
31%|βββ | 97/315 [00:01<00:03, 67.96it/s][A |
|
33%|ββββ | 105/315 [00:01<00:03, 69.58it/s][A |
|
36%|ββββ | 113/315 [00:01<00:02, 71.07it/s][A |
|
38%|ββββ | 121/315 [00:01<00:02, 69.75it/s][A |
|
41%|ββββ | 129/315 [00:01<00:02, 71.23it/s][A |
|
43%|βββββ | 137/315 [00:01<00:02, 69.49it/s][A |
|
46%|βββββ | 144/315 [00:02<00:02, 68.89it/s][A |
|
49%|βββββ | 153/315 [00:02<00:02, 73.61it/s][A |
|
51%|βββββ | 161/315 [00:02<00:02, 72.32it/s][A |
|
54%|ββββββ | 169/315 [00:02<00:02, 72.09it/s][A |
|
56%|ββββββ | 177/315 [00:02<00:01, 71.28it/s][A |
|
59%|ββββββ | 185/315 [00:02<00:01, 69.33it/s][A |
|
61%|ββββββ | 192/315 [00:02<00:01, 69.28it/s][A |
|
63%|βββββββ | 199/315 [00:02<00:01, 66.15it/s][A |
|
65%|βββββββ | 206/315 [00:02<00:01, 64.64it/s][A |
|
68%|βββββββ | 214/315 [00:03<00:01, 68.14it/s][A |
|
70%|βββββββ | 222/315 [00:03<00:01, 70.42it/s][A |
|
73%|ββββββββ | 231/315 [00:03<00:01, 73.54it/s][A |
|
76%|ββββββββ | 239/315 [00:03<00:01, 74.46it/s][A |
|
78%|ββββββββ | 247/315 [00:03<00:00, 70.91it/s][A |
|
81%|ββββββββ | 255/315 [00:03<00:00, 69.76it/s][A |
|
83%|βββββββββ | 263/315 [00:03<00:00, 70.80it/s][A |
|
86%|βββββββββ | 271/315 [00:03<00:00, 72.83it/s][A |
|
89%|βββββββββ | 280/315 [00:03<00:00, 75.33it/s][A |
|
91%|ββββββββββ| 288/315 [00:04<00:00, 72.16it/s][A |
|
94%|ββββββββββ| 296/315 [00:04<00:00, 70.47it/s][A |
|
97%|ββββββββββ| 304/315 [00:04<00:00, 71.42it/s][A |
|
99%|ββββββββββ| 312/315 [00:04<00:00, 71.81it/s][A
|
|
[A
40%|ββββ | 814/2030 [07:00<10:10, 1.99it/s] |
|
100%|ββββββββββ| 315/315 [00:05<00:00, 71.81it/s][A |
|
[A[INFO|trainer.py:3503] 2024-09-09 12:01:12,979 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-814 |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:01:12,981 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-814/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:01:14,015 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-814/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:01:14,016 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-814/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:01:14,016 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-814/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:01:17,796 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:01:17,796 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
40%|ββββ | 815/2030 [07:05<1:14:56, 3.70s/it]
40%|ββββ | 816/2030 [07:05<55:06, 2.72s/it]
40%|ββββ | 817/2030 [07:06<41:38, 2.06s/it]
40%|ββββ | 818/2030 [07:06<31:44, 1.57s/it]
40%|ββββ | 819/2030 [07:07<24:35, 1.22s/it]
40%|ββββ | 820/2030 [07:07<19:39, 1.03it/s]
40%|ββββ | 821/2030 [07:08<16:18, 1.24it/s]
40%|ββββ | 822/2030 [07:08<14:52, 1.35it/s]
41%|ββββ | 823/2030 [07:09<12:30, 1.61it/s]
41%|ββββ | 824/2030 [07:09<11:45, 1.71it/s]
41%|ββββ | 825/2030 [07:10<12:53, 1.56it/s]
41%|ββββ | 826/2030 [07:10<11:30, 1.74it/s]
41%|ββββ | 827/2030 [07:11<11:01, 1.82it/s]
41%|ββββ | 828/2030 [07:11<10:17, 1.95it/s]
41%|ββββ | 829/2030 [07:12<10:03, 1.99it/s]
41%|ββββ | 830/2030 [07:12<10:11, 1.96it/s]
41%|ββββ | 831/2030 [07:13<09:23, 2.13it/s]
41%|ββββ | 832/2030 [07:13<09:22, 2.13it/s]
41%|ββββ | 833/2030 [07:14<11:02, 1.81it/s]
41%|ββββ | 834/2030 [07:14<09:52, 2.02it/s]
41%|ββββ | 835/2030 [07:15<09:28, 2.10it/s]
41%|ββββ | 836/2030 [07:15<09:19, 2.13it/s]
41%|ββββ | 837/2030 [07:15<09:14, 2.15it/s]
41%|βββββ | 838/2030 [07:16<08:57, 2.22it/s]
41%|βββββ | 839/2030 [07:17<10:58, 1.81it/s]
41%|βββββ | 840/2030 [07:17<10:08, 1.96it/s]
41%|βββββ | 841/2030 [07:17<09:19, 2.12it/s]
41%|βββββ | 842/2030 [07:18<09:02, 2.19it/s]
42%|βββββ | 843/2030 [07:18<08:32, 2.32it/s]
42%|βββββ | 844/2030 [07:19<09:20, 2.12it/s]
42%|βββββ | 845/2030 [07:19<08:56, 2.21it/s]
42%|βββββ | 846/2030 [07:20<08:16, 2.39it/s]
42%|βββββ | 847/2030 [07:20<07:49, 2.52it/s]
42%|βββββ | 848/2030 [07:20<07:54, 2.49it/s]
42%|βββββ | 849/2030 [07:21<08:23, 2.35it/s]
42%|βββββ | 850/2030 [07:21<08:22, 2.35it/s]
42%|βββββ | 851/2030 [07:22<10:33, 1.86it/s]
42%|βββββ | 852/2030 [07:23<10:20, 1.90it/s]
42%|βββββ | 853/2030 [07:23<09:57, 1.97it/s]
42%|βββββ | 854/2030 [07:23<09:37, 2.04it/s]
42%|βββββ | 855/2030 [07:24<10:30, 1.86it/s]
42%|βββββ | 856/2030 [07:24<09:32, 2.05it/s]
42%|βββββ | 857/2030 [07:25<09:10, 2.13it/s]
42%|βββββ | 858/2030 [07:25<08:56, 2.18it/s]
42%|βββββ | 859/2030 [07:26<11:58, 1.63it/s]
42%|βββββ | 860/2030 [07:27<11:06, 1.75it/s]
42%|βββββ | 861/2030 [07:28<13:14, 1.47it/s]
42%|βββββ | 862/2030 [07:29<14:19, 1.36it/s]
43%|βββββ | 863/2030 [07:29<13:02, 1.49it/s]
43%|βββββ | 864/2030 [07:30<12:08, 1.60it/s]
43%|βββββ | 865/2030 [07:30<11:54, 1.63it/s]
43%|βββββ | 866/2030 [07:31<10:29, 1.85it/s]
43%|βββββ | 867/2030 [07:31<09:58, 1.94it/s]
43%|βββββ | 868/2030 [07:31<08:57, 2.16it/s]
43%|βββββ | 869/2030 [07:32<09:20, 2.07it/s]
43%|βββββ | 870/2030 [07:32<08:25, 2.29it/s]
43%|βββββ | 871/2030 [07:33<08:36, 2.24it/s]
43%|βββββ | 872/2030 [07:33<08:29, 2.27it/s]
43%|βββββ | 873/2030 [07:34<09:00, 2.14it/s]
43%|βββββ | 874/2030 [07:34<08:03, 2.39it/s]
43%|βββββ | 875/2030 [07:34<08:07, 2.37it/s]
43%|βββββ | 876/2030 [07:35<09:13, 2.09it/s]
43%|βββββ | 877/2030 [07:35<08:29, 2.26it/s]
43%|βββββ | 878/2030 [07:36<10:24, 1.84it/s]
43%|βββββ | 879/2030 [07:37<09:57, 1.93it/s]
43%|βββββ | 880/2030 [07:37<09:39, 1.98it/s]
43%|βββββ | 881/2030 [07:38<10:34, 1.81it/s]
43%|βββββ | 882/2030 [07:38<09:33, 2.00it/s]
43%|βββββ | 883/2030 [07:38<09:09, 2.09it/s]
44%|βββββ | 884/2030 [07:39<09:41, 1.97it/s]
44%|βββββ | 885/2030 [07:40<11:01, 1.73it/s]
44%|βββββ | 886/2030 [07:40<10:45, 1.77it/s]
44%|βββββ | 887/2030 [07:41<09:52, 1.93it/s]
44%|βββββ | 888/2030 [07:41<09:07, 2.09it/s]
44%|βββββ | 889/2030 [07:42<08:49, 2.16it/s]
44%|βββββ | 890/2030 [07:42<08:48, 2.16it/s]
44%|βββββ | 891/2030 [07:42<08:44, 2.17it/s]
44%|βββββ | 892/2030 [07:43<09:25, 2.01it/s]
44%|βββββ | 893/2030 [07:43<08:56, 2.12it/s]
44%|βββββ | 894/2030 [07:44<09:50, 1.92it/s]
44%|βββββ | 895/2030 [07:45<09:43, 1.95it/s]
44%|βββββ | 896/2030 [07:45<09:28, 2.00it/s]
44%|βββββ | 897/2030 [07:46<09:11, 2.06it/s]
44%|βββββ | 898/2030 [07:46<09:03, 2.08it/s]
44%|βββββ | 899/2030 [07:46<08:44, 2.16it/s]
44%|βββββ | 900/2030 [07:47<08:17, 2.27it/s]
44%|βββββ | 901/2030 [07:47<08:14, 2.28it/s]
44%|βββββ | 902/2030 [07:48<08:14, 2.28it/s]
44%|βββββ | 903/2030 [07:48<08:08, 2.31it/s]
45%|βββββ | 904/2030 [07:49<08:52, 2.11it/s]
45%|βββββ | 905/2030 [07:49<08:51, 2.12it/s]
45%|βββββ | 906/2030 [07:50<08:29, 2.21it/s]
45%|βββββ | 907/2030 [07:50<08:45, 2.14it/s]
45%|βββββ | 908/2030 [07:51<08:37, 2.17it/s]
45%|βββββ | 909/2030 [07:51<08:08, 2.29it/s]
45%|βββββ | 910/2030 [07:51<09:03, 2.06it/s]
45%|βββββ | 911/2030 [07:52<08:40, 2.15it/s]
45%|βββββ | 912/2030 [07:52<08:11, 2.28it/s]
45%|βββββ | 913/2030 [07:53<07:59, 2.33it/s]
45%|βββββ | 914/2030 [07:53<08:04, 2.30it/s]
45%|βββββ | 915/2030 [07:54<08:34, 2.17it/s]
45%|βββββ | 916/2030 [07:54<09:57, 1.86it/s]
45%|βββββ | 917/2030 [07:55<10:55, 1.70it/s]
45%|βββββ | 918/2030 [07:56<10:33, 1.75it/s]
45%|βββββ | 919/2030 [07:56<09:59, 1.85it/s]
45%|βββββ | 920/2030 [07:56<08:52, 2.08it/s]
45%|βββββ | 921/2030 [07:57<08:19, 2.22it/s]
45%|βββββ | 922/2030 [07:57<09:24, 1.96it/s]
45%|βββββ | 923/2030 [07:58<09:10, 2.01it/s]
46%|βββββ | 924/2030 [07:58<08:44, 2.11it/s]
46%|βββββ | 925/2030 [07:59<08:41, 2.12it/s]
46%|βββββ | 926/2030 [07:59<08:12, 2.24it/s]
46%|βββββ | 927/2030 [08:00<08:09, 2.25it/s]
46%|βββββ | 928/2030 [08:00<09:13, 1.99it/s]
46%|βββββ | 929/2030 [08:01<09:04, 2.02it/s]
46%|βββββ | 930/2030 [08:01<08:05, 2.27it/s]
46%|βββββ | 931/2030 [08:01<07:42, 2.38it/s]
46%|βββββ | 932/2030 [08:02<07:16, 2.52it/s]
46%|βββββ | 933/2030 [08:02<07:17, 2.51it/s]
46%|βββββ | 934/2030 [08:03<08:26, 2.16it/s]
46%|βββββ | 935/2030 [08:03<08:32, 2.14it/s]
46%|βββββ | 936/2030 [08:04<08:28, 2.15it/s]
46%|βββββ | 937/2030 [08:04<08:08, 2.24it/s]
46%|βββββ | 938/2030 [08:04<07:45, 2.35it/s]
46%|βββββ | 939/2030 [08:05<09:30, 1.91it/s]
46%|βββββ | 940/2030 [08:06<08:38, 2.10it/s]
46%|βββββ | 941/2030 [08:06<08:34, 2.12it/s]
46%|βββββ | 942/2030 [08:07<08:29, 2.13it/s]
46%|βββββ | 943/2030 [08:07<07:58, 2.27it/s]
47%|βββββ | 944/2030 [08:07<07:29, 2.42it/s]
47%|βββββ | 945/2030 [08:08<08:10, 2.21it/s]
47%|βββββ | 946/2030 [08:08<07:56, 2.27it/s]
47%|βββββ | 947/2030 [08:09<07:56, 2.27it/s]
47%|βββββ | 948/2030 [08:09<07:52, 2.29it/s]
47%|βββββ | 949/2030 [08:10<07:51, 2.29it/s]
47%|βββββ | 950/2030 [08:10<08:04, 2.23it/s]
47%|βββββ | 951/2030 [08:10<07:56, 2.26it/s]
47%|βββββ | 952/2030 [08:11<08:05, 2.22it/s]
47%|βββββ | 953/2030 [08:11<08:07, 2.21it/s]
47%|βββββ | 954/2030 [08:12<07:38, 2.35it/s]
47%|βββββ | 955/2030 [08:12<07:50, 2.28it/s]
47%|βββββ | 956/2030 [08:13<08:10, 2.19it/s]
47%|βββββ | 957/2030 [08:13<08:43, 2.05it/s]
47%|βββββ | 958/2030 [08:14<08:10, 2.19it/s]
47%|βββββ | 959/2030 [08:14<08:39, 2.06it/s]
47%|βββββ | 960/2030 [08:15<08:27, 2.11it/s]
47%|βββββ | 961/2030 [08:15<09:09, 1.95it/s]
47%|βββββ | 962/2030 [08:16<08:54, 2.00it/s]
47%|βββββ | 963/2030 [08:16<08:40, 2.05it/s]
47%|βββββ | 964/2030 [08:17<08:04, 2.20it/s]
48%|βββββ | 965/2030 [08:17<08:00, 2.22it/s]
48%|βββββ | 966/2030 [08:18<08:27, 2.10it/s]
48%|βββββ | 967/2030 [08:18<08:09, 2.17it/s]
48%|βββββ | 968/2030 [08:18<08:24, 2.10it/s]
48%|βββββ | 969/2030 [08:19<08:04, 2.19it/s]
48%|βββββ | 970/2030 [08:19<07:36, 2.32it/s]
48%|βββββ | 971/2030 [08:20<09:12, 1.92it/s]
48%|βββββ | 972/2030 [08:20<08:09, 2.16it/s]
48%|βββββ | 973/2030 [08:21<08:19, 2.12it/s]
48%|βββββ | 974/2030 [08:21<07:49, 2.25it/s]
48%|βββββ | 975/2030 [08:22<09:14, 1.90it/s]
48%|βββββ | 976/2030 [08:22<08:25, 2.08it/s]
48%|βββββ | 977/2030 [08:23<07:58, 2.20it/s]
48%|βββββ | 978/2030 [08:23<08:04, 2.17it/s]
48%|βββββ | 979/2030 [08:24<08:10, 2.14it/s]
48%|βββββ | 980/2030 [08:24<07:58, 2.19it/s]
48%|βββββ | 981/2030 [08:24<07:45, 2.26it/s]
48%|βββββ | 982/2030 [08:25<07:31, 2.32it/s]
48%|βββββ | 983/2030 [08:25<07:58, 2.19it/s]
48%|βββββ | 984/2030 [08:26<08:16, 2.11it/s]
49%|βββββ | 985/2030 [08:27<09:02, 1.93it/s]
49%|βββββ | 986/2030 [08:27<08:06, 2.15it/s]
49%|βββββ | 987/2030 [08:27<07:50, 2.22it/s]
49%|βββββ | 988/2030 [08:28<07:24, 2.34it/s]
49%|βββββ | 989/2030 [08:28<07:14, 2.39it/s]
49%|βββββ | 990/2030 [08:29<07:38, 2.27it/s]
49%|βββββ | 991/2030 [08:29<09:04, 1.91it/s]
49%|βββββ | 992/2030 [08:30<08:59, 1.92it/s]
49%|βββββ | 993/2030 [08:30<08:35, 2.01it/s]
49%|βββββ | 994/2030 [08:31<08:06, 2.13it/s]
49%|βββββ | 995/2030 [08:31<07:52, 2.19it/s]
49%|βββββ | 996/2030 [08:32<08:18, 2.07it/s]
49%|βββββ | 997/2030 [08:32<08:16, 2.08it/s]
49%|βββββ | 998/2030 [08:33<08:14, 2.09it/s]
49%|βββββ | 999/2030 [08:33<08:17, 2.07it/s]
49%|βββββ | 1000/2030 [08:34<09:05, 1.89it/s]
49%|βββββ | 1000/2030 [08:34<09:05, 1.89it/s]
49%|βββββ | 1001/2030 [08:34<08:10, 2.10it/s]
49%|βββββ | 1002/2030 [08:34<08:00, 2.14it/s]
49%|βββββ | 1003/2030 [08:35<07:39, 2.24it/s]
49%|βββββ | 1004/2030 [08:35<07:57, 2.15it/s]
50%|βββββ | 1005/2030 [08:36<07:59, 2.14it/s]
50%|βββββ | 1006/2030 [08:36<07:23, 2.31it/s]
50%|βββββ | 1007/2030 [08:37<07:28, 2.28it/s]
50%|βββββ | 1008/2030 [08:37<06:59, 2.43it/s]
50%|βββββ | 1009/2030 [08:37<07:12, 2.36it/s]
50%|βββββ | 1010/2030 [08:38<07:46, 2.19it/s]
50%|βββββ | 1011/2030 [08:38<07:43, 2.20it/s]
50%|βββββ | 1012/2030 [08:39<07:44, 2.19it/s]
50%|βββββ | 1013/2030 [08:39<07:04, 2.40it/s]
50%|βββββ | 1014/2030 [08:40<06:32, 2.59it/s]
50%|βββββ | 1015/2030 [08:40<06:24, 2.64it/s]
50%|βββββ | 1016/2030 [08:40<07:14, 2.34it/s]
50%|βββββ | 1017/2030 [08:41<07:24, 2.28it/s][INFO|trainer.py:811] 2024-09-09 12:02:54,359 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 12:02:54,362 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 12:02:54,362 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 12:02:54,362 >> Batch size = 8 |
|
{'eval_loss': 0.21822449564933777, 'eval_precision': 0.6445872466633712, 'eval_recall': 0.7137383689107827, 'eval_f1': 0.6774025974025973, 'eval_accuracy': 0.9482979883858963, 'eval_runtime': 5.872, 'eval_samples_per_second': 428.988, 'eval_steps_per_second': 53.645, 'epoch': 4.0} |
|
{'loss': 0.0248, 'grad_norm': 0.7616795301437378, 'learning_rate': 2.5369458128078822e-05, 'epoch': 4.91} |
|
|
|
0%| | 0/315 [00:00<?, ?it/s][A |
|
3%|β | 8/315 [00:00<00:04, 75.45it/s][A |
|
5%|β | 16/315 [00:00<00:04, 74.29it/s][A |
|
8%|β | 24/315 [00:00<00:03, 76.05it/s][A |
|
10%|β | 32/315 [00:00<00:03, 71.90it/s][A |
|
13%|ββ | 41/315 [00:00<00:03, 75.80it/s][A |
|
16%|ββ | 49/315 [00:00<00:03, 74.79it/s][A |
|
18%|ββ | 57/315 [00:00<00:03, 74.92it/s][A |
|
21%|ββ | 65/315 [00:00<00:03, 72.35it/s][A |
|
23%|βββ | 74/315 [00:00<00:03, 74.85it/s][A |
|
26%|βββ | 82/315 [00:01<00:03, 70.39it/s][A |
|
29%|βββ | 90/315 [00:01<00:03, 68.06it/s][A |
|
31%|βββ | 97/315 [00:01<00:03, 67.10it/s][A |
|
33%|ββββ | 105/315 [00:01<00:03, 68.68it/s][A |
|
36%|ββββ | 113/315 [00:01<00:02, 70.49it/s][A |
|
38%|ββββ | 121/315 [00:01<00:02, 69.18it/s][A |
|
41%|ββββ | 129/315 [00:01<00:02, 70.47it/s][A |
|
43%|βββββ | 137/315 [00:01<00:02, 69.27it/s][A |
|
46%|βββββ | 144/315 [00:02<00:02, 68.85it/s][A |
|
49%|βββββ | 153/315 [00:02<00:02, 72.92it/s][A |
|
51%|βββββ | 161/315 [00:02<00:02, 71.98it/s][A |
|
54%|ββββββ | 169/315 [00:02<00:02, 71.90it/s][A |
|
56%|ββββββ | 177/315 [00:02<00:01, 71.35it/s][A |
|
59%|ββββββ | 185/315 [00:02<00:01, 69.25it/s][A |
|
61%|ββββββ | 192/315 [00:02<00:01, 69.09it/s][A |
|
63%|βββββββ | 199/315 [00:02<00:01, 66.22it/s][A |
|
65%|βββββββ | 206/315 [00:02<00:01, 64.49it/s][A |
|
68%|βββββββ | 214/315 [00:03<00:01, 67.78it/s][A |
|
70%|βββββββ | 222/315 [00:03<00:01, 70.08it/s][A |
|
73%|ββββββββ | 231/315 [00:03<00:01, 73.70it/s][A |
|
76%|ββββββββ | 239/315 [00:03<00:01, 75.35it/s][A |
|
78%|ββββββββ | 247/315 [00:03<00:00, 71.30it/s][A |
|
81%|ββββββββ | 255/315 [00:03<00:00, 70.04it/s][A |
|
83%|βββββββββ | 263/315 [00:03<00:00, 71.61it/s][A |
|
86%|βββββββββ | 271/315 [00:03<00:00, 73.92it/s][A |
|
89%|βββββββββ | 280/315 [00:03<00:00, 76.67it/s][A |
|
91%|ββββββββββ| 288/315 [00:04<00:00, 73.35it/s][A |
|
94%|ββββββββββ| 296/315 [00:04<00:00, 71.73it/s][A |
|
97%|ββββββββββ| 304/315 [00:04<00:00, 72.86it/s][A |
|
99%|ββββββββββ| 312/315 [00:04<00:00, 72.71it/s][A
|
|
[A
50%|βββββ | 1017/2030 [08:47<07:24, 2.28it/s] |
|
100%|ββββββββββ| 315/315 [00:05<00:00, 72.71it/s][A |
|
[A[INFO|trainer.py:3503] 2024-09-09 12:03:00,209 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-1017 |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:03:00,211 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-1017/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:03:01,226 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-1017/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:03:01,227 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-1017/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:03:01,227 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-1017/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:03:06,669 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:03:06,670 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
50%|βββββ | 1018/2030 [08:54<1:09:19, 4.11s/it]
50%|βββββ | 1019/2030 [08:54<50:22, 2.99s/it]
50%|βββββ | 1020/2030 [08:55<38:43, 2.30s/it]
50%|βββββ | 1021/2030 [08:55<29:04, 1.73s/it]
50%|βββββ | 1022/2030 [08:55<22:11, 1.32s/it]
50%|βββββ | 1023/2030 [08:56<17:48, 1.06s/it]
50%|βββββ | 1024/2030 [08:56<14:35, 1.15it/s]
50%|βββββ | 1025/2030 [08:57<12:26, 1.35it/s]
51%|βββββ | 1026/2030 [08:57<12:14, 1.37it/s]
51%|βββββ | 1027/2030 [08:58<11:09, 1.50it/s]
51%|βββββ | 1028/2030 [08:58<09:45, 1.71it/s]
51%|βββββ | 1029/2030 [08:59<08:39, 1.93it/s]
51%|βββββ | 1030/2030 [08:59<08:13, 2.03it/s]
51%|βββββ | 1031/2030 [09:00<07:36, 2.19it/s]
51%|βββββ | 1032/2030 [09:00<07:42, 2.16it/s]
51%|βββββ | 1033/2030 [09:00<07:22, 2.25it/s]
51%|βββββ | 1034/2030 [09:01<07:16, 2.28it/s]
51%|βββββ | 1035/2030 [09:01<06:45, 2.45it/s]
51%|βββββ | 1036/2030 [09:02<07:09, 2.32it/s]
51%|βββββ | 1037/2030 [09:02<07:01, 2.35it/s]
51%|βββββ | 1038/2030 [09:02<07:01, 2.36it/s]
51%|βββββ | 1039/2030 [09:03<07:01, 2.35it/s]
51%|βββββ | 1040/2030 [09:03<07:25, 2.22it/s]
51%|ββββββ | 1041/2030 [09:04<06:56, 2.38it/s]
51%|ββββββ | 1042/2030 [09:04<07:07, 2.31it/s]
51%|ββββββ | 1043/2030 [09:05<07:39, 2.15it/s]
51%|ββββββ | 1044/2030 [09:05<08:31, 1.93it/s]
51%|ββββββ | 1045/2030 [09:06<08:01, 2.04it/s]
52%|ββββββ | 1046/2030 [09:06<08:02, 2.04it/s]
52%|ββββββ | 1047/2030 [09:07<07:29, 2.19it/s]
52%|ββββββ | 1048/2030 [09:07<07:12, 2.27it/s]
52%|ββββββ | 1049/2030 [09:07<06:57, 2.35it/s]
52%|ββββββ | 1050/2030 [09:08<07:29, 2.18it/s]
52%|ββββββ | 1051/2030 [09:08<07:18, 2.23it/s]
52%|ββββββ | 1052/2030 [09:09<07:40, 2.12it/s]
52%|ββββββ | 1053/2030 [09:09<07:47, 2.09it/s]
52%|ββββββ | 1054/2030 [09:10<08:08, 2.00it/s]
52%|ββββββ | 1055/2030 [09:11<09:29, 1.71it/s]
52%|ββββββ | 1056/2030 [09:11<08:53, 1.82it/s]
52%|ββββββ | 1057/2030 [09:12<08:08, 1.99it/s]
52%|ββββββ | 1058/2030 [09:12<07:20, 2.21it/s]
52%|ββββββ | 1059/2030 [09:12<06:51, 2.36it/s]
52%|ββββββ | 1060/2030 [09:13<07:17, 2.22it/s]
52%|ββββββ | 1061/2030 [09:14<10:14, 1.58it/s]
52%|ββββββ | 1062/2030 [09:15<12:14, 1.32it/s]
52%|ββββββ | 1063/2030 [09:15<10:29, 1.54it/s]
52%|ββββββ | 1064/2030 [09:16<09:10, 1.75it/s]
52%|ββββββ | 1065/2030 [09:16<09:02, 1.78it/s]
53%|ββββββ | 1066/2030 [09:17<09:17, 1.73it/s]
53%|ββββββ | 1067/2030 [09:17<08:49, 1.82it/s]
53%|ββββββ | 1068/2030 [09:18<08:43, 1.84it/s]
53%|ββββββ | 1069/2030 [09:18<08:15, 1.94it/s]
53%|ββββββ | 1070/2030 [09:19<07:59, 2.00it/s]
53%|ββββββ | 1071/2030 [09:19<07:19, 2.18it/s]
53%|ββββββ | 1072/2030 [09:20<06:51, 2.33it/s]
53%|ββββββ | 1073/2030 [09:20<07:02, 2.26it/s]
53%|ββββββ | 1074/2030 [09:20<06:52, 2.32it/s]
53%|ββββββ | 1075/2030 [09:21<07:01, 2.27it/s]
53%|ββββββ | 1076/2030 [09:21<06:59, 2.27it/s]
53%|ββββββ | 1077/2030 [09:22<07:14, 2.20it/s]
53%|ββββββ | 1078/2030 [09:22<07:40, 2.07it/s]
53%|ββββββ | 1079/2030 [09:23<07:13, 2.19it/s]
53%|ββββββ | 1080/2030 [09:23<06:52, 2.30it/s]
53%|ββββββ | 1081/2030 [09:24<06:31, 2.42it/s]
53%|ββββββ | 1082/2030 [09:24<06:47, 2.33it/s]
53%|ββββββ | 1083/2030 [09:24<06:26, 2.45it/s]
53%|ββββββ | 1084/2030 [09:25<06:30, 2.42it/s]
53%|ββββββ | 1085/2030 [09:25<06:46, 2.33it/s]
53%|ββββββ | 1086/2030 [09:26<07:32, 2.08it/s]
54%|ββββββ | 1087/2030 [09:26<07:58, 1.97it/s]
54%|ββββββ | 1088/2030 [09:27<07:51, 2.00it/s]
54%|ββββββ | 1089/2030 [09:27<07:42, 2.03it/s]
54%|ββββββ | 1090/2030 [09:28<07:11, 2.18it/s]
54%|ββββββ | 1091/2030 [09:28<07:21, 2.13it/s]
54%|ββββββ | 1092/2030 [09:29<07:13, 2.16it/s]
54%|ββββββ | 1093/2030 [09:29<08:21, 1.87it/s]
54%|ββββββ | 1094/2030 [09:30<08:01, 1.95it/s]
54%|ββββββ | 1095/2030 [09:30<07:27, 2.09it/s]
54%|ββββββ | 1096/2030 [09:31<07:09, 2.18it/s]
54%|ββββββ | 1097/2030 [09:31<07:21, 2.11it/s]
54%|ββββββ | 1098/2030 [09:32<07:03, 2.20it/s]
54%|ββββββ | 1099/2030 [09:32<06:54, 2.25it/s]
54%|ββββββ | 1100/2030 [09:33<08:24, 1.84it/s]
54%|ββββββ | 1101/2030 [09:33<08:08, 1.90it/s]
54%|ββββββ | 1102/2030 [09:34<07:20, 2.11it/s]
54%|ββββββ | 1103/2030 [09:34<07:13, 2.14it/s]
54%|ββββββ | 1104/2030 [09:34<06:49, 2.26it/s]
54%|ββββββ | 1105/2030 [09:35<06:35, 2.34it/s]
54%|ββββββ | 1106/2030 [09:35<06:49, 2.26it/s]
55%|ββββββ | 1107/2030 [09:36<08:54, 1.73it/s]
55%|ββββββ | 1108/2030 [09:37<08:01, 1.91it/s]
55%|ββββββ | 1109/2030 [09:37<07:30, 2.05it/s]
55%|ββββββ | 1110/2030 [09:37<07:03, 2.17it/s]
55%|ββββββ | 1111/2030 [09:38<06:56, 2.20it/s]
55%|ββββββ | 1112/2030 [09:38<06:43, 2.27it/s]
55%|ββββββ | 1113/2030 [09:39<06:58, 2.19it/s]
55%|ββββββ | 1114/2030 [09:39<06:42, 2.28it/s]
55%|ββββββ | 1115/2030 [09:40<07:08, 2.13it/s]
55%|ββββββ | 1116/2030 [09:40<07:11, 2.12it/s]
55%|ββββββ | 1117/2030 [09:41<06:49, 2.23it/s]
55%|ββββββ | 1118/2030 [09:41<06:36, 2.30it/s]
55%|ββββββ | 1119/2030 [09:42<07:02, 2.16it/s]
55%|ββββββ | 1120/2030 [09:42<06:54, 2.20it/s]
55%|ββββββ | 1121/2030 [09:43<07:20, 2.06it/s]
55%|ββββββ | 1122/2030 [09:43<07:35, 2.00it/s]
55%|ββββββ | 1123/2030 [09:43<07:22, 2.05it/s]
55%|ββββββ | 1124/2030 [09:44<07:01, 2.15it/s]
55%|ββββββ | 1125/2030 [09:44<06:42, 2.25it/s]
55%|ββββββ | 1126/2030 [09:45<06:26, 2.34it/s]
56%|ββββββ | 1127/2030 [09:45<06:27, 2.33it/s]
56%|ββββββ | 1128/2030 [09:45<06:08, 2.44it/s]
56%|ββββββ | 1129/2030 [09:46<06:14, 2.41it/s]
56%|ββββββ | 1130/2030 [09:46<06:26, 2.33it/s]
56%|ββββββ | 1131/2030 [09:47<05:52, 2.55it/s]
56%|ββββββ | 1132/2030 [09:47<05:48, 2.58it/s]
56%|ββββββ | 1133/2030 [09:48<06:15, 2.39it/s]
56%|ββββββ | 1134/2030 [09:48<06:03, 2.47it/s]
56%|ββββββ | 1135/2030 [09:48<06:12, 2.41it/s]
56%|ββββββ | 1136/2030 [09:49<06:13, 2.39it/s]
56%|ββββββ | 1137/2030 [09:49<07:03, 2.11it/s]
56%|ββββββ | 1138/2030 [09:50<06:45, 2.20it/s]
56%|ββββββ | 1139/2030 [09:50<07:21, 2.02it/s]
56%|ββββββ | 1140/2030 [09:51<06:42, 2.21it/s]
56%|ββββββ | 1141/2030 [09:51<06:30, 2.27it/s]
56%|ββββββ | 1142/2030 [09:52<06:36, 2.24it/s]
56%|ββββββ | 1143/2030 [09:52<06:07, 2.41it/s]
56%|ββββββ | 1144/2030 [09:52<05:58, 2.47it/s]
56%|ββββββ | 1145/2030 [09:53<06:43, 2.19it/s]
56%|ββββββ | 1146/2030 [09:54<08:05, 1.82it/s]
57%|ββββββ | 1147/2030 [09:54<07:57, 1.85it/s]
57%|ββββββ | 1148/2030 [09:55<07:54, 1.86it/s]
57%|ββββββ | 1149/2030 [09:56<08:59, 1.63it/s]
57%|ββββββ | 1150/2030 [09:56<09:02, 1.62it/s]
57%|ββββββ | 1151/2030 [09:56<07:45, 1.89it/s]
57%|ββββββ | 1152/2030 [09:57<07:13, 2.03it/s]
57%|ββββββ | 1153/2030 [09:57<07:03, 2.07it/s]
57%|ββββββ | 1154/2030 [09:58<06:28, 2.26it/s]
57%|ββββββ | 1155/2030 [09:58<06:20, 2.30it/s]
57%|ββββββ | 1156/2030 [09:59<06:12, 2.35it/s]
57%|ββββββ | 1157/2030 [09:59<06:27, 2.25it/s]
57%|ββββββ | 1158/2030 [10:00<06:44, 2.15it/s]
57%|ββββββ | 1159/2030 [10:00<06:13, 2.33it/s]
57%|ββββββ | 1160/2030 [10:00<05:58, 2.43it/s]
57%|ββββββ | 1161/2030 [10:01<06:03, 2.39it/s]
57%|ββββββ | 1162/2030 [10:01<05:47, 2.50it/s]
57%|ββββββ | 1163/2030 [10:01<06:00, 2.41it/s]
57%|ββββββ | 1164/2030 [10:02<06:17, 2.29it/s]
57%|ββββββ | 1165/2030 [10:02<06:17, 2.29it/s]
57%|ββββββ | 1166/2030 [10:03<06:24, 2.25it/s]
57%|ββββββ | 1167/2030 [10:03<05:59, 2.40it/s]
58%|ββββββ | 1168/2030 [10:04<07:03, 2.04it/s]
58%|ββββββ | 1169/2030 [10:04<06:50, 2.10it/s]
58%|ββββββ | 1170/2030 [10:05<08:30, 1.68it/s]
58%|ββββββ | 1171/2030 [10:06<08:05, 1.77it/s]
58%|ββββββ | 1172/2030 [10:06<07:29, 1.91it/s]
58%|ββββββ | 1173/2030 [10:07<06:58, 2.05it/s]
58%|ββββββ | 1174/2030 [10:07<06:30, 2.19it/s]
58%|ββββββ | 1175/2030 [10:07<06:24, 2.22it/s]
58%|ββββββ | 1176/2030 [10:08<06:11, 2.30it/s]
58%|ββββββ | 1177/2030 [10:08<06:56, 2.05it/s]
58%|ββββββ | 1178/2030 [10:09<07:06, 2.00it/s]
58%|ββββββ | 1179/2030 [10:09<06:39, 2.13it/s]
58%|ββββββ | 1180/2030 [10:10<06:14, 2.27it/s]
58%|ββββββ | 1181/2030 [10:10<06:11, 2.28it/s]
58%|ββββββ | 1182/2030 [10:11<06:31, 2.16it/s]
58%|ββββββ | 1183/2030 [10:11<06:30, 2.17it/s]
58%|ββββββ | 1184/2030 [10:12<06:29, 2.17it/s]
58%|ββββββ | 1185/2030 [10:12<06:29, 2.17it/s]
58%|ββββββ | 1186/2030 [10:12<06:16, 2.24it/s]
58%|ββββββ | 1187/2030 [10:13<06:44, 2.08it/s]
59%|ββββββ | 1188/2030 [10:13<06:23, 2.20it/s]
59%|ββββββ | 1189/2030 [10:14<06:58, 2.01it/s]
59%|ββββββ | 1190/2030 [10:14<06:49, 2.05it/s]
59%|ββββββ | 1191/2030 [10:15<06:23, 2.19it/s]
59%|ββββββ | 1192/2030 [10:15<06:16, 2.22it/s]
59%|ββββββ | 1193/2030 [10:16<06:50, 2.04it/s]
59%|ββββββ | 1194/2030 [10:16<06:36, 2.11it/s]
59%|ββββββ | 1195/2030 [10:17<06:18, 2.21it/s]
59%|ββββββ | 1196/2030 [10:17<06:57, 2.00it/s]
59%|ββββββ | 1197/2030 [10:18<07:00, 1.98it/s]
59%|ββββββ | 1198/2030 [10:18<06:53, 2.01it/s]
59%|ββββββ | 1199/2030 [10:19<06:26, 2.15it/s]
59%|ββββββ | 1200/2030 [10:19<06:14, 2.21it/s]
59%|ββββββ | 1201/2030 [10:20<06:10, 2.24it/s]
59%|ββββββ | 1202/2030 [10:20<06:09, 2.24it/s]
59%|ββββββ | 1203/2030 [10:21<06:38, 2.08it/s]
59%|ββββββ | 1204/2030 [10:21<06:34, 2.09it/s]
59%|ββββββ | 1205/2030 [10:21<06:39, 2.07it/s]
59%|ββββββ | 1206/2030 [10:22<06:01, 2.28it/s]
59%|ββββββ | 1207/2030 [10:22<06:05, 2.25it/s]
60%|ββββββ | 1208/2030 [10:23<05:53, 2.33it/s]
60%|ββββββ | 1209/2030 [10:23<05:37, 2.43it/s]
60%|ββββββ | 1210/2030 [10:24<05:54, 2.31it/s]
60%|ββββββ | 1211/2030 [10:24<05:42, 2.39it/s]
60%|ββββββ | 1212/2030 [10:24<06:12, 2.19it/s]
60%|ββββββ | 1213/2030 [10:25<07:38, 1.78it/s]
60%|ββββββ | 1214/2030 [10:26<06:55, 1.97it/s]
60%|ββββββ | 1215/2030 [10:26<06:25, 2.11it/s]
60%|ββββββ | 1216/2030 [10:27<07:30, 1.81it/s]
60%|ββββββ | 1217/2030 [10:27<06:49, 1.98it/s]
60%|ββββββ | 1218/2030 [10:28<06:40, 2.03it/s]
60%|ββββββ | 1219/2030 [10:28<06:32, 2.07it/s]
60%|ββββββ | 1220/2030 [10:29<07:48, 1.73it/s]
60%|ββββββ | 1221/2030 [10:29<06:46, 1.99it/s][INFO|trainer.py:811] 2024-09-09 12:04:42,494 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 12:04:42,496 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 12:04:42,496 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 12:04:42,496 >> Batch size = 8 |
|
{'eval_loss': 0.24612903594970703, 'eval_precision': 0.6251184834123222, 'eval_recall': 0.7219485495347564, 'eval_f1': 0.6700533401066802, 'eval_accuracy': 0.9448650903140942, 'eval_runtime': 5.8462, 'eval_samples_per_second': 430.877, 'eval_steps_per_second': 53.881, 'epoch': 5.0} |
|
|
|
0%| | 0/315 [00:00<?, ?it/s][A |
|
3%|β | 8/315 [00:00<00:03, 77.97it/s][A |
|
5%|β | 16/315 [00:00<00:03, 74.88it/s][A |
|
8%|β | 24/315 [00:00<00:03, 76.31it/s][A |
|
10%|β | 32/315 [00:00<00:03, 72.11it/s][A |
|
13%|ββ | 41/315 [00:00<00:03, 76.30it/s][A |
|
16%|ββ | 49/315 [00:00<00:03, 75.54it/s][A |
|
18%|ββ | 57/315 [00:00<00:03, 76.07it/s][A |
|
21%|ββ | 65/315 [00:00<00:03, 73.35it/s][A |
|
23%|βββ | 73/315 [00:00<00:03, 75.28it/s][A |
|
26%|βββ | 81/315 [00:01<00:03, 70.69it/s][A |
|
28%|βββ | 89/315 [00:01<00:03, 67.74it/s][A |
|
31%|βββ | 97/315 [00:01<00:03, 67.90it/s][A |
|
33%|ββββ | 105/315 [00:01<00:03, 69.26it/s][A |
|
36%|ββββ | 113/315 [00:01<00:02, 70.83it/s][A |
|
38%|ββββ | 121/315 [00:01<00:02, 69.26it/s][A |
|
41%|ββββ | 129/315 [00:01<00:02, 70.05it/s][A |
|
43%|βββββ | 137/315 [00:01<00:02, 69.86it/s][A |
|
46%|βββββ | 145/315 [00:02<00:02, 69.98it/s][A |
|
49%|βββββ | 154/315 [00:02<00:02, 72.98it/s][A |
|
51%|ββββββ | 162/315 [00:02<00:02, 71.62it/s][A |
|
54%|ββββββ | 170/315 [00:02<00:02, 71.50it/s][A |
|
57%|ββββββ | 178/315 [00:02<00:01, 70.67it/s][A |
|
59%|ββββββ | 186/315 [00:02<00:01, 68.80it/s][A |
|
61%|βββββββ | 193/315 [00:02<00:01, 68.00it/s][A |
|
63%|βββββββ | 200/315 [00:02<00:01, 65.53it/s][A |
|
66%|βββββββ | 207/315 [00:02<00:01, 64.23it/s][A |
|
68%|βββββββ | 215/315 [00:03<00:01, 67.46it/s][A |
|
71%|βββββββ | 223/315 [00:03<00:01, 69.72it/s][A |
|
74%|ββββββββ | 232/315 [00:03<00:01, 73.12it/s][A |
|
76%|ββββββββ | 240/315 [00:03<00:01, 72.64it/s][A |
|
79%|ββββββββ | 248/315 [00:03<00:00, 70.33it/s][A |
|
81%|βββββββββ | 256/315 [00:03<00:00, 68.45it/s][A |
|
84%|βββββββββ | 264/315 [00:03<00:00, 69.38it/s][A |
|
86%|βββββββββ | 272/315 [00:03<00:00, 71.97it/s][A |
|
89%|βββββββββ | 281/315 [00:03<00:00, 74.70it/s][A |
|
92%|ββββββββββ| 289/315 [00:04<00:00, 71.14it/s][A |
|
94%|ββββββββββ| 297/315 [00:04<00:00, 71.29it/s][A |
|
97%|ββββββββββ| 305/315 [00:04<00:00, 72.64it/s][A |
|
99%|ββββββββββ| 313/315 [00:04<00:00, 71.74it/s][A
|
|
[A
60%|ββββββ | 1221/2030 [10:35<06:46, 1.99it/s] |
|
100%|ββββββββββ| 315/315 [00:05<00:00, 71.74it/s][A |
|
[A[INFO|trainer.py:3503] 2024-09-09 12:04:48,404 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-1221 |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:04:48,406 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-1221/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:04:49,434 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-1221/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:04:49,435 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-1221/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:04:49,436 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-1221/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:04:52,502 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:04:52,502 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
60%|ββββββ | 1222/2030 [10:40<46:42, 3.47s/it]
60%|ββββββ | 1223/2030 [10:40<34:30, 2.57s/it]
60%|ββββββ | 1224/2030 [10:40<25:50, 1.92s/it]
60%|ββββββ | 1225/2030 [10:41<19:41, 1.47s/it]
60%|ββββββ | 1226/2030 [10:41<15:06, 1.13s/it]
60%|ββββββ | 1227/2030 [10:42<12:16, 1.09it/s]
60%|ββββββ | 1228/2030 [10:42<10:36, 1.26it/s]
61%|ββββββ | 1229/2030 [10:43<09:27, 1.41it/s]
61%|ββββββ | 1230/2030 [10:43<09:11, 1.45it/s]
61%|ββββββ | 1231/2030 [10:44<08:45, 1.52it/s]
61%|ββββββ | 1232/2030 [10:44<07:48, 1.70it/s]
61%|ββββββ | 1233/2030 [10:45<07:37, 1.74it/s]
61%|ββββββ | 1234/2030 [10:45<06:54, 1.92it/s]
61%|ββββββ | 1235/2030 [10:46<06:58, 1.90it/s]
61%|ββββββ | 1236/2030 [10:46<06:43, 1.97it/s]
61%|ββββββ | 1237/2030 [10:47<06:19, 2.09it/s]
61%|ββββββ | 1238/2030 [10:47<06:10, 2.14it/s]
61%|ββββββ | 1239/2030 [10:48<06:07, 2.15it/s]
61%|ββββββ | 1240/2030 [10:48<05:47, 2.28it/s]
61%|ββββββ | 1241/2030 [10:48<05:34, 2.36it/s]
61%|ββββββ | 1242/2030 [10:49<05:30, 2.38it/s]
61%|ββββββ | 1243/2030 [10:49<05:15, 2.50it/s]
61%|βββββββ | 1244/2030 [10:49<05:00, 2.62it/s]
61%|βββββββ | 1245/2030 [10:50<05:39, 2.31it/s]
61%|βββββββ | 1246/2030 [10:50<05:23, 2.42it/s]
61%|βββββββ | 1247/2030 [10:51<05:31, 2.36it/s]
61%|βββββββ | 1248/2030 [10:51<05:42, 2.29it/s]
62%|βββββββ | 1249/2030 [10:52<05:58, 2.18it/s]
62%|βββββββ | 1250/2030 [10:52<05:54, 2.20it/s]
62%|βββββββ | 1251/2030 [10:53<05:23, 2.41it/s]
62%|βββββββ | 1252/2030 [10:53<05:29, 2.36it/s]
62%|βββββββ | 1253/2030 [10:53<05:18, 2.44it/s]
62%|βββββββ | 1254/2030 [10:54<05:21, 2.41it/s]
62%|βββββββ | 1255/2030 [10:54<05:08, 2.51it/s]
62%|βββββββ | 1256/2030 [10:54<04:53, 2.64it/s]
62%|βββββββ | 1257/2030 [10:55<05:20, 2.41it/s]
62%|βββββββ | 1258/2030 [10:55<05:12, 2.47it/s]
62%|βββββββ | 1259/2030 [10:56<05:34, 2.31it/s]
62%|βββββββ | 1260/2030 [10:56<05:34, 2.30it/s]
62%|βββββββ | 1261/2030 [10:57<05:52, 2.18it/s]
62%|βββββββ | 1262/2030 [10:57<05:34, 2.30it/s]
62%|βββββββ | 1263/2030 [10:58<05:31, 2.31it/s]
62%|βββββββ | 1264/2030 [10:58<05:32, 2.31it/s]
62%|βββββββ | 1265/2030 [10:59<06:11, 2.06it/s]
62%|βββββββ | 1266/2030 [10:59<06:21, 2.00it/s]
62%|βββββββ | 1267/2030 [11:00<05:57, 2.14it/s]
62%|βββββββ | 1268/2030 [11:00<06:53, 1.84it/s]
63%|βββββββ | 1269/2030 [11:01<06:15, 2.03it/s]
63%|βββββββ | 1270/2030 [11:01<06:52, 1.84it/s]
63%|βββββββ | 1271/2030 [11:02<06:33, 1.93it/s]
63%|βββββββ | 1272/2030 [11:02<06:29, 1.95it/s]
63%|βββββββ | 1273/2030 [11:03<07:00, 1.80it/s]
63%|βββββββ | 1274/2030 [11:03<06:38, 1.89it/s]
63%|βββββββ | 1275/2030 [11:04<07:03, 1.78it/s]
63%|βββββββ | 1276/2030 [11:04<06:25, 1.95it/s]
63%|βββββββ | 1277/2030 [11:05<06:16, 2.00it/s]
63%|βββββββ | 1278/2030 [11:05<06:06, 2.05it/s]
63%|βββββββ | 1279/2030 [11:06<05:57, 2.10it/s]
63%|βββββββ | 1280/2030 [11:06<05:35, 2.23it/s]
63%|βββββββ | 1281/2030 [11:07<05:39, 2.21it/s]
63%|βββββββ | 1282/2030 [11:07<05:58, 2.09it/s]
63%|βββββββ | 1283/2030 [11:08<05:59, 2.08it/s]
63%|βββββββ | 1284/2030 [11:08<05:41, 2.19it/s]
63%|βββββββ | 1285/2030 [11:09<05:25, 2.29it/s]
63%|βββββββ | 1286/2030 [11:09<05:27, 2.27it/s]
63%|βββββββ | 1287/2030 [11:10<05:50, 2.12it/s]
63%|βββββββ | 1288/2030 [11:10<05:39, 2.19it/s]
63%|βββββββ | 1289/2030 [11:10<06:00, 2.06it/s]
64%|βββββββ | 1290/2030 [11:11<05:28, 2.25it/s]
64%|βββββββ | 1291/2030 [11:11<05:15, 2.34it/s]
64%|βββββββ | 1292/2030 [11:12<05:38, 2.18it/s]
64%|βββββββ | 1293/2030 [11:12<05:11, 2.37it/s]
64%|βββββββ | 1294/2030 [11:13<05:12, 2.36it/s]
64%|βββββββ | 1295/2030 [11:13<05:44, 2.13it/s]
64%|βββββββ | 1296/2030 [11:14<05:48, 2.11it/s]
64%|βββββββ | 1297/2030 [11:14<05:26, 2.25it/s]
64%|βββββββ | 1298/2030 [11:15<05:58, 2.04it/s]
64%|βββββββ | 1299/2030 [11:15<06:25, 1.90it/s]
64%|βββββββ | 1300/2030 [11:16<05:56, 2.04it/s]
64%|βββββββ | 1301/2030 [11:16<06:46, 1.79it/s]
64%|βββββββ | 1302/2030 [11:17<06:17, 1.93it/s]
64%|βββββββ | 1303/2030 [11:17<05:43, 2.11it/s]
64%|βββββββ | 1304/2030 [11:18<05:44, 2.10it/s]
64%|βββββββ | 1305/2030 [11:18<05:46, 2.09it/s]
64%|βββββββ | 1306/2030 [11:18<05:23, 2.24it/s]
64%|βββββββ | 1307/2030 [11:19<05:05, 2.36it/s]
64%|βββββββ | 1308/2030 [11:19<05:22, 2.24it/s]
64%|βββββββ | 1309/2030 [11:20<05:12, 2.31it/s]
65%|βββββββ | 1310/2030 [11:20<05:07, 2.34it/s]
65%|βββββββ | 1311/2030 [11:21<05:04, 2.36it/s]
65%|βββββββ | 1312/2030 [11:21<05:58, 2.00it/s]
65%|βββββββ | 1313/2030 [11:22<05:47, 2.06it/s]
65%|βββββββ | 1314/2030 [11:22<05:26, 2.19it/s]
65%|βββββββ | 1315/2030 [11:22<05:13, 2.28it/s]
65%|βββββββ | 1316/2030 [11:23<05:18, 2.24it/s]
65%|βββββββ | 1317/2030 [11:23<05:21, 2.22it/s]
65%|βββββββ | 1318/2030 [11:24<04:57, 2.39it/s]
65%|βββββββ | 1319/2030 [11:24<04:58, 2.38it/s]
65%|βββββββ | 1320/2030 [11:25<04:57, 2.38it/s]
65%|βββββββ | 1321/2030 [11:25<05:18, 2.23it/s]
65%|βββββββ | 1322/2030 [11:25<05:05, 2.32it/s]
65%|βββββββ | 1323/2030 [11:26<05:33, 2.12it/s]
65%|βββββββ | 1324/2030 [11:27<06:41, 1.76it/s]
65%|βββββββ | 1325/2030 [11:27<06:31, 1.80it/s]
65%|βββββββ | 1326/2030 [11:28<05:57, 1.97it/s]
65%|βββββββ | 1327/2030 [11:28<05:52, 1.99it/s]
65%|βββββββ | 1328/2030 [11:29<05:34, 2.10it/s]
65%|βββββββ | 1329/2030 [11:29<05:44, 2.03it/s]
66%|βββββββ | 1330/2030 [11:30<06:04, 1.92it/s]
66%|βββββββ | 1331/2030 [11:31<06:54, 1.69it/s]
66%|βββββββ | 1332/2030 [11:31<06:18, 1.84it/s]
66%|βββββββ | 1333/2030 [11:31<06:01, 1.93it/s]
66%|βββββββ | 1334/2030 [11:32<05:35, 2.08it/s]
66%|βββββββ | 1335/2030 [11:32<05:16, 2.20it/s]
66%|βββββββ | 1336/2030 [11:33<05:03, 2.29it/s]
66%|βββββββ | 1337/2030 [11:33<04:49, 2.39it/s]
66%|βββββββ | 1338/2030 [11:33<04:51, 2.37it/s]
66%|βββββββ | 1339/2030 [11:34<04:45, 2.42it/s]
66%|βββββββ | 1340/2030 [11:34<04:52, 2.36it/s]
66%|βββββββ | 1341/2030 [11:35<05:53, 1.95it/s]
66%|βββββββ | 1342/2030 [11:35<05:47, 1.98it/s]
66%|βββββββ | 1343/2030 [11:36<05:19, 2.15it/s]
66%|βββββββ | 1344/2030 [11:36<05:37, 2.03it/s]
66%|βββββββ | 1345/2030 [11:37<05:32, 2.06it/s]
66%|βββββββ | 1346/2030 [11:37<05:13, 2.18it/s]
66%|βββββββ | 1347/2030 [11:38<04:55, 2.31it/s]
66%|βββββββ | 1348/2030 [11:38<04:58, 2.29it/s]
66%|βββββββ | 1349/2030 [11:38<04:55, 2.30it/s]
67%|βββββββ | 1350/2030 [11:39<05:00, 2.26it/s]
67%|βββββββ | 1351/2030 [11:39<04:56, 2.29it/s]
67%|βββββββ | 1352/2030 [11:40<05:05, 2.22it/s]
67%|βββββββ | 1353/2030 [11:40<05:06, 2.21it/s]
67%|βββββββ | 1354/2030 [11:41<05:55, 1.90it/s]
67%|βββββββ | 1355/2030 [11:42<06:26, 1.75it/s]
67%|βββββββ | 1356/2030 [11:42<05:54, 1.90it/s]
67%|βββββββ | 1357/2030 [11:43<05:35, 2.01it/s]
67%|βββββββ | 1358/2030 [11:43<05:16, 2.12it/s]
67%|βββββββ | 1359/2030 [11:43<05:32, 2.02it/s]
67%|βββββββ | 1360/2030 [11:44<05:28, 2.04it/s]
67%|βββββββ | 1361/2030 [11:45<05:42, 1.96it/s]
67%|βββββββ | 1362/2030 [11:45<05:17, 2.10it/s]
67%|βββββββ | 1363/2030 [11:45<05:08, 2.16it/s]
67%|βββββββ | 1364/2030 [11:46<05:10, 2.14it/s]
67%|βββββββ | 1365/2030 [11:47<06:07, 1.81it/s]
67%|βββββββ | 1366/2030 [11:47<05:39, 1.95it/s]
67%|βββββββ | 1367/2030 [11:48<05:59, 1.84it/s]
67%|βββββββ | 1368/2030 [11:49<07:37, 1.45it/s]
67%|βββββββ | 1369/2030 [11:49<06:22, 1.73it/s]
67%|βββββββ | 1370/2030 [11:49<05:55, 1.85it/s]
68%|βββββββ | 1371/2030 [11:50<05:42, 1.92it/s]
68%|βββββββ | 1372/2030 [11:50<05:22, 2.04it/s]
68%|βββββββ | 1373/2030 [11:51<04:57, 2.21it/s]
68%|βββββββ | 1374/2030 [11:51<04:44, 2.31it/s]
68%|βββββββ | 1375/2030 [11:52<04:58, 2.19it/s]
68%|βββββββ | 1376/2030 [11:52<05:04, 2.15it/s]
68%|βββββββ | 1377/2030 [11:53<05:08, 2.12it/s]
68%|βββββββ | 1378/2030 [11:53<04:50, 2.24it/s]
68%|βββββββ | 1379/2030 [11:53<05:10, 2.09it/s]
68%|βββββββ | 1380/2030 [11:54<04:52, 2.22it/s]
68%|βββββββ | 1381/2030 [11:54<04:47, 2.25it/s]
68%|βββββββ | 1382/2030 [11:55<04:50, 2.23it/s]
68%|βββββββ | 1383/2030 [11:55<04:58, 2.17it/s]
68%|βββββββ | 1384/2030 [11:56<04:49, 2.23it/s]
68%|βββββββ | 1385/2030 [11:56<04:43, 2.27it/s]
68%|βββββββ | 1386/2030 [11:57<05:01, 2.13it/s]
68%|βββββββ | 1387/2030 [11:57<04:57, 2.16it/s]
68%|βββββββ | 1388/2030 [11:58<04:54, 2.18it/s]
68%|βββββββ | 1389/2030 [11:58<04:57, 2.15it/s]
68%|βββββββ | 1390/2030 [11:58<04:33, 2.34it/s]
69%|βββββββ | 1391/2030 [11:59<04:30, 2.37it/s]
69%|βββββββ | 1392/2030 [11:59<04:24, 2.42it/s]
69%|βββββββ | 1393/2030 [12:00<04:18, 2.47it/s]
69%|βββββββ | 1394/2030 [12:00<04:20, 2.44it/s]
69%|βββββββ | 1395/2030 [12:00<04:24, 2.40it/s]
69%|βββββββ | 1396/2030 [12:01<05:07, 2.06it/s]
69%|βββββββ | 1397/2030 [12:02<05:16, 2.00it/s]
69%|βββββββ | 1398/2030 [12:02<05:08, 2.05it/s]
69%|βββββββ | 1399/2030 [12:03<05:20, 1.97it/s]
69%|βββββββ | 1400/2030 [12:03<05:05, 2.06it/s]
69%|βββββββ | 1401/2030 [12:04<06:02, 1.73it/s]
69%|βββββββ | 1402/2030 [12:04<05:57, 1.76it/s]
69%|βββββββ | 1403/2030 [12:05<05:56, 1.76it/s]
69%|βββββββ | 1404/2030 [12:05<05:24, 1.93it/s]
69%|βββββββ | 1405/2030 [12:06<04:57, 2.10it/s]
69%|βββββββ | 1406/2030 [12:06<04:57, 2.10it/s]
69%|βββββββ | 1407/2030 [12:07<04:57, 2.09it/s]
69%|βββββββ | 1408/2030 [12:07<04:51, 2.14it/s]
69%|βββββββ | 1409/2030 [12:08<05:42, 1.82it/s]
69%|βββββββ | 1410/2030 [12:08<05:03, 2.04it/s]
70%|βββββββ | 1411/2030 [12:09<04:57, 2.08it/s]
70%|βββββββ | 1412/2030 [12:09<04:44, 2.17it/s]
70%|βββββββ | 1413/2030 [12:10<04:39, 2.21it/s]
70%|βββββββ | 1414/2030 [12:10<04:32, 2.26it/s]
70%|βββββββ | 1415/2030 [12:10<04:26, 2.30it/s]
70%|βββββββ | 1416/2030 [12:11<04:09, 2.46it/s]
70%|βββββββ | 1417/2030 [12:11<04:20, 2.35it/s]
70%|βββββββ | 1418/2030 [12:12<04:12, 2.42it/s]
70%|βββββββ | 1419/2030 [12:12<04:07, 2.47it/s]
70%|βββββββ | 1420/2030 [12:13<04:42, 2.16it/s]
70%|βββββββ | 1421/2030 [12:13<04:41, 2.16it/s]
70%|βββββββ | 1422/2030 [12:14<05:33, 1.83it/s]
70%|βββββββ | 1423/2030 [12:14<05:08, 1.97it/s]
70%|βββββββ | 1424/2030 [12:15<04:43, 2.13it/s][INFO|trainer.py:811] 2024-09-09 12:06:27,952 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 12:06:27,954 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 12:06:27,954 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 12:06:27,954 >> Batch size = 8 |
|
{'eval_loss': 0.26953065395355225, 'eval_precision': 0.6410379625180201, 'eval_recall': 0.7301587301587301, 'eval_f1': 0.6827021494370521, 'eval_accuracy': 0.9469023709454907, 'eval_runtime': 5.9067, 'eval_samples_per_second': 426.468, 'eval_steps_per_second': 53.33, 'epoch': 6.0} |
|
|
|
0%| | 0/315 [00:00<?, ?it/s][A |
|
3%|β | 8/315 [00:00<00:04, 76.27it/s][A |
|
5%|β | 16/315 [00:00<00:03, 75.30it/s][A |
|
8%|β | 24/315 [00:00<00:03, 76.31it/s][A |
|
10%|β | 32/315 [00:00<00:03, 71.38it/s][A |
|
13%|ββ | 41/315 [00:00<00:03, 75.54it/s][A |
|
16%|ββ | 49/315 [00:00<00:03, 74.62it/s][A |
|
18%|ββ | 57/315 [00:00<00:03, 74.93it/s][A |
|
21%|ββ | 65/315 [00:00<00:03, 72.52it/s][A |
|
23%|βββ | 74/315 [00:00<00:03, 75.02it/s][A |
|
26%|βββ | 82/315 [00:01<00:03, 70.42it/s][A |
|
29%|βββ | 90/315 [00:01<00:03, 68.33it/s][A |
|
31%|βββ | 97/315 [00:01<00:03, 67.43it/s][A |
|
33%|ββββ | 105/315 [00:01<00:03, 69.19it/s][A |
|
36%|ββββ | 113/315 [00:01<00:02, 70.44it/s][A |
|
38%|ββββ | 121/315 [00:01<00:02, 69.21it/s][A |
|
41%|ββββ | 129/315 [00:01<00:02, 70.53it/s][A |
|
43%|βββββ | 137/315 [00:01<00:02, 68.92it/s][A |
|
46%|βββββ | 144/315 [00:02<00:02, 68.51it/s][A |
|
49%|βββββ | 153/315 [00:02<00:02, 72.85it/s][A |
|
51%|βββββ | 161/315 [00:02<00:02, 72.00it/s][A |
|
54%|ββββββ | 169/315 [00:02<00:02, 71.83it/s][A |
|
56%|ββββββ | 177/315 [00:02<00:01, 71.12it/s][A |
|
59%|ββββββ | 185/315 [00:02<00:01, 69.11it/s][A |
|
61%|ββββββ | 192/315 [00:02<00:01, 69.24it/s][A |
|
63%|βββββββ | 199/315 [00:02<00:01, 66.28it/s][A |
|
65%|βββββββ | 206/315 [00:02<00:01, 64.47it/s][A |
|
68%|βββββββ | 214/315 [00:03<00:01, 67.97it/s][A |
|
70%|βββββββ | 222/315 [00:03<00:01, 70.11it/s][A |
|
73%|ββββββββ | 231/315 [00:03<00:01, 73.40it/s][A |
|
76%|ββββββββ | 239/315 [00:03<00:01, 74.72it/s][A |
|
78%|ββββββββ | 247/315 [00:03<00:00, 70.29it/s][A |
|
81%|ββββββββ | 255/315 [00:03<00:00, 68.85it/s][A |
|
83%|βββββββββ | 263/315 [00:03<00:00, 70.75it/s][A |
|
86%|βββββββββ | 272/315 [00:03<00:00, 73.64it/s][A |
|
89%|βββββββββ | 281/315 [00:03<00:00, 76.10it/s][A |
|
92%|ββββββββββ| 289/315 [00:04<00:00, 71.63it/s][A |
|
94%|ββββββββββ| 297/315 [00:04<00:00, 71.11it/s][A |
|
97%|ββββββββββ| 305/315 [00:04<00:00, 72.37it/s][A |
|
99%|ββββββββββ| 313/315 [00:04<00:00, 71.70it/s][A
|
|
[A
70%|βββββββ | 1424/2030 [12:21<04:43, 2.13it/s] |
|
100%|ββββββββββ| 315/315 [00:05<00:00, 71.70it/s][A |
|
[A[INFO|trainer.py:3503] 2024-09-09 12:06:33,812 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-1424 |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:06:33,814 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-1424/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:06:34,834 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-1424/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:06:34,835 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-1424/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:06:34,835 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-1424/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:06:39,873 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:06:39,873 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
70%|βββββββ | 1425/2030 [12:27<40:50, 4.05s/it]
70%|βββββββ | 1426/2030 [12:27<29:45, 2.96s/it]
70%|βββββββ | 1427/2030 [12:28<23:04, 2.30s/it]
70%|βββββββ | 1428/2030 [12:29<17:30, 1.74s/it]
70%|βββββββ | 1429/2030 [12:29<14:00, 1.40s/it]
70%|βββββββ | 1430/2030 [12:30<10:59, 1.10s/it]
70%|βββββββ | 1431/2030 [12:30<09:11, 1.09it/s]
71%|βββββββ | 1432/2030 [12:30<07:32, 1.32it/s]
71%|βββββββ | 1433/2030 [12:31<06:46, 1.47it/s]
71%|βββββββ | 1434/2030 [12:31<05:56, 1.67it/s]
71%|βββββββ | 1435/2030 [12:32<05:45, 1.72it/s]
71%|βββββββ | 1436/2030 [12:32<05:28, 1.81it/s]
71%|βββββββ | 1437/2030 [12:33<05:23, 1.84it/s]
71%|βββββββ | 1438/2030 [12:34<05:48, 1.70it/s]
71%|βββββββ | 1439/2030 [12:34<05:12, 1.89it/s]
71%|βββββββ | 1440/2030 [12:34<05:01, 1.96it/s]
71%|βββββββ | 1441/2030 [12:35<04:48, 2.04it/s]
71%|βββββββ | 1442/2030 [12:35<04:41, 2.09it/s]
71%|βββββββ | 1443/2030 [12:36<04:43, 2.07it/s]
71%|βββββββ | 1444/2030 [12:36<04:30, 2.16it/s]
71%|βββββββ | 1445/2030 [12:37<04:59, 1.95it/s]
71%|βββββββ | 1446/2030 [12:37<04:51, 2.00it/s]
71%|ββββββββ | 1447/2030 [12:38<05:21, 1.81it/s]
71%|ββββββββ | 1448/2030 [12:38<04:46, 2.03it/s]
71%|ββββββββ | 1449/2030 [12:39<04:53, 1.98it/s]
71%|ββββββββ | 1450/2030 [12:39<04:34, 2.11it/s]
71%|ββββββββ | 1451/2030 [12:40<04:13, 2.28it/s]
72%|ββββββββ | 1452/2030 [12:40<04:30, 2.14it/s]
72%|ββββββββ | 1453/2030 [12:41<04:35, 2.10it/s]
72%|ββββββββ | 1454/2030 [12:42<05:37, 1.71it/s]
72%|ββββββββ | 1455/2030 [12:42<05:10, 1.85it/s]
72%|ββββββββ | 1456/2030 [12:42<04:45, 2.01it/s]
72%|ββββββββ | 1457/2030 [12:43<04:34, 2.09it/s]
72%|ββββββββ | 1458/2030 [12:43<04:38, 2.05it/s]
72%|ββββββββ | 1459/2030 [12:44<04:42, 2.02it/s]
72%|ββββββββ | 1460/2030 [12:44<04:48, 1.97it/s]
72%|ββββββββ | 1461/2030 [12:45<04:44, 2.00it/s]
72%|ββββββββ | 1462/2030 [12:45<04:29, 2.11it/s]
72%|ββββββββ | 1463/2030 [12:46<04:14, 2.23it/s]
72%|ββββββββ | 1464/2030 [12:46<04:17, 2.20it/s]
72%|ββββββββ | 1465/2030 [12:47<04:51, 1.94it/s]
72%|ββββββββ | 1466/2030 [12:47<04:56, 1.90it/s]
72%|ββββββββ | 1467/2030 [12:48<04:42, 2.00it/s]
72%|ββββββββ | 1468/2030 [12:48<04:35, 2.04it/s]
72%|ββββββββ | 1469/2030 [12:49<04:22, 2.14it/s]
72%|ββββββββ | 1470/2030 [12:49<04:02, 2.31it/s]
72%|ββββββββ | 1471/2030 [12:49<04:06, 2.27it/s]
73%|ββββββββ | 1472/2030 [12:50<03:49, 2.43it/s]
73%|ββββββββ | 1473/2030 [12:50<04:22, 2.12it/s]
73%|ββββββββ | 1474/2030 [12:51<04:24, 2.11it/s]
73%|ββββββββ | 1475/2030 [12:51<04:24, 2.10it/s]
73%|ββββββββ | 1476/2030 [12:52<04:14, 2.18it/s]
73%|ββββββββ | 1477/2030 [12:52<03:51, 2.39it/s]
73%|ββββββββ | 1478/2030 [12:53<04:06, 2.24it/s]
73%|ββββββββ | 1479/2030 [12:53<04:10, 2.20it/s]
73%|ββββββββ | 1480/2030 [12:54<04:35, 1.99it/s]
73%|ββββββββ | 1481/2030 [12:54<04:49, 1.90it/s]
73%|ββββββββ | 1482/2030 [12:55<04:30, 2.03it/s]
73%|ββββββββ | 1483/2030 [12:55<04:36, 1.98it/s]
73%|ββββββββ | 1484/2030 [12:56<04:37, 1.97it/s]
73%|ββββββββ | 1485/2030 [12:56<04:58, 1.82it/s]
73%|ββββββββ | 1486/2030 [12:57<04:28, 2.03it/s]
73%|ββββββββ | 1487/2030 [12:57<04:21, 2.07it/s]
73%|ββββββββ | 1488/2030 [12:58<05:11, 1.74it/s]
73%|ββββββββ | 1489/2030 [12:58<04:53, 1.84it/s]
73%|ββββββββ | 1490/2030 [12:59<04:25, 2.03it/s]
73%|ββββββββ | 1491/2030 [12:59<04:09, 2.16it/s]
73%|ββββββββ | 1492/2030 [13:00<04:18, 2.08it/s]
74%|ββββββββ | 1493/2030 [13:00<04:04, 2.19it/s]
74%|ββββββββ | 1494/2030 [13:01<03:57, 2.26it/s]
74%|ββββββββ | 1495/2030 [13:01<04:05, 2.18it/s]
74%|ββββββββ | 1496/2030 [13:02<04:14, 2.09it/s]
74%|ββββββββ | 1497/2030 [13:02<03:59, 2.22it/s]
74%|ββββββββ | 1498/2030 [13:02<03:55, 2.26it/s]
74%|ββββββββ | 1499/2030 [13:03<03:46, 2.35it/s]
74%|ββββββββ | 1500/2030 [13:03<03:47, 2.33it/s]
74%|ββββββββ | 1500/2030 [13:03<03:47, 2.33it/s]
74%|ββββββββ | 1501/2030 [13:04<03:41, 2.39it/s]
74%|ββββββββ | 1502/2030 [13:04<04:17, 2.05it/s]
74%|ββββββββ | 1503/2030 [13:05<04:08, 2.12it/s]
74%|ββββββββ | 1504/2030 [13:05<03:46, 2.32it/s]
74%|ββββββββ | 1505/2030 [13:05<03:37, 2.41it/s]
74%|ββββββββ | 1506/2030 [13:06<03:40, 2.38it/s]
74%|ββββββββ | 1507/2030 [13:06<03:42, 2.35it/s]
74%|ββββββββ | 1508/2030 [13:07<03:45, 2.32it/s]
74%|ββββββββ | 1509/2030 [13:07<04:28, 1.94it/s]
74%|ββββββββ | 1510/2030 [13:08<04:13, 2.05it/s]
74%|ββββββββ | 1511/2030 [13:08<03:49, 2.26it/s]
74%|ββββββββ | 1512/2030 [13:09<04:02, 2.14it/s]
75%|ββββββββ | 1513/2030 [13:09<04:03, 2.13it/s]
75%|ββββββββ | 1514/2030 [13:10<04:08, 2.08it/s]
75%|ββββββββ | 1515/2030 [13:10<04:03, 2.12it/s]
75%|ββββββββ | 1516/2030 [13:11<03:47, 2.26it/s]
75%|ββββββββ | 1517/2030 [13:11<03:45, 2.27it/s]
75%|ββββββββ | 1518/2030 [13:11<03:26, 2.48it/s]
75%|ββββββββ | 1519/2030 [13:12<03:32, 2.41it/s]
75%|ββββββββ | 1520/2030 [13:12<04:09, 2.04it/s]
75%|ββββββββ | 1521/2030 [13:13<03:46, 2.24it/s]
75%|ββββββββ | 1522/2030 [13:13<03:45, 2.26it/s]
75%|ββββββββ | 1523/2030 [13:14<03:45, 2.24it/s]
75%|ββββββββ | 1524/2030 [13:14<03:48, 2.22it/s]
75%|ββββββββ | 1525/2030 [13:14<03:42, 2.27it/s]
75%|ββββββββ | 1526/2030 [13:15<03:43, 2.26it/s]
75%|ββββββββ | 1527/2030 [13:15<03:37, 2.31it/s]
75%|ββββββββ | 1528/2030 [13:16<03:37, 2.31it/s]
75%|ββββββββ | 1529/2030 [13:16<04:01, 2.07it/s]
75%|ββββββββ | 1530/2030 [13:17<03:54, 2.14it/s]
75%|ββββββββ | 1531/2030 [13:18<04:26, 1.87it/s]
75%|ββββββββ | 1532/2030 [13:18<04:14, 1.95it/s]
76%|ββββββββ | 1533/2030 [13:19<04:21, 1.90it/s]
76%|ββββββββ | 1534/2030 [13:19<04:02, 2.05it/s]
76%|ββββββββ | 1535/2030 [13:19<03:39, 2.25it/s]
76%|ββββββββ | 1536/2030 [13:20<03:28, 2.37it/s]
76%|ββββββββ | 1537/2030 [13:20<03:40, 2.24it/s]
76%|ββββββββ | 1538/2030 [13:21<03:29, 2.35it/s]
76%|ββββββββ | 1539/2030 [13:21<03:12, 2.55it/s]
76%|ββββββββ | 1540/2030 [13:22<03:57, 2.06it/s]
76%|ββββββββ | 1541/2030 [13:22<03:32, 2.30it/s]
76%|ββββββββ | 1542/2030 [13:22<03:19, 2.45it/s]
76%|ββββββββ | 1543/2030 [13:23<03:14, 2.50it/s]
76%|ββββββββ | 1544/2030 [13:23<03:14, 2.51it/s]
76%|ββββββββ | 1545/2030 [13:23<03:27, 2.34it/s]
76%|ββββββββ | 1546/2030 [13:24<03:37, 2.22it/s]
76%|ββββββββ | 1547/2030 [13:25<04:18, 1.87it/s]
76%|ββββββββ | 1548/2030 [13:25<04:12, 1.91it/s]
76%|ββββββββ | 1549/2030 [13:26<03:58, 2.02it/s]
76%|ββββββββ | 1550/2030 [13:26<03:39, 2.18it/s]
76%|ββββββββ | 1551/2030 [13:26<03:38, 2.19it/s]
76%|ββββββββ | 1552/2030 [13:27<03:28, 2.30it/s]
77%|ββββββββ | 1553/2030 [13:27<03:18, 2.41it/s]
77%|ββββββββ | 1554/2030 [13:28<03:10, 2.49it/s]
77%|ββββββββ | 1555/2030 [13:28<02:59, 2.65it/s]
77%|ββββββββ | 1556/2030 [13:28<03:02, 2.60it/s]
77%|ββββββββ | 1557/2030 [13:29<03:10, 2.49it/s]
77%|ββββββββ | 1558/2030 [13:29<03:07, 2.51it/s]
77%|ββββββββ | 1559/2030 [13:30<03:20, 2.34it/s]
77%|ββββββββ | 1560/2030 [13:30<03:24, 2.30it/s]
77%|ββββββββ | 1561/2030 [13:31<03:22, 2.32it/s]
77%|ββββββββ | 1562/2030 [13:31<03:24, 2.28it/s]
77%|ββββββββ | 1563/2030 [13:31<03:21, 2.32it/s]
77%|ββββββββ | 1564/2030 [13:32<04:00, 1.94it/s]
77%|ββββββββ | 1565/2030 [13:33<04:04, 1.90it/s]
77%|ββββββββ | 1566/2030 [13:33<04:39, 1.66it/s]
77%|ββββββββ | 1567/2030 [13:34<04:22, 1.76it/s]
77%|ββββββββ | 1568/2030 [13:34<04:03, 1.89it/s]
77%|ββββββββ | 1569/2030 [13:35<04:35, 1.68it/s]
77%|ββββββββ | 1570/2030 [13:36<04:37, 1.65it/s]
77%|ββββββββ | 1571/2030 [13:36<04:13, 1.81it/s]
77%|ββββββββ | 1572/2030 [13:37<03:53, 1.96it/s]
77%|ββββββββ | 1573/2030 [13:37<03:38, 2.09it/s]
78%|ββββββββ | 1574/2030 [13:37<03:34, 2.12it/s]
78%|ββββββββ | 1575/2030 [13:38<03:23, 2.24it/s]
78%|ββββββββ | 1576/2030 [13:38<03:23, 2.23it/s]
78%|ββββββββ | 1577/2030 [13:39<03:20, 2.26it/s]
78%|ββββββββ | 1578/2030 [13:39<03:10, 2.37it/s]
78%|ββββββββ | 1579/2030 [13:39<03:09, 2.38it/s]
78%|ββββββββ | 1580/2030 [13:40<03:21, 2.24it/s]
78%|ββββββββ | 1581/2030 [13:41<03:35, 2.08it/s]
78%|ββββββββ | 1582/2030 [13:41<03:24, 2.19it/s]
78%|ββββββββ | 1583/2030 [13:41<03:20, 2.23it/s]
78%|ββββββββ | 1584/2030 [13:42<03:16, 2.27it/s]
78%|ββββββββ | 1585/2030 [13:42<03:11, 2.32it/s]
78%|ββββββββ | 1586/2030 [13:43<03:05, 2.39it/s]
78%|ββββββββ | 1587/2030 [13:43<03:02, 2.42it/s]
78%|ββββββββ | 1588/2030 [13:44<03:20, 2.20it/s]
78%|ββββββββ | 1589/2030 [13:44<03:49, 1.92it/s]
78%|ββββββββ | 1590/2030 [13:45<03:27, 2.12it/s]
78%|ββββββββ | 1591/2030 [13:45<03:27, 2.12it/s]
78%|ββββββββ | 1592/2030 [13:46<03:24, 2.14it/s]
78%|ββββββββ | 1593/2030 [13:46<03:22, 2.16it/s]
79%|ββββββββ | 1594/2030 [13:47<03:32, 2.05it/s]
79%|ββββββββ | 1595/2030 [13:47<03:25, 2.12it/s]
79%|ββββββββ | 1596/2030 [13:47<03:08, 2.30it/s]
79%|ββββββββ | 1597/2030 [13:48<03:02, 2.38it/s]
79%|ββββββββ | 1598/2030 [13:48<03:39, 1.97it/s]
79%|ββββββββ | 1599/2030 [13:49<03:39, 1.97it/s]
79%|ββββββββ | 1600/2030 [13:49<03:22, 2.12it/s]
79%|ββββββββ | 1601/2030 [13:50<03:11, 2.24it/s]
79%|ββββββββ | 1602/2030 [13:50<03:34, 1.99it/s]
79%|ββββββββ | 1603/2030 [13:51<03:25, 2.08it/s]
79%|ββββββββ | 1604/2030 [13:51<03:21, 2.11it/s]
79%|ββββββββ | 1605/2030 [13:52<03:13, 2.19it/s]
79%|ββββββββ | 1606/2030 [13:52<03:10, 2.22it/s]
79%|ββββββββ | 1607/2030 [13:53<03:12, 2.19it/s]
79%|ββββββββ | 1608/2030 [13:53<03:13, 2.18it/s]
79%|ββββββββ | 1609/2030 [13:53<03:07, 2.24it/s]
79%|ββββββββ | 1610/2030 [13:54<02:55, 2.40it/s]
79%|ββββββββ | 1611/2030 [13:54<03:18, 2.11it/s]
79%|ββββββββ | 1612/2030 [13:55<03:10, 2.19it/s]
79%|ββββββββ | 1613/2030 [13:55<03:14, 2.14it/s]
80%|ββββββββ | 1614/2030 [13:56<03:06, 2.23it/s]
80%|ββββββββ | 1615/2030 [13:56<03:07, 2.22it/s]
80%|ββββββββ | 1616/2030 [13:57<03:12, 2.15it/s]
80%|ββββββββ | 1617/2030 [13:57<03:03, 2.25it/s]
80%|ββββββββ | 1618/2030 [13:58<03:13, 2.13it/s]
80%|ββββββββ | 1619/2030 [13:58<03:03, 2.24it/s]
80%|ββββββββ | 1620/2030 [13:58<03:03, 2.24it/s]
80%|ββββββββ | 1621/2030 [13:59<03:07, 2.18it/s]
80%|ββββββββ | 1622/2030 [13:59<03:12, 2.12it/s]
80%|ββββββββ | 1623/2030 [14:00<02:55, 2.33it/s]
80%|ββββββββ | 1624/2030 [14:00<02:50, 2.39it/s]
80%|ββββββββ | 1625/2030 [14:01<03:07, 2.17it/s]
80%|ββββββββ | 1626/2030 [14:01<03:19, 2.02it/s]
80%|ββββββββ | 1627/2030 [14:02<04:19, 1.55it/s]
80%|ββββββββ | 1628/2030 [14:03<03:49, 1.75it/s][INFO|trainer.py:811] 2024-09-09 12:08:15,914 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 12:08:15,916 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 12:08:15,916 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 12:08:15,916 >> Batch size = 8 |
|
{'eval_loss': 0.2829184830188751, 'eval_precision': 0.6528724440116845, 'eval_recall': 0.7339901477832512, 'eval_f1': 0.6910590054109765, 'eval_accuracy': 0.9469986204241394, 'eval_runtime': 5.8572, 'eval_samples_per_second': 430.069, 'eval_steps_per_second': 53.78, 'epoch': 7.0} |
|
{'loss': 0.0081, 'grad_norm': 0.2855200171470642, 'learning_rate': 1.3054187192118228e-05, 'epoch': 7.37} |
|
|
|
0%| | 0/315 [00:00<?, ?it/s][A |
|
3%|β | 8/315 [00:00<00:03, 78.95it/s][A |
|
5%|β | 16/315 [00:00<00:03, 76.05it/s][A |
|
8%|β | 24/315 [00:00<00:03, 77.36it/s][A |
|
10%|β | 32/315 [00:00<00:03, 72.86it/s][A |
|
13%|ββ | 41/315 [00:00<00:03, 76.12it/s][A |
|
16%|ββ | 49/315 [00:00<00:03, 75.29it/s][A |
|
18%|ββ | 57/315 [00:00<00:03, 75.09it/s][A |
|
21%|ββ | 65/315 [00:00<00:03, 72.34it/s][A |
|
23%|βββ | 73/315 [00:00<00:03, 74.32it/s][A |
|
26%|βββ | 81/315 [00:01<00:03, 70.35it/s][A |
|
28%|βββ | 89/315 [00:01<00:03, 67.40it/s][A |
|
31%|βββ | 97/315 [00:01<00:03, 67.49it/s][A |
|
33%|ββββ | 105/315 [00:01<00:03, 68.69it/s][A |
|
36%|ββββ | 113/315 [00:01<00:02, 70.18it/s][A |
|
38%|ββββ | 121/315 [00:01<00:02, 68.86it/s][A |
|
41%|ββββ | 129/315 [00:01<00:02, 69.88it/s][A |
|
43%|βββββ | 137/315 [00:01<00:02, 69.52it/s][A |
|
46%|βββββ | 144/315 [00:02<00:02, 69.43it/s][A |
|
49%|βββββ | 153/315 [00:02<00:02, 73.73it/s][A |
|
51%|βββββ | 161/315 [00:02<00:02, 72.47it/s][A |
|
54%|ββββββ | 169/315 [00:02<00:02, 72.61it/s][A |
|
56%|ββββββ | 177/315 [00:02<00:01, 71.88it/s][A |
|
59%|ββββββ | 185/315 [00:02<00:01, 69.45it/s][A |
|
61%|ββββββ | 192/315 [00:02<00:01, 68.87it/s][A |
|
63%|βββββββ | 199/315 [00:02<00:01, 65.94it/s][A |
|
65%|βββββββ | 206/315 [00:02<00:01, 64.90it/s][A |
|
68%|βββββββ | 214/315 [00:03<00:01, 68.13it/s][A |
|
70%|βββββββ | 222/315 [00:03<00:01, 70.01it/s][A |
|
73%|ββββββββ | 231/315 [00:03<00:01, 73.17it/s][A |
|
76%|ββββββββ | 239/315 [00:03<00:01, 74.49it/s][A |
|
78%|ββββββββ | 247/315 [00:03<00:00, 70.11it/s][A |
|
81%|ββββββββ | 255/315 [00:03<00:00, 68.71it/s][A |
|
83%|βββββββββ | 263/315 [00:03<00:00, 70.38it/s][A |
|
86%|βββββββββ | 271/315 [00:03<00:00, 72.22it/s][A |
|
89%|βββββββββ | 280/315 [00:03<00:00, 75.42it/s][A |
|
91%|ββββββββββ| 288/315 [00:04<00:00, 72.63it/s][A |
|
94%|ββββββββββ| 296/315 [00:04<00:00, 71.09it/s][A |
|
97%|ββββββββββ| 304/315 [00:04<00:00, 72.18it/s][A |
|
99%|ββββββββββ| 312/315 [00:04<00:00, 72.14it/s][A
|
|
[A
80%|ββββββββ | 1628/2030 [14:09<03:49, 1.75it/s] |
|
100%|ββββββββββ| 315/315 [00:05<00:00, 72.14it/s][A |
|
[A[INFO|trainer.py:3503] 2024-09-09 12:08:21,811 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-1628 |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:08:21,812 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-1628/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:08:22,832 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-1628/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:08:22,833 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-1628/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:08:22,833 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-1628/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:08:25,863 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:08:25,864 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
80%|ββββββββ | 1629/2030 [14:13<23:29, 3.51s/it]
80%|ββββββββ | 1630/2030 [14:13<17:01, 2.55s/it]
80%|ββββββββ | 1631/2030 [14:14<12:38, 1.90s/it]
80%|ββββββββ | 1632/2030 [14:14<09:39, 1.46s/it]
80%|ββββββββ | 1633/2030 [14:15<07:35, 1.15s/it]
80%|ββββββββ | 1634/2030 [14:15<06:11, 1.07it/s]
81%|ββββββββ | 1635/2030 [14:15<05:08, 1.28it/s]
81%|ββββββββ | 1636/2030 [14:16<04:20, 1.51it/s]
81%|ββββββββ | 1637/2030 [14:16<04:17, 1.53it/s]
81%|ββββββββ | 1638/2030 [14:17<03:44, 1.74it/s]
81%|ββββββββ | 1639/2030 [14:17<03:43, 1.75it/s]
81%|ββββββββ | 1640/2030 [14:18<03:42, 1.75it/s]
81%|ββββββββ | 1641/2030 [14:18<03:17, 1.97it/s]
81%|ββββββββ | 1642/2030 [14:19<03:02, 2.13it/s]
81%|ββββββββ | 1643/2030 [14:19<03:04, 2.09it/s]
81%|ββββββββ | 1644/2030 [14:20<03:13, 1.99it/s]
81%|ββββββββ | 1645/2030 [14:20<03:04, 2.09it/s]
81%|ββββββββ | 1646/2030 [14:21<02:51, 2.24it/s]
81%|ββββββββ | 1647/2030 [14:21<03:02, 2.10it/s]
81%|ββββββββ | 1648/2030 [14:21<02:50, 2.24it/s]
81%|ββββββββ | 1649/2030 [14:22<03:30, 1.81it/s]
81%|βββββββββ | 1650/2030 [14:23<03:16, 1.93it/s]
81%|βββββββββ | 1651/2030 [14:23<03:12, 1.97it/s]
81%|βββββββββ | 1652/2030 [14:24<02:58, 2.11it/s]
81%|βββββββββ | 1653/2030 [14:24<02:48, 2.24it/s]
81%|βββββββββ | 1654/2030 [14:24<02:47, 2.25it/s]
82%|βββββββββ | 1655/2030 [14:25<03:01, 2.06it/s]
82%|βββββββββ | 1656/2030 [14:25<02:45, 2.26it/s]
82%|βββββββββ | 1657/2030 [14:26<02:38, 2.36it/s]
82%|βββββββββ | 1658/2030 [14:26<02:35, 2.39it/s]
82%|βββββββββ | 1659/2030 [14:27<02:33, 2.42it/s]
82%|βββββββββ | 1660/2030 [14:27<02:24, 2.56it/s]
82%|βββββββββ | 1661/2030 [14:27<02:32, 2.41it/s]
82%|βββββββββ | 1662/2030 [14:28<02:43, 2.26it/s]
82%|βββββββββ | 1663/2030 [14:28<02:37, 2.33it/s]
82%|βββββββββ | 1664/2030 [14:29<02:26, 2.50it/s]
82%|βββββββββ | 1665/2030 [14:29<02:36, 2.34it/s]
82%|βββββββββ | 1666/2030 [14:29<02:32, 2.39it/s]
82%|βββββββββ | 1667/2030 [14:30<02:31, 2.40it/s]
82%|βββββββββ | 1668/2030 [14:30<02:23, 2.53it/s]
82%|βββββββββ | 1669/2030 [14:31<02:26, 2.46it/s]
82%|βββββββββ | 1670/2030 [14:31<02:27, 2.44it/s]
82%|βββββββββ | 1671/2030 [14:31<02:29, 2.40it/s]
82%|βββββββββ | 1672/2030 [14:32<02:30, 2.38it/s]
82%|βββββββββ | 1673/2030 [14:32<02:30, 2.37it/s]
82%|βββββββββ | 1674/2030 [14:33<02:31, 2.36it/s]
83%|βββββββββ | 1675/2030 [14:33<02:30, 2.35it/s]
83%|βββββββββ | 1676/2030 [14:34<02:35, 2.28it/s]
83%|βββββββββ | 1677/2030 [14:34<02:47, 2.10it/s]
83%|βββββββββ | 1678/2030 [14:35<02:50, 2.06it/s]
83%|βββββββββ | 1679/2030 [14:35<02:35, 2.26it/s]
83%|βββββββββ | 1680/2030 [14:36<02:37, 2.22it/s]
83%|βββββββββ | 1681/2030 [14:36<02:50, 2.05it/s]
83%|βββββββββ | 1682/2030 [14:37<02:40, 2.17it/s]
83%|βββββββββ | 1683/2030 [14:37<02:39, 2.18it/s]
83%|βββββββββ | 1684/2030 [14:37<02:30, 2.30it/s]
83%|βββββββββ | 1685/2030 [14:38<02:25, 2.38it/s]
83%|βββββββββ | 1686/2030 [14:38<02:24, 2.38it/s]
83%|βββββββββ | 1687/2030 [14:39<02:32, 2.25it/s]
83%|βββββββββ | 1688/2030 [14:39<02:26, 2.33it/s]
83%|βββββββββ | 1689/2030 [14:40<02:32, 2.23it/s]
83%|βββββββββ | 1690/2030 [14:40<02:44, 2.07it/s]
83%|βββββββββ | 1691/2030 [14:41<02:36, 2.16it/s]
83%|βββββββββ | 1692/2030 [14:41<02:33, 2.20it/s]
83%|βββββββββ | 1693/2030 [14:41<02:38, 2.13it/s]
83%|βββββββββ | 1694/2030 [14:42<02:25, 2.32it/s]
83%|βββββββββ | 1695/2030 [14:42<02:11, 2.55it/s]
84%|βββββββββ | 1696/2030 [14:43<02:31, 2.20it/s]
84%|βββββββββ | 1697/2030 [14:43<02:22, 2.34it/s]
84%|βββββββββ | 1698/2030 [14:43<02:14, 2.47it/s]
84%|βββββββββ | 1699/2030 [14:44<02:33, 2.15it/s]
84%|βββββββββ | 1700/2030 [14:44<02:30, 2.20it/s]
84%|βββββββββ | 1701/2030 [14:45<02:29, 2.20it/s]
84%|βββββββββ | 1702/2030 [14:45<02:26, 2.24it/s]
84%|βββββββββ | 1703/2030 [14:46<02:28, 2.20it/s]
84%|βββββββββ | 1704/2030 [14:47<02:57, 1.83it/s]
84%|βββββββββ | 1705/2030 [14:47<02:53, 1.87it/s]
84%|βββββββββ | 1706/2030 [14:48<02:52, 1.88it/s]
84%|βββββββββ | 1707/2030 [14:48<02:46, 1.94it/s]
84%|βββββββββ | 1708/2030 [14:49<02:35, 2.07it/s]
84%|βββββββββ | 1709/2030 [14:49<02:26, 2.19it/s]
84%|βββββββββ | 1710/2030 [14:50<02:44, 1.95it/s]
84%|βββββββββ | 1711/2030 [14:50<02:36, 2.04it/s]
84%|βββββββββ | 1712/2030 [14:50<02:34, 2.05it/s]
84%|βββββββββ | 1713/2030 [14:51<02:46, 1.90it/s]
84%|βββββββββ | 1714/2030 [14:51<02:33, 2.06it/s]
84%|βββββββββ | 1715/2030 [14:52<02:30, 2.09it/s]
85%|βββββββββ | 1716/2030 [14:52<02:18, 2.27it/s]
85%|βββββββββ | 1717/2030 [14:53<02:34, 2.02it/s]
85%|βββββββββ | 1718/2030 [14:53<02:36, 2.00it/s]
85%|βββββββββ | 1719/2030 [14:54<02:30, 2.07it/s]
85%|βββββββββ | 1720/2030 [14:54<02:20, 2.21it/s]
85%|βββββββββ | 1721/2030 [14:55<02:31, 2.04it/s]
85%|βββββββββ | 1722/2030 [14:55<02:24, 2.14it/s]
85%|βββββββββ | 1723/2030 [14:56<02:16, 2.24it/s]
85%|βββββββββ | 1724/2030 [14:56<02:25, 2.11it/s]
85%|βββββββββ | 1725/2030 [14:57<02:33, 1.99it/s]
85%|βββββββββ | 1726/2030 [14:57<02:34, 1.97it/s]
85%|βββββββββ | 1727/2030 [14:58<03:02, 1.66it/s]
85%|βββββββββ | 1728/2030 [14:59<02:55, 1.72it/s]
85%|βββββββββ | 1729/2030 [14:59<02:52, 1.74it/s]
85%|βββββββββ | 1730/2030 [15:00<02:48, 1.78it/s]
85%|βββββββββ | 1731/2030 [15:00<02:40, 1.86it/s]
85%|βββββββββ | 1732/2030 [15:01<02:25, 2.05it/s]
85%|βββββββββ | 1733/2030 [15:01<02:20, 2.11it/s]
85%|βββββββββ | 1734/2030 [15:01<02:19, 2.11it/s]
85%|βββββββββ | 1735/2030 [15:02<02:15, 2.18it/s]
86%|βββββββββ | 1736/2030 [15:02<02:15, 2.16it/s]
86%|βββββββββ | 1737/2030 [15:03<03:09, 1.55it/s]
86%|βββββββββ | 1738/2030 [15:04<03:03, 1.59it/s]
86%|βββββββββ | 1739/2030 [15:05<03:16, 1.48it/s]
86%|βββββββββ | 1740/2030 [15:05<02:56, 1.64it/s]
86%|βββββββββ | 1741/2030 [15:06<02:37, 1.84it/s]
86%|βββββββββ | 1742/2030 [15:06<02:34, 1.86it/s]
86%|βββββββββ | 1743/2030 [15:07<02:17, 2.08it/s]
86%|βββββββββ | 1744/2030 [15:07<02:23, 1.99it/s]
86%|βββββββββ | 1745/2030 [15:08<02:16, 2.09it/s]
86%|βββββββββ | 1746/2030 [15:08<02:05, 2.27it/s]
86%|βββββββββ | 1747/2030 [15:08<02:03, 2.30it/s]
86%|βββββββββ | 1748/2030 [15:09<02:15, 2.08it/s]
86%|βββββββββ | 1749/2030 [15:09<02:13, 2.11it/s]
86%|βββββββββ | 1750/2030 [15:10<02:11, 2.13it/s]
86%|βββββββββ | 1751/2030 [15:11<02:34, 1.80it/s]
86%|βββββββββ | 1752/2030 [15:11<02:20, 1.98it/s]
86%|βββββββββ | 1753/2030 [15:12<02:36, 1.77it/s]
86%|βββββββββ | 1754/2030 [15:12<02:26, 1.89it/s]
86%|βββββββββ | 1755/2030 [15:12<02:14, 2.04it/s]
87%|βββββββββ | 1756/2030 [15:13<02:02, 2.23it/s]
87%|βββββββββ | 1757/2030 [15:13<01:52, 2.42it/s]
87%|βββββββββ | 1758/2030 [15:14<02:16, 1.99it/s]
87%|βββββββββ | 1759/2030 [15:14<02:07, 2.13it/s]
87%|βββββββββ | 1760/2030 [15:15<02:03, 2.18it/s]
87%|βββββββββ | 1761/2030 [15:15<02:17, 1.96it/s]
87%|βββββββββ | 1762/2030 [15:16<02:09, 2.07it/s]
87%|βββββββββ | 1763/2030 [15:16<02:01, 2.20it/s]
87%|βββββββββ | 1764/2030 [15:17<01:57, 2.26it/s]
87%|βββββββββ | 1765/2030 [15:17<01:57, 2.25it/s]
87%|βββββββββ | 1766/2030 [15:17<01:54, 2.30it/s]
87%|βββββββββ | 1767/2030 [15:18<02:00, 2.18it/s]
87%|βββββββββ | 1768/2030 [15:18<01:52, 2.33it/s]
87%|βββββββββ | 1769/2030 [15:19<01:58, 2.21it/s]
87%|βββββββββ | 1770/2030 [15:19<01:55, 2.25it/s]
87%|βββββββββ | 1771/2030 [15:20<02:11, 1.97it/s]
87%|βββββββββ | 1772/2030 [15:20<02:00, 2.13it/s]
87%|βββββββββ | 1773/2030 [15:21<02:00, 2.14it/s]
87%|βββββββββ | 1774/2030 [15:21<01:52, 2.28it/s]
87%|βββββββββ | 1775/2030 [15:22<01:50, 2.30it/s]
87%|βββββββββ | 1776/2030 [15:22<01:55, 2.20it/s]
88%|βββββββββ | 1777/2030 [15:22<01:47, 2.35it/s]
88%|βββββββββ | 1778/2030 [15:23<01:55, 2.19it/s]
88%|βββββββββ | 1779/2030 [15:24<02:06, 1.98it/s]
88%|βββββββββ | 1780/2030 [15:24<02:00, 2.08it/s]
88%|βββββββββ | 1781/2030 [15:24<01:53, 2.20it/s]
88%|βββββββββ | 1782/2030 [15:25<01:52, 2.20it/s]
88%|βββββββββ | 1783/2030 [15:25<01:53, 2.18it/s]
88%|βββββββββ | 1784/2030 [15:26<01:47, 2.29it/s]
88%|βββββββββ | 1785/2030 [15:26<01:45, 2.33it/s]
88%|βββββββββ | 1786/2030 [15:27<01:48, 2.24it/s]
88%|βββββββββ | 1787/2030 [15:27<01:49, 2.23it/s]
88%|βββββββββ | 1788/2030 [15:28<02:13, 1.81it/s]
88%|βββββββββ | 1789/2030 [15:28<02:07, 1.89it/s]
88%|βββββββββ | 1790/2030 [15:29<01:59, 2.02it/s]
88%|βββββββββ | 1791/2030 [15:29<01:53, 2.11it/s]
88%|βββββββββ | 1792/2030 [15:30<01:58, 2.01it/s]
88%|βββββββββ | 1793/2030 [15:30<01:55, 2.05it/s]
88%|βββββββββ | 1794/2030 [15:31<01:47, 2.19it/s]
88%|βββββββββ | 1795/2030 [15:31<01:42, 2.28it/s]
88%|βββββββββ | 1796/2030 [15:31<01:47, 2.17it/s]
89%|βββββββββ | 1797/2030 [15:32<01:44, 2.24it/s]
89%|βββββββββ | 1798/2030 [15:32<01:42, 2.26it/s]
89%|βββββββββ | 1799/2030 [15:33<01:35, 2.42it/s]
89%|βββββββββ | 1800/2030 [15:33<01:31, 2.50it/s]
89%|βββββββββ | 1801/2030 [15:34<01:41, 2.25it/s]
89%|βββββββββ | 1802/2030 [15:34<01:38, 2.31it/s]
89%|βββββββββ | 1803/2030 [15:34<01:37, 2.34it/s]
89%|βββββββββ | 1804/2030 [15:35<01:41, 2.23it/s]
89%|βββββββββ | 1805/2030 [15:35<01:52, 2.01it/s]
89%|βββββββββ | 1806/2030 [15:36<01:50, 2.02it/s]
89%|βββββββββ | 1807/2030 [15:36<01:44, 2.12it/s]
89%|βββββββββ | 1808/2030 [15:37<01:38, 2.26it/s]
89%|βββββββββ | 1809/2030 [15:37<01:34, 2.35it/s]
89%|βββββββββ | 1810/2030 [15:38<01:35, 2.30it/s]
89%|βββββββββ | 1811/2030 [15:38<01:34, 2.33it/s]
89%|βββββββββ | 1812/2030 [15:39<01:49, 1.99it/s]
89%|βββββββββ | 1813/2030 [15:39<01:53, 1.92it/s]
89%|βββββββββ | 1814/2030 [15:40<01:41, 2.13it/s]
89%|βββββββββ | 1815/2030 [15:40<01:36, 2.23it/s]
89%|βββββββββ | 1816/2030 [15:40<01:30, 2.35it/s]
90%|βββββββββ | 1817/2030 [15:41<01:28, 2.40it/s]
90%|βββββββββ | 1818/2030 [15:41<01:30, 2.34it/s]
90%|βββββββββ | 1819/2030 [15:42<01:34, 2.23it/s]
90%|βββββββββ | 1820/2030 [15:42<01:41, 2.07it/s]
90%|βββββββββ | 1821/2030 [15:43<01:36, 2.16it/s]
90%|βββββββββ | 1822/2030 [15:43<01:34, 2.20it/s]
90%|βββββββββ | 1823/2030 [15:44<01:35, 2.17it/s]
90%|βββββββββ | 1824/2030 [15:44<01:35, 2.15it/s]
90%|βββββββββ | 1825/2030 [15:44<01:33, 2.20it/s]
90%|βββββββββ | 1826/2030 [15:45<01:34, 2.15it/s]
90%|βββββββββ | 1827/2030 [15:46<01:59, 1.71it/s]
90%|βββββββββ | 1828/2030 [15:46<01:48, 1.86it/s]
90%|βββββββββ | 1829/2030 [15:47<01:40, 2.00it/s]
90%|βββββββββ | 1830/2030 [15:47<01:35, 2.10it/s]
90%|βββββββββ | 1831/2030 [15:48<01:35, 2.08it/s][INFO|trainer.py:811] 2024-09-09 12:10:01,062 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 12:10:01,064 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 12:10:01,064 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 12:10:01,064 >> Batch size = 8 |
|
{'eval_loss': 0.29823970794677734, 'eval_precision': 0.6710997442455243, 'eval_recall': 0.7181171319102354, 'eval_f1': 0.6938127974616606, 'eval_accuracy': 0.9494048573903558, 'eval_runtime': 5.8929, 'eval_samples_per_second': 427.463, 'eval_steps_per_second': 53.454, 'epoch': 8.0} |
|
|
|
0%| | 0/315 [00:00<?, ?it/s][A |
|
3%|β | 8/315 [00:00<00:04, 75.73it/s][A |
|
5%|β | 16/315 [00:00<00:04, 74.72it/s][A |
|
8%|β | 24/315 [00:00<00:03, 76.94it/s][A |
|
10%|β | 32/315 [00:00<00:03, 72.33it/s][A |
|
13%|ββ | 41/315 [00:00<00:03, 76.51it/s][A |
|
16%|ββ | 49/315 [00:00<00:03, 75.25it/s][A |
|
18%|ββ | 57/315 [00:00<00:03, 75.56it/s][A |
|
21%|ββ | 65/315 [00:00<00:03, 72.89it/s][A |
|
23%|βββ | 74/315 [00:00<00:03, 75.37it/s][A |
|
26%|βββ | 82/315 [00:01<00:03, 70.53it/s][A |
|
29%|βββ | 90/315 [00:01<00:03, 67.89it/s][A |
|
31%|βββ | 97/315 [00:01<00:03, 67.18it/s][A |
|
33%|ββββ | 105/315 [00:01<00:03, 69.00it/s][A |
|
36%|ββββ | 113/315 [00:01<00:02, 70.22it/s][A |
|
38%|ββββ | 121/315 [00:01<00:02, 68.84it/s][A |
|
41%|ββββ | 129/315 [00:01<00:02, 70.13it/s][A |
|
43%|βββββ | 137/315 [00:01<00:02, 69.16it/s][A |
|
46%|βββββ | 144/315 [00:02<00:02, 68.53it/s][A |
|
49%|βββββ | 153/315 [00:02<00:02, 72.94it/s][A |
|
51%|βββββ | 161/315 [00:02<00:02, 71.92it/s][A |
|
54%|ββββββ | 169/315 [00:02<00:02, 71.74it/s][A |
|
56%|ββββββ | 177/315 [00:02<00:01, 71.07it/s][A |
|
59%|ββββββ | 185/315 [00:02<00:01, 69.18it/s][A |
|
61%|ββββββ | 192/315 [00:02<00:01, 68.97it/s][A |
|
63%|βββββββ | 199/315 [00:02<00:01, 65.96it/s][A |
|
65%|βββββββ | 206/315 [00:02<00:01, 64.41it/s][A |
|
68%|βββββββ | 214/315 [00:03<00:01, 68.01it/s][A |
|
70%|βββββββ | 222/315 [00:03<00:01, 70.24it/s][A |
|
73%|ββββββββ | 231/315 [00:03<00:01, 73.30it/s][A |
|
76%|ββββββββ | 239/315 [00:03<00:01, 74.13it/s][A |
|
78%|ββββββββ | 247/315 [00:03<00:00, 69.67it/s][A |
|
81%|ββββββββ | 255/315 [00:03<00:00, 68.59it/s][A |
|
83%|βββββββββ | 263/315 [00:03<00:00, 70.33it/s][A |
|
86%|βββββββββ | 271/315 [00:03<00:00, 71.94it/s][A |
|
89%|βββββββββ | 280/315 [00:03<00:00, 75.09it/s][A |
|
91%|ββββββββββ| 288/315 [00:04<00:00, 72.29it/s][A |
|
94%|ββββββββββ| 296/315 [00:04<00:00, 70.81it/s][A |
|
97%|ββββββββββ| 304/315 [00:04<00:00, 72.11it/s][A |
|
99%|ββββββββββ| 312/315 [00:04<00:00, 72.06it/s][A
|
|
[A
90%|βββββββββ | 1831/2030 [15:54<01:35, 2.08it/s] |
|
100%|ββββββββββ| 315/315 [00:05<00:00, 72.06it/s][A |
|
[A[INFO|trainer.py:3503] 2024-09-09 12:10:06,932 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-1831 |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:10:06,933 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-1831/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:10:07,950 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-1831/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:10:07,951 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-1831/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:10:07,952 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-1831/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:10:10,965 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:10:10,966 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
90%|βββββββββ | 1832/2030 [15:58<11:20, 3.44s/it]
90%|βββββββββ | 1833/2030 [15:58<08:13, 2.50s/it]
90%|βββββββββ | 1834/2030 [15:59<06:04, 1.86s/it]
90%|βββββββββ | 1835/2030 [15:59<04:38, 1.43s/it]
90%|βββββββββ | 1836/2030 [15:59<03:38, 1.13s/it]
90%|βββββββββ | 1837/2030 [16:00<03:08, 1.02it/s]
91%|βββββββββ | 1838/2030 [16:01<02:37, 1.22it/s]
91%|βββββββββ | 1839/2030 [16:01<02:35, 1.23it/s]
91%|βββββββββ | 1840/2030 [16:02<02:33, 1.24it/s]
91%|βββββββββ | 1841/2030 [16:03<02:19, 1.35it/s]
91%|βββββββββ | 1842/2030 [16:03<02:03, 1.52it/s]
91%|βββββββββ | 1843/2030 [16:04<01:51, 1.68it/s]
91%|βββββββββ | 1844/2030 [16:04<01:41, 1.83it/s]
91%|βββββββββ | 1845/2030 [16:04<01:29, 2.06it/s]
91%|βββββββββ | 1846/2030 [16:05<01:23, 2.20it/s]
91%|βββββββββ | 1847/2030 [16:05<01:24, 2.17it/s]
91%|βββββββββ | 1848/2030 [16:06<01:28, 2.06it/s]
91%|βββββββββ | 1849/2030 [16:07<01:57, 1.54it/s]
91%|βββββββββ | 1850/2030 [16:07<01:49, 1.65it/s]
91%|βββββββββ | 1851/2030 [16:08<01:42, 1.74it/s]
91%|βββββββββ | 1852/2030 [16:08<01:33, 1.90it/s]
91%|ββββββββββ| 1853/2030 [16:09<01:34, 1.87it/s]
91%|ββββββββββ| 1854/2030 [16:09<01:26, 2.03it/s]
91%|ββββββββββ| 1855/2030 [16:10<01:24, 2.08it/s]
91%|ββββββββββ| 1856/2030 [16:10<01:17, 2.23it/s]
91%|ββββββββββ| 1857/2030 [16:10<01:13, 2.37it/s]
92%|ββββββββββ| 1858/2030 [16:11<01:14, 2.32it/s]
92%|ββββββββββ| 1859/2030 [16:11<01:11, 2.40it/s]
92%|ββββββββββ| 1860/2030 [16:12<01:10, 2.39it/s]
92%|ββββββββββ| 1861/2030 [16:12<01:07, 2.51it/s]
92%|ββββββββββ| 1862/2030 [16:13<01:11, 2.34it/s]
92%|ββββββββββ| 1863/2030 [16:13<01:10, 2.36it/s]
92%|ββββββββββ| 1864/2030 [16:13<01:08, 2.43it/s]
92%|ββββββββββ| 1865/2030 [16:14<01:11, 2.30it/s]
92%|ββββββββββ| 1866/2030 [16:14<01:10, 2.33it/s]
92%|ββββββββββ| 1867/2030 [16:15<01:07, 2.40it/s]
92%|ββββββββββ| 1868/2030 [16:15<01:06, 2.45it/s]
92%|ββββββββββ| 1869/2030 [16:16<01:14, 2.15it/s]
92%|ββββββββββ| 1870/2030 [16:16<01:11, 2.25it/s]
92%|ββββββββββ| 1871/2030 [16:16<01:07, 2.34it/s]
92%|ββββββββββ| 1872/2030 [16:17<01:09, 2.27it/s]
92%|ββββββββββ| 1873/2030 [16:17<01:11, 2.20it/s]
92%|ββββββββββ| 1874/2030 [16:18<01:06, 2.36it/s]
92%|ββββββββββ| 1875/2030 [16:18<01:08, 2.26it/s]
92%|ββββββββββ| 1876/2030 [16:19<01:11, 2.16it/s]
92%|ββββββββββ| 1877/2030 [16:19<01:19, 1.93it/s]
93%|ββββββββββ| 1878/2030 [16:20<01:16, 1.99it/s]
93%|ββββββββββ| 1879/2030 [16:20<01:14, 2.01it/s]
93%|ββββββββββ| 1880/2030 [16:21<01:21, 1.84it/s]
93%|ββββββββββ| 1881/2030 [16:21<01:14, 2.01it/s]
93%|ββββββββββ| 1882/2030 [16:22<01:08, 2.15it/s]
93%|ββββββββββ| 1883/2030 [16:22<01:05, 2.24it/s]
93%|ββββββββββ| 1884/2030 [16:23<01:03, 2.29it/s]
93%|ββββββββββ| 1885/2030 [16:23<01:05, 2.23it/s]
93%|ββββββββββ| 1886/2030 [16:23<01:03, 2.26it/s]
93%|ββββββββββ| 1887/2030 [16:24<01:00, 2.37it/s]
93%|ββββββββββ| 1888/2030 [16:24<00:59, 2.37it/s]
93%|ββββββββββ| 1889/2030 [16:25<00:58, 2.42it/s]
93%|ββββββββββ| 1890/2030 [16:25<01:01, 2.29it/s]
93%|ββββββββββ| 1891/2030 [16:26<01:02, 2.23it/s]
93%|ββββββββββ| 1892/2030 [16:26<01:00, 2.30it/s]
93%|ββββββββββ| 1893/2030 [16:26<00:59, 2.32it/s]
93%|ββββββββββ| 1894/2030 [16:27<00:57, 2.38it/s]
93%|ββββββββββ| 1895/2030 [16:27<00:56, 2.38it/s]
93%|ββββββββββ| 1896/2030 [16:28<00:58, 2.29it/s]
93%|ββββββββββ| 1897/2030 [16:28<00:53, 2.49it/s]
93%|ββββββββββ| 1898/2030 [16:29<00:57, 2.30it/s]
94%|ββββββββββ| 1899/2030 [16:29<01:11, 1.84it/s]
94%|ββββββββββ| 1900/2030 [16:30<01:05, 1.98it/s]
94%|ββββββββββ| 1901/2030 [16:30<00:59, 2.18it/s]
94%|ββββββββββ| 1902/2030 [16:31<01:02, 2.06it/s]
94%|ββββββββββ| 1903/2030 [16:31<01:01, 2.06it/s]
94%|ββββββββββ| 1904/2030 [16:32<01:00, 2.09it/s]
94%|ββββββββββ| 1905/2030 [16:32<00:55, 2.24it/s]
94%|ββββββββββ| 1906/2030 [16:33<01:00, 2.06it/s]
94%|ββββββββββ| 1907/2030 [16:33<00:55, 2.21it/s]
94%|ββββββββββ| 1908/2030 [16:34<01:01, 1.97it/s]
94%|ββββββββββ| 1909/2030 [16:34<00:57, 2.12it/s]
94%|ββββββββββ| 1910/2030 [16:34<00:52, 2.27it/s]
94%|ββββββββββ| 1911/2030 [16:35<00:54, 2.17it/s]
94%|ββββββββββ| 1912/2030 [16:35<00:54, 2.18it/s]
94%|ββββββββββ| 1913/2030 [16:36<00:54, 2.13it/s]
94%|ββββββββββ| 1914/2030 [16:36<01:00, 1.92it/s]
94%|ββββββββββ| 1915/2030 [16:37<01:01, 1.88it/s]
94%|ββββββββββ| 1916/2030 [16:37<00:55, 2.05it/s]
94%|ββββββββββ| 1917/2030 [16:38<00:55, 2.05it/s]
94%|ββββββββββ| 1918/2030 [16:38<00:51, 2.17it/s]
95%|ββββββββββ| 1919/2030 [16:39<00:49, 2.24it/s]
95%|ββββββββββ| 1920/2030 [16:39<00:51, 2.14it/s]
95%|ββββββββββ| 1921/2030 [16:40<00:50, 2.14it/s]
95%|ββββββββββ| 1922/2030 [16:40<00:47, 2.27it/s]
95%|ββββββββββ| 1923/2030 [16:40<00:46, 2.30it/s]
95%|ββββββββββ| 1924/2030 [16:41<00:47, 2.23it/s]
95%|ββββββββββ| 1925/2030 [16:41<00:44, 2.35it/s]
95%|ββββββββββ| 1926/2030 [16:42<00:41, 2.48it/s]
95%|ββββββββββ| 1927/2030 [16:42<00:41, 2.50it/s]
95%|ββββββββββ| 1928/2030 [16:43<00:46, 2.21it/s]
95%|ββββββββββ| 1929/2030 [16:43<00:45, 2.22it/s]
95%|ββββββββββ| 1930/2030 [16:43<00:42, 2.33it/s]
95%|ββββββββββ| 1931/2030 [16:44<00:44, 2.20it/s]
95%|ββββββββββ| 1932/2030 [16:44<00:42, 2.29it/s]
95%|ββββββββββ| 1933/2030 [16:45<00:42, 2.27it/s]
95%|ββββββββββ| 1934/2030 [16:45<00:50, 1.91it/s]
95%|ββββββββββ| 1935/2030 [16:46<00:48, 1.96it/s]
95%|ββββββββββ| 1936/2030 [16:46<00:45, 2.07it/s]
95%|ββββββββββ| 1937/2030 [16:47<00:42, 2.17it/s]
95%|ββββββββββ| 1938/2030 [16:47<00:44, 2.05it/s]
96%|ββββββββββ| 1939/2030 [16:48<00:41, 2.19it/s]
96%|ββββββββββ| 1940/2030 [16:48<00:37, 2.41it/s]
96%|ββββββββββ| 1941/2030 [16:49<00:38, 2.30it/s]
96%|ββββββββββ| 1942/2030 [16:49<00:38, 2.28it/s]
96%|ββββββββββ| 1943/2030 [16:49<00:36, 2.39it/s]
96%|ββββββββββ| 1944/2030 [16:50<00:46, 1.86it/s]
96%|ββββββββββ| 1945/2030 [16:51<00:42, 1.98it/s]
96%|ββββββββββ| 1946/2030 [16:51<00:38, 2.19it/s]
96%|ββββββββββ| 1947/2030 [16:51<00:38, 2.17it/s]
96%|ββββββββββ| 1948/2030 [16:52<00:35, 2.31it/s]
96%|ββββββββββ| 1949/2030 [16:52<00:31, 2.53it/s]
96%|ββββββββββ| 1950/2030 [16:53<00:35, 2.26it/s]
96%|ββββββββββ| 1951/2030 [16:53<00:34, 2.32it/s]
96%|ββββββββββ| 1952/2030 [16:54<00:38, 2.04it/s]
96%|ββββββββββ| 1953/2030 [16:54<00:37, 2.05it/s]
96%|ββββββββββ| 1954/2030 [16:55<00:35, 2.17it/s]
96%|ββββββββββ| 1955/2030 [16:55<00:31, 2.39it/s]
96%|ββββββββββ| 1956/2030 [16:56<00:36, 2.05it/s]
96%|ββββββββββ| 1957/2030 [16:56<00:34, 2.12it/s]
96%|ββββββββββ| 1958/2030 [16:56<00:31, 2.29it/s]
97%|ββββββββββ| 1959/2030 [16:57<00:31, 2.26it/s]
97%|ββββββββββ| 1960/2030 [16:57<00:29, 2.38it/s]
97%|ββββββββββ| 1961/2030 [16:58<00:28, 2.43it/s]
97%|ββββββββββ| 1962/2030 [16:58<00:27, 2.48it/s]
97%|ββββββββββ| 1963/2030 [16:58<00:27, 2.43it/s]
97%|ββββββββββ| 1964/2030 [16:59<00:30, 2.20it/s]
97%|ββββββββββ| 1965/2030 [17:00<00:36, 1.79it/s]
97%|ββββββββββ| 1966/2030 [17:00<00:34, 1.83it/s]
97%|ββββββββββ| 1967/2030 [17:01<00:33, 1.90it/s]
97%|ββββββββββ| 1968/2030 [17:01<00:33, 1.82it/s]
97%|ββββββββββ| 1969/2030 [17:02<00:31, 1.92it/s]
97%|ββββββββββ| 1970/2030 [17:02<00:30, 1.94it/s]
97%|ββββββββββ| 1971/2030 [17:03<00:28, 2.05it/s]
97%|ββββββββββ| 1972/2030 [17:03<00:28, 2.05it/s]
97%|ββββββββββ| 1973/2030 [17:04<00:27, 2.07it/s]
97%|ββββββββββ| 1974/2030 [17:04<00:26, 2.12it/s]
97%|ββββββββββ| 1975/2030 [17:05<00:25, 2.13it/s]
97%|ββββββββββ| 1976/2030 [17:05<00:23, 2.28it/s]
97%|ββββββββββ| 1977/2030 [17:05<00:21, 2.42it/s]
97%|ββββββββββ| 1978/2030 [17:06<00:21, 2.47it/s]
97%|ββββββββββ| 1979/2030 [17:06<00:21, 2.40it/s]
98%|ββββββββββ| 1980/2030 [17:07<00:20, 2.41it/s]
98%|ββββββββββ| 1981/2030 [17:07<00:22, 2.17it/s]
98%|ββββββββββ| 1982/2030 [17:08<00:22, 2.16it/s]
98%|ββββββββββ| 1983/2030 [17:08<00:23, 1.98it/s]
98%|ββββββββββ| 1984/2030 [17:09<00:21, 2.14it/s]
98%|ββββββββββ| 1985/2030 [17:09<00:25, 1.80it/s]
98%|ββββββββββ| 1986/2030 [17:10<00:26, 1.66it/s]
98%|ββββββββββ| 1987/2030 [17:10<00:23, 1.85it/s]
98%|ββββββββββ| 1988/2030 [17:11<00:22, 1.86it/s]
98%|ββββββββββ| 1989/2030 [17:12<00:23, 1.72it/s]
98%|ββββββββββ| 1990/2030 [17:12<00:21, 1.90it/s]
98%|ββββββββββ| 1991/2030 [17:12<00:19, 2.02it/s]
98%|ββββββββββ| 1992/2030 [17:13<00:18, 2.02it/s]
98%|ββββββββββ| 1993/2030 [17:13<00:16, 2.19it/s]
98%|ββββββββββ| 1994/2030 [17:14<00:16, 2.15it/s]
98%|ββββββββββ| 1995/2030 [17:14<00:15, 2.28it/s]
98%|ββββββββββ| 1996/2030 [17:15<00:14, 2.30it/s]
98%|ββββββββββ| 1997/2030 [17:15<00:15, 2.18it/s]
98%|ββββββββββ| 1998/2030 [17:15<00:13, 2.35it/s]
98%|ββββββββββ| 1999/2030 [17:16<00:13, 2.23it/s]
99%|ββββββββββ| 2000/2030 [17:17<00:14, 2.02it/s]
99%|ββββββββββ| 2000/2030 [17:17<00:14, 2.02it/s]
99%|ββββββββββ| 2001/2030 [17:17<00:13, 2.08it/s]
99%|ββββββββββ| 2002/2030 [17:17<00:13, 2.11it/s]
99%|ββββββββββ| 2003/2030 [17:18<00:12, 2.22it/s]
99%|ββββββββββ| 2004/2030 [17:18<00:11, 2.22it/s]
99%|ββββββββββ| 2005/2030 [17:19<00:12, 2.03it/s]
99%|ββββββββββ| 2006/2030 [17:20<00:12, 1.86it/s]
99%|ββββββββββ| 2007/2030 [17:20<00:12, 1.85it/s]
99%|ββββββββββ| 2008/2030 [17:21<00:11, 1.98it/s]
99%|ββββββββββ| 2009/2030 [17:21<00:09, 2.10it/s]
99%|ββββββββββ| 2010/2030 [17:21<00:08, 2.25it/s]
99%|ββββββββββ| 2011/2030 [17:22<00:08, 2.12it/s]
99%|ββββββββββ| 2012/2030 [17:22<00:08, 2.05it/s]
99%|ββββββββββ| 2013/2030 [17:23<00:07, 2.15it/s]
99%|ββββββββββ| 2014/2030 [17:23<00:07, 2.22it/s]
99%|ββββββββββ| 2015/2030 [17:24<00:07, 2.01it/s]
99%|ββββββββββ| 2016/2030 [17:24<00:06, 2.12it/s]
99%|ββββββββββ| 2017/2030 [17:25<00:07, 1.71it/s]
99%|ββββββββββ| 2018/2030 [17:25<00:06, 1.96it/s]
99%|ββββββββββ| 2019/2030 [17:26<00:05, 1.99it/s]
100%|ββββββββββ| 2020/2030 [17:26<00:04, 2.08it/s]
100%|ββββββββββ| 2021/2030 [17:27<00:03, 2.27it/s]
100%|ββββββββββ| 2022/2030 [17:27<00:03, 2.32it/s]
100%|ββββββββββ| 2023/2030 [17:28<00:03, 2.28it/s]
100%|ββββββββββ| 2024/2030 [17:28<00:03, 1.98it/s]
100%|ββββββββββ| 2025/2030 [17:29<00:02, 1.92it/s]
100%|ββββββββββ| 2026/2030 [17:29<00:02, 1.71it/s]
100%|ββββββββββ| 2027/2030 [17:30<00:01, 1.91it/s]
100%|ββββββββββ| 2028/2030 [17:30<00:01, 1.84it/s]
100%|ββββββββββ| 2029/2030 [17:31<00:00, 1.75it/s]
100%|ββββββββββ| 2030/2030 [17:32<00:00, 1.75it/s][INFO|trainer.py:3503] 2024-09-09 12:11:44,921 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-2030 |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:11:44,922 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-2030/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:11:45,981 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-2030/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:11:45,982 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-2030/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:11:45,982 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-2030/special_tokens_map.json |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:11:48,995 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:11:48,995 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
[INFO|trainer.py:811] 2024-09-09 12:11:49,046 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 12:11:49,048 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 12:11:49,048 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 12:11:49,048 >> Batch size = 8 |
|
{'eval_loss': 0.30729904770851135, 'eval_precision': 0.6764102564102564, 'eval_recall': 0.7219485495347564, 'eval_f1': 0.6984379136881121, 'eval_accuracy': 0.9500465205813469, 'eval_runtime': 5.8665, 'eval_samples_per_second': 429.386, 'eval_steps_per_second': 53.695, 'epoch': 9.0} |
|
{'loss': 0.0038, 'grad_norm': 0.6682894825935364, 'learning_rate': 7.389162561576355e-07, 'epoch': 9.83} |
|
|
|
0%| | 0/315 [00:00<?, ?it/s][A |
|
3%|β | 8/315 [00:00<00:03, 78.29it/s][A |
|
5%|β | 16/315 [00:00<00:03, 75.16it/s][A |
|
8%|β | 24/315 [00:00<00:03, 76.32it/s][A |
|
10%|β | 32/315 [00:00<00:03, 71.92it/s][A |
|
13%|ββ | 41/315 [00:00<00:03, 75.23it/s][A |
|
16%|ββ | 49/315 [00:00<00:03, 74.25it/s][A |
|
18%|ββ | 57/315 [00:00<00:03, 74.44it/s][A |
|
21%|ββ | 65/315 [00:00<00:03, 72.11it/s][A |
|
23%|βββ | 73/315 [00:00<00:03, 73.85it/s][A |
|
26%|βββ | 81/315 [00:01<00:03, 69.73it/s][A |
|
28%|βββ | 89/315 [00:01<00:03, 67.25it/s][A |
|
31%|βββ | 97/315 [00:01<00:03, 67.10it/s][A |
|
33%|ββββ | 104/315 [00:01<00:03, 67.74it/s][A |
|
36%|ββββ | 112/315 [00:01<00:02, 69.75it/s][A |
|
38%|ββββ | 120/315 [00:01<00:02, 69.52it/s][A |
|
40%|ββββ | 127/315 [00:01<00:02, 68.90it/s][A |
|
43%|βββββ | 134/315 [00:01<00:02, 68.30it/s][A |
|
45%|βββββ | 142/315 [00:02<00:02, 68.18it/s][A |
|
48%|βββββ | 150/315 [00:02<00:02, 71.45it/s][A |
|
50%|βββββ | 159/315 [00:02<00:02, 74.01it/s][A |
|
53%|ββββββ | 167/315 [00:02<00:02, 71.51it/s][A |
|
56%|ββββββ | 175/315 [00:02<00:02, 69.51it/s][A |
|
58%|ββββββ | 182/315 [00:02<00:01, 68.29it/s][A |
|
60%|ββββββ | 189/315 [00:02<00:01, 68.44it/s][A |
|
62%|βββββββ | 196/315 [00:02<00:01, 67.57it/s][A |
|
64%|βββββββ | 203/315 [00:02<00:01, 64.58it/s][A |
|
67%|βββββββ | 210/315 [00:03<00:01, 65.33it/s][A |
|
69%|βββββββ | 218/315 [00:03<00:01, 68.81it/s][A |
|
72%|ββββββββ | 226/315 [00:03<00:01, 71.31it/s][A |
|
75%|ββββββββ | 235/315 [00:03<00:01, 74.35it/s][A |
|
77%|ββββββββ | 243/315 [00:03<00:01, 71.09it/s][A |
|
80%|ββββββββ | 251/315 [00:03<00:00, 71.00it/s][A |
|
82%|βββββββββ | 259/315 [00:03<00:00, 69.89it/s][A |
|
85%|βββββββββ | 267/315 [00:03<00:00, 70.95it/s][A |
|
88%|βββββββββ | 276/315 [00:03<00:00, 74.02it/s][A |
|
90%|βββββββββ | 284/315 [00:04<00:00, 74.49it/s][A |
|
93%|ββββββββββ| 292/315 [00:04<00:00, 72.69it/s][A |
|
95%|ββββββββββ| 300/315 [00:04<00:00, 72.16it/s][A |
|
98%|ββββββββββ| 308/315 [00:04<00:00, 72.43it/s][A
|
|
[A
100%|ββββββββββ| 2030/2030 [17:42<00:00, 1.75it/s] |
|
100%|ββββββββββ| 315/315 [00:05<00:00, 72.43it/s][A |
|
[A[INFO|trainer.py:3503] 2024-09-09 12:11:54,953 >> Saving model checkpoint to /content/dissertation/scripts/ner/output/checkpoint-2030 |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:11:54,954 >> Configuration saved in /content/dissertation/scripts/ner/output/checkpoint-2030/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:11:56,378 >> Model weights saved in /content/dissertation/scripts/ner/output/checkpoint-2030/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:11:56,381 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/checkpoint-2030/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:11:56,381 >> Special tokens file saved in /content/dissertation/scripts/ner/output/checkpoint-2030/special_tokens_map.json |
|
[INFO|trainer.py:2394] 2024-09-09 12:11:58,332 >> |
|
|
|
Training completed. Do not forget to share your model on huggingface.co/models =) |
|
|
|
|
|
[INFO|trainer.py:2632] 2024-09-09 12:11:58,332 >> Loading best model from /content/dissertation/scripts/ner/output/checkpoint-1831 (score: 0.6984379136881121). |
|
100%|ββββββββββ| 2030/2030 [17:45<00:00, 1.75it/s]
100%|ββββββββββ| 2030/2030 [17:45<00:00, 1.90it/s] |
|
[INFO|trainer.py:4283] 2024-09-09 12:11:58,535 >> Waiting for the current checkpoint push to be finished, this might take a couple of minutes. |
|
[INFO|trainer.py:3503] 2024-09-09 12:12:20,226 >> Saving model checkpoint to /content/dissertation/scripts/ner/output |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:12:20,228 >> Configuration saved in /content/dissertation/scripts/ner/output/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:12:21,587 >> Model weights saved in /content/dissertation/scripts/ner/output/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:12:21,588 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:12:21,588 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
[INFO|trainer.py:3503] 2024-09-09 12:12:21,637 >> Saving model checkpoint to /content/dissertation/scripts/ner/output |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:12:21,638 >> Configuration saved in /content/dissertation/scripts/ner/output/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:12:22,908 >> Model weights saved in /content/dissertation/scripts/ner/output/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:12:22,909 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:12:22,909 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
{'eval_loss': 0.3079104423522949, 'eval_precision': 0.6712820512820513, 'eval_recall': 0.7164750957854407, 'eval_f1': 0.6931427058512046, 'eval_accuracy': 0.9500465205813469, 'eval_runtime': 5.9033, 'eval_samples_per_second': 426.708, 'eval_steps_per_second': 53.36, 'epoch': 9.98} |
|
{'train_runtime': 1065.756, 'train_samples_per_second': 122.101, 'train_steps_per_second': 1.905, 'train_loss': 0.04138289297302368, 'epoch': 9.98} |
|
events.out.tfevents.1725882852.0a1c9bec2a53.9893.0: 0%| | 0.00/11.1k [00:00<?, ?B/s]
events.out.tfevents.1725882852.0a1c9bec2a53.9893.0: 100%|ββββββββββ| 11.1k/11.1k [00:00<00:00, 36.9kB/s] |
|
***** train metrics ***** |
|
epoch = 9.9754 |
|
total_flos = 5964967GF |
|
train_loss = 0.0414 |
|
train_runtime = 0:17:45.75 |
|
train_samples = 13013 |
|
train_samples_per_second = 122.101 |
|
train_steps_per_second = 1.905 |
|
09/09/2024 12:12:29 - INFO - __main__ - *** Evaluate *** |
|
[INFO|trainer.py:811] 2024-09-09 12:12:29,073 >> The following columns in the evaluation set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 12:12:29,076 >> |
|
***** Running Evaluation ***** |
|
[INFO|trainer.py:3821] 2024-09-09 12:12:29,076 >> Num examples = 2519 |
|
[INFO|trainer.py:3824] 2024-09-09 12:12:29,076 >> Batch size = 8 |
|
0%| | 0/315 [00:00<?, ?it/s]
3%|β | 8/315 [00:00<00:03, 79.87it/s]
5%|β | 16/315 [00:00<00:03, 76.37it/s]
8%|β | 24/315 [00:00<00:03, 76.98it/s]
10%|β | 32/315 [00:00<00:03, 73.14it/s]
13%|ββ | 41/315 [00:00<00:03, 77.06it/s]
16%|ββ | 49/315 [00:00<00:03, 75.87it/s]
18%|ββ | 57/315 [00:00<00:03, 75.22it/s]
21%|ββ | 65/315 [00:00<00:03, 72.75it/s]
23%|βββ | 73/315 [00:00<00:03, 74.58it/s]
26%|βββ | 81/315 [00:01<00:03, 70.30it/s]
28%|βββ | 89/315 [00:01<00:03, 67.40it/s]
31%|βββ | 97/315 [00:01<00:03, 67.21it/s]
33%|ββββ | 105/315 [00:01<00:03, 68.92it/s]
36%|ββββ | 113/315 [00:01<00:02, 71.06it/s]
38%|ββββ | 121/315 [00:01<00:02, 69.27it/s]
41%|ββββ | 129/315 [00:01<00:02, 70.12it/s]
43%|βββββ | 137/315 [00:01<00:02, 69.43it/s]
46%|βββββ | 144/315 [00:02<00:02, 69.31it/s]
49%|βββββ | 153/315 [00:02<00:02, 73.00it/s]
51%|βββββ | 161/315 [00:02<00:02, 71.79it/s]
54%|ββββββ | 169/315 [00:02<00:02, 71.32it/s]
56%|ββββββ | 177/315 [00:02<00:01, 70.34it/s]
59%|ββββββ | 185/315 [00:02<00:01, 68.51it/s]
61%|ββββββ | 192/315 [00:02<00:01, 68.60it/s]
63%|βββββββ | 199/315 [00:02<00:01, 65.97it/s]
65%|βββββββ | 206/315 [00:02<00:01, 64.76it/s]
68%|βββββββ | 214/315 [00:03<00:01, 68.25it/s]
70%|βββββββ | 222/315 [00:03<00:01, 70.05it/s]
73%|ββββββββ | 230/315 [00:03<00:01, 72.77it/s]
76%|ββββββββ | 239/315 [00:03<00:01, 74.50it/s]
78%|ββββββββ | 247/315 [00:03<00:00, 70.67it/s]
81%|ββββββββ | 255/315 [00:03<00:00, 69.38it/s]
83%|βββββββββ | 263/315 [00:03<00:00, 70.77it/s]
86%|βββββββββ | 271/315 [00:03<00:00, 72.89it/s]
89%|βββββββββ | 280/315 [00:03<00:00, 75.53it/s]
91%|ββββββββββ| 288/315 [00:04<00:00, 72.20it/s]
94%|ββββββββββ| 296/315 [00:04<00:00, 70.67it/s]
97%|ββββββββββ| 304/315 [00:04<00:00, 72.18it/s]
99%|ββββββββββ| 312/315 [00:04<00:00, 72.30it/s]
100%|ββββββββββ| 315/315 [00:06<00:00, 51.84it/s] |
|
***** eval metrics ***** |
|
epoch = 9.9754 |
|
eval_accuracy = 0.95 |
|
eval_f1 = 0.6984 |
|
eval_loss = 0.3073 |
|
eval_precision = 0.6764 |
|
eval_recall = 0.7219 |
|
eval_runtime = 0:00:06.09 |
|
eval_samples = 2519 |
|
eval_samples_per_second = 413.484 |
|
eval_steps_per_second = 51.706 |
|
09/09/2024 12:12:35 - INFO - __main__ - *** Predict *** |
|
[INFO|trainer.py:811] 2024-09-09 12:12:35,170 >> The following columns in the test set don't have a corresponding argument in `RobertaForTokenClassification.forward` and have been ignored: tokens, ner_tags, id. If tokens, ner_tags, id are not expected by `RobertaForTokenClassification.forward`, you can safely ignore this message. |
|
[INFO|trainer.py:3819] 2024-09-09 12:12:35,172 >> |
|
***** Running Prediction ***** |
|
[INFO|trainer.py:3821] 2024-09-09 12:12:35,172 >> Num examples = 4047 |
|
[INFO|trainer.py:3824] 2024-09-09 12:12:35,172 >> Batch size = 8 |
|
0%| | 0/506 [00:00<?, ?it/s]
2%|β | 10/506 [00:00<00:05, 89.99it/s]
4%|β | 19/506 [00:00<00:06, 78.47it/s]
5%|β | 27/506 [00:00<00:06, 77.29it/s]
7%|β | 35/506 [00:00<00:06, 76.19it/s]
8%|β | 43/506 [00:00<00:06, 75.01it/s]
10%|β | 51/506 [00:00<00:06, 74.72it/s]
12%|ββ | 59/506 [00:00<00:06, 72.73it/s]
13%|ββ | 67/506 [00:00<00:05, 74.41it/s]
15%|ββ | 75/506 [00:00<00:05, 73.98it/s]
16%|ββ | 83/506 [00:01<00:06, 64.09it/s]
18%|ββ | 90/506 [00:01<00:06, 64.05it/s]
19%|ββ | 98/506 [00:01<00:06, 67.57it/s]
21%|ββ | 106/506 [00:01<00:05, 69.34it/s]
23%|βββ | 114/506 [00:01<00:05, 72.09it/s]
24%|βββ | 122/506 [00:01<00:05, 70.62it/s]
26%|βββ | 130/506 [00:01<00:06, 60.47it/s]
27%|βββ | 137/506 [00:02<00:06, 59.29it/s]
29%|βββ | 145/506 [00:02<00:05, 63.13it/s]
30%|βββ | 153/506 [00:02<00:05, 62.09it/s]
32%|ββββ | 160/506 [00:02<00:05, 60.95it/s]
33%|ββββ | 167/506 [00:02<00:05, 61.89it/s]
34%|ββββ | 174/506 [00:02<00:05, 63.30it/s]
36%|ββββ | 182/506 [00:02<00:04, 65.88it/s]
38%|ββββ | 190/506 [00:02<00:04, 68.04it/s]
39%|ββββ | 197/506 [00:02<00:04, 67.64it/s]
41%|ββββ | 205/506 [00:03<00:04, 69.76it/s]
42%|βββββ | 213/506 [00:03<00:04, 67.95it/s]
43%|βββββ | 220/506 [00:03<00:04, 66.58it/s]
45%|βββββ | 227/506 [00:03<00:04, 63.22it/s]
46%|βββββ | 234/506 [00:03<00:04, 61.33it/s]
48%|βββββ | 241/506 [00:03<00:04, 63.41it/s]
49%|βββββ | 249/506 [00:03<00:03, 66.94it/s]
51%|βββββ | 256/506 [00:03<00:03, 67.40it/s]
52%|ββββββ | 264/506 [00:03<00:03, 70.60it/s]
54%|ββββββ | 272/506 [00:04<00:03, 72.82it/s]
55%|ββββββ | 280/506 [00:04<00:03, 72.01it/s]
57%|ββββββ | 288/506 [00:04<00:03, 70.69it/s]
58%|ββββββ | 296/506 [00:04<00:02, 70.79it/s]
60%|ββββββ | 304/506 [00:04<00:02, 71.70it/s]
62%|βββββββ | 312/506 [00:04<00:02, 71.70it/s]
63%|βββββββ | 320/506 [00:04<00:02, 73.71it/s]
65%|βββββββ | 329/506 [00:04<00:02, 76.51it/s]
67%|βββββββ | 337/506 [00:04<00:02, 76.82it/s]
68%|βββββββ | 345/506 [00:04<00:02, 77.52it/s]
70%|βββββββ | 353/506 [00:05<00:01, 77.18it/s]
71%|ββββββββ | 361/506 [00:05<00:01, 76.54it/s]
73%|ββββββββ | 369/506 [00:05<00:01, 71.00it/s]
75%|ββββββββ | 377/506 [00:05<00:01, 66.99it/s]
76%|ββββββββ | 384/506 [00:05<00:01, 64.26it/s]
77%|ββββββββ | 391/506 [00:05<00:01, 60.26it/s]
79%|ββββββββ | 398/506 [00:05<00:01, 58.75it/s]
80%|ββββββββ | 405/506 [00:05<00:01, 59.98it/s]
81%|βββββββββ | 412/506 [00:06<00:01, 61.53it/s]
83%|βββββββββ | 419/506 [00:06<00:01, 63.24it/s]
84%|βββββββββ | 426/506 [00:06<00:01, 63.10it/s]
86%|βββββββββ | 434/506 [00:06<00:01, 66.36it/s]
87%|βββββββββ | 441/506 [00:06<00:00, 66.96it/s]
89%|βββββββββ | 448/506 [00:06<00:00, 66.98it/s]
90%|βββββββββ | 456/506 [00:06<00:00, 69.30it/s]
92%|ββββββββββ| 465/506 [00:06<00:00, 71.88it/s]
93%|ββββββββββ| 473/506 [00:06<00:00, 73.65it/s]
95%|ββββββββββ| 481/506 [00:07<00:00, 74.93it/s]
97%|ββββββββββ| 489/506 [00:07<00:00, 70.10it/s]
98%|ββββββββββ| 497/506 [00:07<00:00, 71.43it/s]
100%|ββββββββββ| 505/506 [00:07<00:00, 73.77it/s]
100%|ββββββββββ| 506/506 [00:09<00:00, 51.99it/s] |
|
[INFO|trainer.py:3503] 2024-09-09 12:12:45,082 >> Saving model checkpoint to /content/dissertation/scripts/ner/output |
|
[INFO|configuration_utils.py:472] 2024-09-09 12:12:45,084 >> Configuration saved in /content/dissertation/scripts/ner/output/config.json |
|
[INFO|modeling_utils.py:2799] 2024-09-09 12:12:46,408 >> Model weights saved in /content/dissertation/scripts/ner/output/model.safetensors |
|
[INFO|tokenization_utils_base.py:2684] 2024-09-09 12:12:46,409 >> tokenizer config file saved in /content/dissertation/scripts/ner/output/tokenizer_config.json |
|
[INFO|tokenization_utils_base.py:2693] 2024-09-09 12:12:46,410 >> Special tokens file saved in /content/dissertation/scripts/ner/output/special_tokens_map.json |
|
***** predict metrics ***** |
|
predict_accuracy = 0.9467 |
|
predict_f1 = 0.6952 |
|
predict_loss = 0.3348 |
|
predict_precision = 0.6863 |
|
predict_recall = 0.7042 |
|
predict_runtime = 0:00:09.74 |
|
predict_samples_per_second = 415.118 |
|
predict_steps_per_second = 51.903 |
|
events.out.tfevents.1725883955.0a1c9bec2a53.9893.1: 0%| | 0.00/560 [00:00<?, ?B/s]
events.out.tfevents.1725883955.0a1c9bec2a53.9893.1: 100%|ββββββββββ| 560/560 [00:00<00:00, 2.28kB/s] |
|
|