diff --git a/checkpoint-1000/config.json b/checkpoint-1000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a43ca8c9b3b47a955c94a961cf27058773d6bc8 --- /dev/null +++ b/checkpoint-1000/config.json @@ -0,0 +1,48 @@ +{ + "_name_or_path": "albert-base-v2", + "architectures": [ + "AlbertForSequenceClassification" + ], + "attention_probs_dropout_prob": 0, + "bos_token_id": 2, + "classifier_dropout_prob": 0.1, + "down_scale_factor": 1, + "embedding_size": 128, + "eos_token_id": 3, + "gap_size": 0, + "hidden_act": "gelu_new", + "hidden_dropout_prob": 0, + "hidden_size": 768, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1", + "2": "LABEL_2", + "3": "LABEL_3", + "4": "LABEL_4" + }, + "initializer_range": 0.02, + "inner_group_num": 1, + "intermediate_size": 3072, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1, + "LABEL_2": 2, + "LABEL_3": 3, + "LABEL_4": 4 + }, + "layer_norm_eps": 1e-12, + "max_position_embeddings": 512, + "model_type": "albert", + "net_structure_type": 0, + "num_attention_heads": 12, + "num_hidden_groups": 1, + "num_hidden_layers": 12, + "num_memory_blocks": 0, + "pad_token_id": 0, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.30.2", + "type_vocab_size": 2, + "vocab_size": 30000 +} diff --git a/checkpoint-1000/optimizer.pt b/checkpoint-1000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd77113ec86f5fdeedc28b034430d19935e0a2fa --- /dev/null +++ b/checkpoint-1000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5162cdc7e150c38199a0bf2f6b022e86fe4e5fab0a4b1571eb3cfd1e04c3595a +size 93515251 diff --git a/checkpoint-1000/pytorch_model.bin b/checkpoint-1000/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..06cfe8b79f725c7636087ec1c8dd61d5c9abd029 --- /dev/null +++ b/checkpoint-1000/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:287a721123004c8d73c220ae75a7e6b149cf0be72e47e01c77e97b730ce43f39 +size 46763397 diff --git a/checkpoint-1000/rng_state.pth b/checkpoint-1000/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..7bfdb7720ef3d0fd1d2252391fde3002f08b6988 --- /dev/null +++ b/checkpoint-1000/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee7b70f7fa47ac37bcbe098e2b10c20b3b195f8c1766739e3db895348a26874 +size 14575 diff --git a/checkpoint-1000/scheduler.pt b/checkpoint-1000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8b546af01f66362feab8cb3d8d5dfe2f2d4c677 --- /dev/null +++ b/checkpoint-1000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:084ebba0eb2a420ffdfb3098966cebfb8672516d6cdb7cb9bd358081a446703c +size 627 diff --git a/checkpoint-1000/trainer_state.json b/checkpoint-1000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..4081ef1b9a447dc21efacb7f7581175ce2c72327 --- /dev/null +++ b/checkpoint-1000/trainer_state.json @@ -0,0 +1,28 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.4452359750667854, + "global_step": 1000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.22, + "learning_rate": 5e-05, + "loss": 1.3082, + "step": 500 + }, + { + "epoch": 0.45, + "learning_rate": 4.37374749498998e-05, + "loss": 1.0848, + "step": 1000 + } + ], + "max_steps": 4492, + "num_train_epochs": 2, + "total_flos": 382483021824000.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-1000/training_args.bin b/checkpoint-1000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..205f9aa66656d6dbd571c708a776ef297d868d00 --- /dev/null +++ b/checkpoint-1000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c74f0fea927ae5a6dd93c20442abe9cb0ec0c27b1feb0ae3d88288eefccf96 +size 3899 diff --git a/checkpoint-1500/config.json b/checkpoint-1500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a43ca8c9b3b47a955c94a961cf27058773d6bc8 --- /dev/null +++ b/checkpoint-1500/config.json @@ -0,0 +1,48 @@ +{ + "_name_or_path": "albert-base-v2", + "architectures": [ + "AlbertForSequenceClassification" + ], + "attention_probs_dropout_prob": 0, + "bos_token_id": 2, + "classifier_dropout_prob": 0.1, + "down_scale_factor": 1, + "embedding_size": 128, + "eos_token_id": 3, + "gap_size": 0, + "hidden_act": "gelu_new", + "hidden_dropout_prob": 0, + "hidden_size": 768, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1", + "2": "LABEL_2", + "3": "LABEL_3", + "4": "LABEL_4" + }, + "initializer_range": 0.02, + "inner_group_num": 1, + "intermediate_size": 3072, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1, + "LABEL_2": 2, + "LABEL_3": 3, + "LABEL_4": 4 + }, + "layer_norm_eps": 1e-12, + "max_position_embeddings": 512, + "model_type": "albert", + "net_structure_type": 0, + "num_attention_heads": 12, + "num_hidden_groups": 1, + "num_hidden_layers": 12, + "num_memory_blocks": 0, + "pad_token_id": 0, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.30.2", + "type_vocab_size": 2, + "vocab_size": 30000 +} diff --git a/checkpoint-1500/optimizer.pt b/checkpoint-1500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fda56814cf8ac0a445f574966b31bd50424bf4a --- /dev/null +++ b/checkpoint-1500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631adef8f48cc879fc1772f0a4ab1210dbad8d9c5355bc16922c4432659e0e07 +size 93515251 diff --git a/checkpoint-1500/pytorch_model.bin b/checkpoint-1500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..ac8a3df66bfaac12d599b3ac1647fdf64d447379 --- /dev/null +++ b/checkpoint-1500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e078665c7f18286737bf025cff999343ec68bc3f367c66f6e8c7a1baa40a6b3e +size 46763397 diff --git a/checkpoint-1500/rng_state.pth b/checkpoint-1500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e0187916bec19e844bd09f996833e734ddc6e75 --- /dev/null +++ b/checkpoint-1500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cf83649e305fc92e7f425c75319d8d8f11a58bbf5ed6ad6d1f21875f76f9f51 +size 14575 diff --git a/checkpoint-1500/scheduler.pt b/checkpoint-1500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eebc1d109faaaa3888f8b7f28b94538e8d17f19 --- /dev/null +++ b/checkpoint-1500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94bfc714f526b0ce075c39d8e757ea14a02823f50580140d9d9927a3c16307f +size 627 diff --git a/checkpoint-1500/trainer_state.json b/checkpoint-1500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..096cf3fc32a846ca81f5d899d5cb337c2c5ed3f0 --- /dev/null +++ b/checkpoint-1500/trainer_state.json @@ -0,0 +1,34 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.667853962600178, + "global_step": 1500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.22, + "learning_rate": 5e-05, + "loss": 1.3082, + "step": 500 + }, + { + "epoch": 0.45, + "learning_rate": 4.37374749498998e-05, + "loss": 1.0848, + "step": 1000 + }, + { + "epoch": 0.67, + "learning_rate": 3.74749498997996e-05, + "loss": 1.0004, + "step": 1500 + } + ], + "max_steps": 4492, + "num_train_epochs": 2, + "total_flos": 573724532736000.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-1500/training_args.bin b/checkpoint-1500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..205f9aa66656d6dbd571c708a776ef297d868d00 --- /dev/null +++ b/checkpoint-1500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c74f0fea927ae5a6dd93c20442abe9cb0ec0c27b1feb0ae3d88288eefccf96 +size 3899 diff --git a/checkpoint-2000/config.json b/checkpoint-2000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a43ca8c9b3b47a955c94a961cf27058773d6bc8 --- /dev/null +++ b/checkpoint-2000/config.json @@ -0,0 +1,48 @@ +{ + "_name_or_path": "albert-base-v2", + "architectures": [ + "AlbertForSequenceClassification" + ], + "attention_probs_dropout_prob": 0, + "bos_token_id": 2, + "classifier_dropout_prob": 0.1, + "down_scale_factor": 1, + "embedding_size": 128, + "eos_token_id": 3, + "gap_size": 0, + "hidden_act": "gelu_new", + "hidden_dropout_prob": 0, + "hidden_size": 768, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1", + "2": "LABEL_2", + "3": "LABEL_3", + "4": "LABEL_4" + }, + "initializer_range": 0.02, + "inner_group_num": 1, + "intermediate_size": 3072, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1, + "LABEL_2": 2, + "LABEL_3": 3, + "LABEL_4": 4 + }, + "layer_norm_eps": 1e-12, + "max_position_embeddings": 512, + "model_type": "albert", + "net_structure_type": 0, + "num_attention_heads": 12, + "num_hidden_groups": 1, + "num_hidden_layers": 12, + "num_memory_blocks": 0, + "pad_token_id": 0, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.30.2", + "type_vocab_size": 2, + "vocab_size": 30000 +} diff --git a/checkpoint-2000/optimizer.pt b/checkpoint-2000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a8f7de64a4132286cb884c4ba546211ac628c51 --- /dev/null +++ b/checkpoint-2000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3e122441167c8b2acaae70972155a403a7af29ff8205ad3895b1ee87c23e8f1 +size 93515251 diff --git a/checkpoint-2000/pytorch_model.bin b/checkpoint-2000/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..c9c11c6d9a24b91fbf278136343cbc46c12a7bde --- /dev/null +++ b/checkpoint-2000/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a2747097db5358954b136384a9032ab622e51e4496c59fcc9bf6f19ad75258 +size 46763397 diff --git a/checkpoint-2000/rng_state.pth b/checkpoint-2000/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..97ff2f3b67daf88ed5ef5eed35fb07d2890cfd6d --- /dev/null +++ b/checkpoint-2000/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c41916c11c52ae9eb1f8eb57fa5e92ab81b4719df8e81cf9955d611fff46c648 +size 14575 diff --git a/checkpoint-2000/scheduler.pt b/checkpoint-2000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba86cb8ea70d3472411d2a0964393c41b6b04286 --- /dev/null +++ b/checkpoint-2000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:514cee12839556455629fe90048db0fbd080eb8fab678afa2636814da5a87b0b +size 627 diff --git a/checkpoint-2000/trainer_state.json b/checkpoint-2000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..16411589a8da810524cc072b1f46a054e4c97916 --- /dev/null +++ b/checkpoint-2000/trainer_state.json @@ -0,0 +1,40 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.8904719501335708, + "global_step": 2000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.22, + "learning_rate": 5e-05, + "loss": 1.3082, + "step": 500 + }, + { + "epoch": 0.45, + "learning_rate": 4.37374749498998e-05, + "loss": 1.0848, + "step": 1000 + }, + { + "epoch": 0.67, + "learning_rate": 3.74749498997996e-05, + "loss": 1.0004, + "step": 1500 + }, + { + "epoch": 0.89, + "learning_rate": 3.12124248496994e-05, + "loss": 0.9697, + "step": 2000 + } + ], + "max_steps": 4492, + "num_train_epochs": 2, + "total_flos": 764966043648000.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-2000/training_args.bin b/checkpoint-2000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..205f9aa66656d6dbd571c708a776ef297d868d00 --- /dev/null +++ b/checkpoint-2000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c74f0fea927ae5a6dd93c20442abe9cb0ec0c27b1feb0ae3d88288eefccf96 +size 3899 diff --git a/checkpoint-2500/config.json b/checkpoint-2500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a43ca8c9b3b47a955c94a961cf27058773d6bc8 --- /dev/null +++ b/checkpoint-2500/config.json @@ -0,0 +1,48 @@ +{ + "_name_or_path": "albert-base-v2", + "architectures": [ + "AlbertForSequenceClassification" + ], + "attention_probs_dropout_prob": 0, + "bos_token_id": 2, + "classifier_dropout_prob": 0.1, + "down_scale_factor": 1, + "embedding_size": 128, + "eos_token_id": 3, + "gap_size": 0, + "hidden_act": "gelu_new", + "hidden_dropout_prob": 0, + "hidden_size": 768, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1", + "2": "LABEL_2", + "3": "LABEL_3", + "4": "LABEL_4" + }, + "initializer_range": 0.02, + "inner_group_num": 1, + "intermediate_size": 3072, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1, + "LABEL_2": 2, + "LABEL_3": 3, + "LABEL_4": 4 + }, + "layer_norm_eps": 1e-12, + "max_position_embeddings": 512, + "model_type": "albert", + "net_structure_type": 0, + "num_attention_heads": 12, + "num_hidden_groups": 1, + "num_hidden_layers": 12, + "num_memory_blocks": 0, + "pad_token_id": 0, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.30.2", + "type_vocab_size": 2, + "vocab_size": 30000 +} diff --git a/checkpoint-2500/optimizer.pt b/checkpoint-2500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bd82db8e3459c5ff3ca52a895c9b5b00f484dd6 --- /dev/null +++ b/checkpoint-2500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1926b9f4407cddf2624857403d0a49eaed378a219e2395a47b5d58712e20b199 +size 93515251 diff --git a/checkpoint-2500/pytorch_model.bin b/checkpoint-2500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..572c430cb73bb2c219bdd757bebf10dece60099f --- /dev/null +++ b/checkpoint-2500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee437a17f548e4badf2b4432a5ed01d1d00c2e411f797e1ed5c30c2328b5146 +size 46763397 diff --git a/checkpoint-2500/rng_state.pth b/checkpoint-2500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..09732e55b741dac6d78f59975c3791e218c9a4fa --- /dev/null +++ b/checkpoint-2500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50a44eb54b4705cdd4d53277365f55b77947a284fdf9040322c04e7f4228ea32 +size 14575 diff --git a/checkpoint-2500/scheduler.pt b/checkpoint-2500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..788d60d2edae7bde3b12df2b6914051920404890 --- /dev/null +++ b/checkpoint-2500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a34cf069b87bb3938fb90cccd941ef9160d044d428876ee79ec13296d8ba0514 +size 627 diff --git a/checkpoint-2500/trainer_state.json b/checkpoint-2500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..15e9be9af075cd10dc3b8c8fc2b00dce2c00284d --- /dev/null +++ b/checkpoint-2500/trainer_state.json @@ -0,0 +1,46 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.1130899376669634, + "global_step": 2500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.22, + "learning_rate": 5e-05, + "loss": 1.3082, + "step": 500 + }, + { + "epoch": 0.45, + "learning_rate": 4.37374749498998e-05, + "loss": 1.0848, + "step": 1000 + }, + { + "epoch": 0.67, + "learning_rate": 3.74749498997996e-05, + "loss": 1.0004, + "step": 1500 + }, + { + "epoch": 0.89, + "learning_rate": 3.12124248496994e-05, + "loss": 0.9697, + "step": 2000 + }, + { + "epoch": 1.11, + "learning_rate": 2.49498997995992e-05, + "loss": 0.9269, + "step": 2500 + } + ], + "max_steps": 4492, + "num_train_epochs": 2, + "total_flos": 955872881915904.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-2500/training_args.bin b/checkpoint-2500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..205f9aa66656d6dbd571c708a776ef297d868d00 --- /dev/null +++ b/checkpoint-2500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c74f0fea927ae5a6dd93c20442abe9cb0ec0c27b1feb0ae3d88288eefccf96 +size 3899 diff --git a/checkpoint-3000/config.json b/checkpoint-3000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a43ca8c9b3b47a955c94a961cf27058773d6bc8 --- /dev/null +++ b/checkpoint-3000/config.json @@ -0,0 +1,48 @@ +{ + "_name_or_path": "albert-base-v2", + "architectures": [ + "AlbertForSequenceClassification" + ], + "attention_probs_dropout_prob": 0, + "bos_token_id": 2, + "classifier_dropout_prob": 0.1, + "down_scale_factor": 1, + "embedding_size": 128, + "eos_token_id": 3, + "gap_size": 0, + "hidden_act": "gelu_new", + "hidden_dropout_prob": 0, + "hidden_size": 768, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1", + "2": "LABEL_2", + "3": "LABEL_3", + "4": "LABEL_4" + }, + "initializer_range": 0.02, + "inner_group_num": 1, + "intermediate_size": 3072, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1, + "LABEL_2": 2, + "LABEL_3": 3, + "LABEL_4": 4 + }, + "layer_norm_eps": 1e-12, + "max_position_embeddings": 512, + "model_type": "albert", + "net_structure_type": 0, + "num_attention_heads": 12, + "num_hidden_groups": 1, + "num_hidden_layers": 12, + "num_memory_blocks": 0, + "pad_token_id": 0, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.30.2", + "type_vocab_size": 2, + "vocab_size": 30000 +} diff --git a/checkpoint-3000/optimizer.pt b/checkpoint-3000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..30c7990816a5b2cf336169564e4312e834607006 --- /dev/null +++ b/checkpoint-3000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:420dd64f23e2b68d1b1b96356faa6548bd8615714a986e6ee6234b2a4491c8d8 +size 93515251 diff --git a/checkpoint-3000/pytorch_model.bin b/checkpoint-3000/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0aaa9df69570fa8d0aa96c87720f3e24f7ecaad --- /dev/null +++ b/checkpoint-3000/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:220a74606152bcd98b4a03ad30c8ff16aaf209fd0087a5b832c1412bf5970408 +size 46763397 diff --git a/checkpoint-3000/rng_state.pth b/checkpoint-3000/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..95893484c0f00c4a8351828a3b9a038231cdf043 --- /dev/null +++ b/checkpoint-3000/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aa4f5ffc0dcf47df51739d4080dfd7ed935455d66016e6df47a65d8446b90f4 +size 14575 diff --git a/checkpoint-3000/scheduler.pt b/checkpoint-3000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..39727c003bc13a8b1a1e5df127c8fe37fb64248b --- /dev/null +++ b/checkpoint-3000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef3a9f861b0aa1ad29b5b6d84f6cb654853bead44b67a901b2a1205cae12b3c8 +size 627 diff --git a/checkpoint-3000/trainer_state.json b/checkpoint-3000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..930fa4817f4e79e7f6167a2b1cb9967d858385d3 --- /dev/null +++ b/checkpoint-3000/trainer_state.json @@ -0,0 +1,52 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.335707925200356, + "global_step": 3000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.22, + "learning_rate": 5e-05, + "loss": 1.3082, + "step": 500 + }, + { + "epoch": 0.45, + "learning_rate": 4.37374749498998e-05, + "loss": 1.0848, + "step": 1000 + }, + { + "epoch": 0.67, + "learning_rate": 3.74749498997996e-05, + "loss": 1.0004, + "step": 1500 + }, + { + "epoch": 0.89, + "learning_rate": 3.12124248496994e-05, + "loss": 0.9697, + "step": 2000 + }, + { + "epoch": 1.11, + "learning_rate": 2.49498997995992e-05, + "loss": 0.9269, + "step": 2500 + }, + { + "epoch": 1.34, + "learning_rate": 1.8687374749499e-05, + "loss": 0.8869, + "step": 3000 + } + ], + "max_steps": 4492, + "num_train_epochs": 2, + "total_flos": 1147114392827904.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-3000/training_args.bin b/checkpoint-3000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..205f9aa66656d6dbd571c708a776ef297d868d00 --- /dev/null +++ b/checkpoint-3000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c74f0fea927ae5a6dd93c20442abe9cb0ec0c27b1feb0ae3d88288eefccf96 +size 3899 diff --git a/checkpoint-3500/config.json b/checkpoint-3500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a43ca8c9b3b47a955c94a961cf27058773d6bc8 --- /dev/null +++ b/checkpoint-3500/config.json @@ -0,0 +1,48 @@ +{ + "_name_or_path": "albert-base-v2", + "architectures": [ + "AlbertForSequenceClassification" + ], + "attention_probs_dropout_prob": 0, + "bos_token_id": 2, + "classifier_dropout_prob": 0.1, + "down_scale_factor": 1, + "embedding_size": 128, + "eos_token_id": 3, + "gap_size": 0, + "hidden_act": "gelu_new", + "hidden_dropout_prob": 0, + "hidden_size": 768, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1", + "2": "LABEL_2", + "3": "LABEL_3", + "4": "LABEL_4" + }, + "initializer_range": 0.02, + "inner_group_num": 1, + "intermediate_size": 3072, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1, + "LABEL_2": 2, + "LABEL_3": 3, + "LABEL_4": 4 + }, + "layer_norm_eps": 1e-12, + "max_position_embeddings": 512, + "model_type": "albert", + "net_structure_type": 0, + "num_attention_heads": 12, + "num_hidden_groups": 1, + "num_hidden_layers": 12, + "num_memory_blocks": 0, + "pad_token_id": 0, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.30.2", + "type_vocab_size": 2, + "vocab_size": 30000 +} diff --git a/checkpoint-3500/optimizer.pt b/checkpoint-3500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccbf18622492682f5b97c6dc5069cf81ba820ed6 --- /dev/null +++ b/checkpoint-3500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33a27e283edff413aeedb98a353a22c1c2cce0c9961588fa8cbb016f443ff514 +size 93515251 diff --git a/checkpoint-3500/pytorch_model.bin b/checkpoint-3500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..d267a283b85e1edbc3e5a7525b4ad7ca23fa64f6 --- /dev/null +++ b/checkpoint-3500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1baeda303de05e8e64bfde4afcdf46197d5dc8c11ec34f00e4c920d05e739bbc +size 46763397 diff --git a/checkpoint-3500/rng_state.pth b/checkpoint-3500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..c1e52847efeb9f8b9ebfbf0e7b1b65293fc1c109 --- /dev/null +++ b/checkpoint-3500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4780cc04e020a8b669447bf7cac1162c22e0ba149ef578c010549619f16d0224 +size 14575 diff --git a/checkpoint-3500/scheduler.pt b/checkpoint-3500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e3596efaa4dfd2f8ed173dd4102df361fdb48a9 --- /dev/null +++ b/checkpoint-3500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85a30d94ddf9dc46a22db21308fefceeafa29b5fef8c980796e0c5fd1af84e31 +size 627 diff --git a/checkpoint-3500/trainer_state.json b/checkpoint-3500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..8db8a9d7d9f0a9bf1a0d1b2ae2444f133bfc1455 --- /dev/null +++ b/checkpoint-3500/trainer_state.json @@ -0,0 +1,58 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.558325912733749, + "global_step": 3500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.22, + "learning_rate": 5e-05, + "loss": 1.3082, + "step": 500 + }, + { + "epoch": 0.45, + "learning_rate": 4.37374749498998e-05, + "loss": 1.0848, + "step": 1000 + }, + { + "epoch": 0.67, + "learning_rate": 3.74749498997996e-05, + "loss": 1.0004, + "step": 1500 + }, + { + "epoch": 0.89, + "learning_rate": 3.12124248496994e-05, + "loss": 0.9697, + "step": 2000 + }, + { + "epoch": 1.11, + "learning_rate": 2.49498997995992e-05, + "loss": 0.9269, + "step": 2500 + }, + { + "epoch": 1.34, + "learning_rate": 1.8687374749499e-05, + "loss": 0.8869, + "step": 3000 + }, + { + "epoch": 1.56, + "learning_rate": 1.2424849699398798e-05, + "loss": 0.8755, + "step": 3500 + } + ], + "max_steps": 4492, + "num_train_epochs": 2, + "total_flos": 1338355903739904.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-3500/training_args.bin b/checkpoint-3500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..205f9aa66656d6dbd571c708a776ef297d868d00 --- /dev/null +++ b/checkpoint-3500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c74f0fea927ae5a6dd93c20442abe9cb0ec0c27b1feb0ae3d88288eefccf96 +size 3899 diff --git a/checkpoint-4000/config.json b/checkpoint-4000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a43ca8c9b3b47a955c94a961cf27058773d6bc8 --- /dev/null +++ b/checkpoint-4000/config.json @@ -0,0 +1,48 @@ +{ + "_name_or_path": "albert-base-v2", + "architectures": [ + "AlbertForSequenceClassification" + ], + "attention_probs_dropout_prob": 0, + "bos_token_id": 2, + "classifier_dropout_prob": 0.1, + "down_scale_factor": 1, + "embedding_size": 128, + "eos_token_id": 3, + "gap_size": 0, + "hidden_act": "gelu_new", + "hidden_dropout_prob": 0, + "hidden_size": 768, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1", + "2": "LABEL_2", + "3": "LABEL_3", + "4": "LABEL_4" + }, + "initializer_range": 0.02, + "inner_group_num": 1, + "intermediate_size": 3072, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1, + "LABEL_2": 2, + "LABEL_3": 3, + "LABEL_4": 4 + }, + "layer_norm_eps": 1e-12, + "max_position_embeddings": 512, + "model_type": "albert", + "net_structure_type": 0, + "num_attention_heads": 12, + "num_hidden_groups": 1, + "num_hidden_layers": 12, + "num_memory_blocks": 0, + "pad_token_id": 0, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.30.2", + "type_vocab_size": 2, + "vocab_size": 30000 +} diff --git a/checkpoint-4000/optimizer.pt b/checkpoint-4000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb4e6b6d047c3dea9c32dd9f2ef4e2a28f10faee --- /dev/null +++ b/checkpoint-4000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee87f7e203e5c399b85d4b01bca398f5344b1c8e7514b66e630de26d00b577a +size 93515251 diff --git a/checkpoint-4000/pytorch_model.bin b/checkpoint-4000/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..f1128fa9ab4c7c0f65871bb854a741c670642640 --- /dev/null +++ b/checkpoint-4000/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ed86d884ee503ba33952cd210b5dca3d77fd3fa3a06fcfd220a9c559bdf181b +size 46763397 diff --git a/checkpoint-4000/rng_state.pth b/checkpoint-4000/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..31eb26d260155338617b42f3b56a6ecf4dc2e1ff --- /dev/null +++ b/checkpoint-4000/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1eb381eb47fc8f7a1209158a79968f4c1e6905e6dc1f0625995fe2c4d3427e7 +size 14575 diff --git a/checkpoint-4000/scheduler.pt b/checkpoint-4000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..3028705f4620c3592a7a71124da135f29c86da6a --- /dev/null +++ b/checkpoint-4000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b126e824777601f7f9b00008258a8085739902f490ab32ff2eea0b26ad0a9428 +size 627 diff --git a/checkpoint-4000/trainer_state.json b/checkpoint-4000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..0690a7df4b9eb004845121e7e62042e56a0357fc --- /dev/null +++ b/checkpoint-4000/trainer_state.json @@ -0,0 +1,64 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.7809439002671414, + "global_step": 4000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.22, + "learning_rate": 5e-05, + "loss": 1.3082, + "step": 500 + }, + { + "epoch": 0.45, + "learning_rate": 4.37374749498998e-05, + "loss": 1.0848, + "step": 1000 + }, + { + "epoch": 0.67, + "learning_rate": 3.74749498997996e-05, + "loss": 1.0004, + "step": 1500 + }, + { + "epoch": 0.89, + "learning_rate": 3.12124248496994e-05, + "loss": 0.9697, + "step": 2000 + }, + { + "epoch": 1.11, + "learning_rate": 2.49498997995992e-05, + "loss": 0.9269, + "step": 2500 + }, + { + "epoch": 1.34, + "learning_rate": 1.8687374749499e-05, + "loss": 0.8869, + "step": 3000 + }, + { + "epoch": 1.56, + "learning_rate": 1.2424849699398798e-05, + "loss": 0.8755, + "step": 3500 + }, + { + "epoch": 1.78, + "learning_rate": 6.162324649298597e-06, + "loss": 0.8698, + "step": 4000 + } + ], + "max_steps": 4492, + "num_train_epochs": 2, + "total_flos": 1529597414651904.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-4000/training_args.bin b/checkpoint-4000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..205f9aa66656d6dbd571c708a776ef297d868d00 --- /dev/null +++ b/checkpoint-4000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c74f0fea927ae5a6dd93c20442abe9cb0ec0c27b1feb0ae3d88288eefccf96 +size 3899 diff --git a/checkpoint-500/config.json b/checkpoint-500/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a43ca8c9b3b47a955c94a961cf27058773d6bc8 --- /dev/null +++ b/checkpoint-500/config.json @@ -0,0 +1,48 @@ +{ + "_name_or_path": "albert-base-v2", + "architectures": [ + "AlbertForSequenceClassification" + ], + "attention_probs_dropout_prob": 0, + "bos_token_id": 2, + "classifier_dropout_prob": 0.1, + "down_scale_factor": 1, + "embedding_size": 128, + "eos_token_id": 3, + "gap_size": 0, + "hidden_act": "gelu_new", + "hidden_dropout_prob": 0, + "hidden_size": 768, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1", + "2": "LABEL_2", + "3": "LABEL_3", + "4": "LABEL_4" + }, + "initializer_range": 0.02, + "inner_group_num": 1, + "intermediate_size": 3072, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1, + "LABEL_2": 2, + "LABEL_3": 3, + "LABEL_4": 4 + }, + "layer_norm_eps": 1e-12, + "max_position_embeddings": 512, + "model_type": "albert", + "net_structure_type": 0, + "num_attention_heads": 12, + "num_hidden_groups": 1, + "num_hidden_layers": 12, + "num_memory_blocks": 0, + "pad_token_id": 0, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.30.2", + "type_vocab_size": 2, + "vocab_size": 30000 +} diff --git a/checkpoint-500/optimizer.pt b/checkpoint-500/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..c99762e9c93193ccd0aebda7906312767e5db577 --- /dev/null +++ b/checkpoint-500/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62c2ad1da57372c3076c720f7eb96efd6b61e2d07823733edac011b729223637 +size 93515251 diff --git a/checkpoint-500/pytorch_model.bin b/checkpoint-500/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..a6bf6e2023fdfecf5d584f11abfd1d8152d57f11 --- /dev/null +++ b/checkpoint-500/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71c5c33946a4dd914232f236c4085efc0126d60c462ba5097a0da8b912986c06 +size 46763397 diff --git a/checkpoint-500/rng_state.pth b/checkpoint-500/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..86517f72d7d1af263ea13afb4ac0d47f2b082e1f --- /dev/null +++ b/checkpoint-500/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:848f52f48a329e352c832f23fbde64aa1efae54c59bd39253c95ef6d0c1dad1a +size 14575 diff --git a/checkpoint-500/scheduler.pt b/checkpoint-500/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8adedcfe6ca473eebf68f588e3fe2e9226534ba0 --- /dev/null +++ b/checkpoint-500/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c05be3962c0b78b7a603157e0a8d651a7e7f492381267255975412abcca2156 +size 627 diff --git a/checkpoint-500/trainer_state.json b/checkpoint-500/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..24fb85b03ba0941a0363c7e66c421cb2ee7c2a92 --- /dev/null +++ b/checkpoint-500/trainer_state.json @@ -0,0 +1,22 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.2226179875333927, + "global_step": 500, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.22, + "learning_rate": 5e-05, + "loss": 1.3082, + "step": 500 + } + ], + "max_steps": 4492, + "num_train_epochs": 2, + "total_flos": 191241510912000.0, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-500/training_args.bin b/checkpoint-500/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..205f9aa66656d6dbd571c708a776ef297d868d00 --- /dev/null +++ b/checkpoint-500/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c74f0fea927ae5a6dd93c20442abe9cb0ec0c27b1feb0ae3d88288eefccf96 +size 3899 diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0a43ca8c9b3b47a955c94a961cf27058773d6bc8 --- /dev/null +++ b/config.json @@ -0,0 +1,48 @@ +{ + "_name_or_path": "albert-base-v2", + "architectures": [ + "AlbertForSequenceClassification" + ], + "attention_probs_dropout_prob": 0, + "bos_token_id": 2, + "classifier_dropout_prob": 0.1, + "down_scale_factor": 1, + "embedding_size": 128, + "eos_token_id": 3, + "gap_size": 0, + "hidden_act": "gelu_new", + "hidden_dropout_prob": 0, + "hidden_size": 768, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1", + "2": "LABEL_2", + "3": "LABEL_3", + "4": "LABEL_4" + }, + "initializer_range": 0.02, + "inner_group_num": 1, + "intermediate_size": 3072, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1, + "LABEL_2": 2, + "LABEL_3": 3, + "LABEL_4": 4 + }, + "layer_norm_eps": 1e-12, + "max_position_embeddings": 512, + "model_type": "albert", + "net_structure_type": 0, + "num_attention_heads": 12, + "num_hidden_groups": 1, + "num_hidden_layers": 12, + "num_memory_blocks": 0, + "pad_token_id": 0, + "position_embedding_type": "absolute", + "problem_type": "single_label_classification", + "torch_dtype": "float32", + "transformers_version": "4.30.2", + "type_vocab_size": 2, + "vocab_size": 30000 +} diff --git a/pytorch_model.bin b/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..344e47aa17c73bf0c49d09077002cbf7150ad170 --- /dev/null +++ b/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a033a4afaf7bd6bb15d78d9e84df11a72583cb0b3c12c61ed1f16b4f66bccf +size 46763397 diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..205f9aa66656d6dbd571c708a776ef297d868d00 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c74f0fea927ae5a6dd93c20442abe9cb0ec0c27b1feb0ae3d88288eefccf96 +size 3899