tessaig committed 27 days ago

Commit

0cef54c

1 Parent(s): 1b14406

checkpoint added

Browse files

Files changed (44) hide show

i/checkpoint-586/config.json +45 -0
i/checkpoint-586/optimizer.pt +3 -0
i/checkpoint-586/pytorch_model.bin +3 -0
i/checkpoint-586/rng_state.pth +3 -0
i/checkpoint-586/scheduler.pt +3 -0
i/checkpoint-586/special_tokens_map.json +7 -0
i/checkpoint-586/tokenizer.json +0 -0
i/checkpoint-586/tokenizer_config.json +13 -0
i/checkpoint-586/trainer_state.json +40 -0
i/checkpoint-586/training_args.bin +3 -0
i/checkpoint-586/vocab.txt +0 -0
i_context/checkpoint-586/config.json +45 -0
i_context/checkpoint-586/optimizer.pt +3 -0
i_context/checkpoint-586/pytorch_model.bin +3 -0
i_context/checkpoint-586/rng_state.pth +3 -0
i_context/checkpoint-586/scheduler.pt +3 -0
i_context/checkpoint-586/special_tokens_map.json +7 -0
i_context/checkpoint-586/tokenizer.json +0 -0
i_context/checkpoint-586/tokenizer_config.json +13 -0
i_context/checkpoint-586/trainer_state.json +40 -0
i_context/checkpoint-586/training_args.bin +3 -0
i_context/checkpoint-586/vocab.txt +0 -0
l/checkpoint-586/config.json +45 -0
l/checkpoint-586/optimizer.pt +3 -0
l/checkpoint-586/pytorch_model.bin +3 -0
l/checkpoint-586/rng_state.pth +3 -0
l/checkpoint-586/scheduler.pt +3 -0
l/checkpoint-586/special_tokens_map.json +7 -0
l/checkpoint-586/tokenizer.json +0 -0
l/checkpoint-586/tokenizer_config.json +13 -0
l/checkpoint-586/trainer_state.json +40 -0
l/checkpoint-586/training_args.bin +3 -0
l/checkpoint-586/vocab.txt +0 -0
l_context/checkpoint-586/config.json +45 -0
l_context/checkpoint-586/optimizer.pt +3 -0
l_context/checkpoint-586/pytorch_model.bin +3 -0
l_context/checkpoint-586/rng_state.pth +3 -0
l_context/checkpoint-586/scheduler.pt +3 -0
l_context/checkpoint-586/special_tokens_map.json +7 -0
l_context/checkpoint-586/tokenizer.json +0 -0
l_context/checkpoint-586/tokenizer_config.json +13 -0
l_context/checkpoint-586/trainer_state.json +40 -0
l_context/checkpoint-586/training_args.bin +3 -0
l_context/checkpoint-586/vocab.txt +0 -0

i/checkpoint-586/config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "_name_or_path": "bert-large-cased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
+  "id2label": {
+    "0": "conflict",
+    "1": "inference",
+    "2": "no_rel",
+    "3": "rephrase"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "label2id": {
+    "conflict": 0,
+    "inference": 1,
+    "no_rel": 2,
+    "rephrase": 3
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.31.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 28996
+}

i/checkpoint-586/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c071b119f8a8d2def9bc6b38b6705d36d793826fa884507ce442aa400681bd6f
+size 2668897797

i/checkpoint-586/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:53075d76ecb13d2ffbd1bc6f724603c0ce9547fc44e33ce350a4d7f4a4334f22
+size 1334467889

i/checkpoint-586/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:02fb5630d7730234c36bdb4fb7e880dcb58367c0f810d19ba2082d8485b09c7c
+size 14575

i/checkpoint-586/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f99ebd2ec61759520f0786a379b7aa2b000e3a0998709cfd6554185df948834c
+size 627

i/checkpoint-586/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

i/checkpoint-586/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

i/checkpoint-586/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

i/checkpoint-586/trainer_state.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "best_metric": 1.0550591945648193,
+  "best_model_checkpoint": "clean_output/bert-large-cased/i/checkpoint-586",
+  "epoch": 2.0,
+  "global_step": 586,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.5,
+      "eval_loss": 1.1290996074676514,
+      "eval_runtime": 10.4475,
+      "eval_samples_per_second": 223.978,
+      "eval_steps_per_second": 28.045,
+      "step": 293
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 7.680097680097681e-06,
+      "loss": 1.174,
+      "step": 500
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.5547008547008547,
+      "eval_loss": 1.0550591945648193,
+      "eval_runtime": 10.4781,
+      "eval_samples_per_second": 223.323,
+      "eval_steps_per_second": 27.963,
+      "step": 586
+    }
+  ],
+  "max_steps": 1758,
+  "num_train_epochs": 6,
+  "total_flos": 6812609916643200.0,
+  "trial_name": null,
+  "trial_params": null
+}

i/checkpoint-586/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:06b07181fa39b72a45b37e999ef96b344aa5d73c1378eb6fbf7bcac9cb1ec357
+size 3963

i/checkpoint-586/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

i_context/checkpoint-586/config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "_name_or_path": "bert-large-cased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
+  "id2label": {
+    "0": "conflict",
+    "1": "inference",
+    "2": "no_rel",
+    "3": "rephrase"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "label2id": {
+    "conflict": 0,
+    "inference": 1,
+    "no_rel": 2,
+    "rephrase": 3
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.31.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 28996
+}

i_context/checkpoint-586/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:559ef893eee26ebfaf78999f62491999f95298cc468c8a8d40cc967d5a027384
+size 2668897797

i_context/checkpoint-586/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2d5c5a5fd576f61fff46221d942d38c6096f39c2362998e3e182fb3d5f14b6c7
+size 1334467889

i_context/checkpoint-586/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:02fb5630d7730234c36bdb4fb7e880dcb58367c0f810d19ba2082d8485b09c7c
+size 14575

i_context/checkpoint-586/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f99ebd2ec61759520f0786a379b7aa2b000e3a0998709cfd6554185df948834c
+size 627

i_context/checkpoint-586/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

i_context/checkpoint-586/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

i_context/checkpoint-586/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

i_context/checkpoint-586/trainer_state.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "best_metric": 1.0713884830474854,
+  "best_model_checkpoint": "clean_output/bert-large-cased/i_context/checkpoint-586",
+  "epoch": 2.0,
+  "global_step": 586,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.505982905982906,
+      "eval_loss": 1.1140286922454834,
+      "eval_runtime": 10.4473,
+      "eval_samples_per_second": 223.981,
+      "eval_steps_per_second": 28.045,
+      "step": 293
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 7.680097680097681e-06,
+      "loss": 1.1604,
+      "step": 500
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.5525641025641026,
+      "eval_loss": 1.0713884830474854,
+      "eval_runtime": 10.4432,
+      "eval_samples_per_second": 224.069,
+      "eval_steps_per_second": 28.056,
+      "step": 586
+    }
+  ],
+  "max_steps": 1758,
+  "num_train_epochs": 6,
+  "total_flos": 6812609916643200.0,
+  "trial_name": null,
+  "trial_params": null
+}

i_context/checkpoint-586/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:06df57ca0dfd63b697410147ad9225e8f4f93e6f69a771a4a4be4228b0806d53
+size 4027

i_context/checkpoint-586/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

l/checkpoint-586/config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "_name_or_path": "bert-large-cased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
+  "id2label": {
+    "0": "conflict",
+    "1": "inference",
+    "2": "no_rel",
+    "3": "rephrase"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "label2id": {
+    "conflict": 0,
+    "inference": 1,
+    "no_rel": 2,
+    "rephrase": 3
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.31.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 28996
+}

l/checkpoint-586/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2fe404824bff6205d153485212c451c040068a75cfd640442d71423911e117e3
+size 2668897797

l/checkpoint-586/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0e207d853bb70695bb8fc98af2e739a914dd03304bb635ee1a1349832a999f82
+size 1334467889

l/checkpoint-586/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:02fb5630d7730234c36bdb4fb7e880dcb58367c0f810d19ba2082d8485b09c7c
+size 14575

l/checkpoint-586/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f99ebd2ec61759520f0786a379b7aa2b000e3a0998709cfd6554185df948834c
+size 627

l/checkpoint-586/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

l/checkpoint-586/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

l/checkpoint-586/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

l/checkpoint-586/trainer_state.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "best_metric": 1.0608546733856201,
+  "best_model_checkpoint": "clean_output/bert-large-cased/l/checkpoint-586",
+  "epoch": 2.0,
+  "global_step": 586,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.5034188034188034,
+      "eval_loss": 1.1321873664855957,
+      "eval_runtime": 10.4655,
+      "eval_samples_per_second": 223.593,
+      "eval_steps_per_second": 27.997,
+      "step": 293
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 7.680097680097681e-06,
+      "loss": 1.2069,
+      "step": 500
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.5576923076923077,
+      "eval_loss": 1.0608546733856201,
+      "eval_runtime": 10.4441,
+      "eval_samples_per_second": 224.049,
+      "eval_steps_per_second": 28.054,
+      "step": 586
+    }
+  ],
+  "max_steps": 1758,
+  "num_train_epochs": 6,
+  "total_flos": 6812609916643200.0,
+  "trial_name": null,
+  "trial_params": null
+}

l/checkpoint-586/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee04b6d4116139a70cf03a37ca11d73bb196bd288da167e5c8cb8cff4b157379
+size 3963

l/checkpoint-586/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

l_context/checkpoint-586/config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "_name_or_path": "bert-large-cased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
+  "id2label": {
+    "0": "conflict",
+    "1": "inference",
+    "2": "no_rel",
+    "3": "rephrase"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 4096,
+  "label2id": {
+    "conflict": 0,
+    "inference": 1,
+    "no_rel": 2,
+    "rephrase": 3
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.31.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 28996
+}

l_context/checkpoint-586/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e768a441837a5d026b0a1265654666f012f6be5229e031ab813984c514edb280
+size 2668897797

l_context/checkpoint-586/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5810cde225e21af1ca4682005c1744989599639719aac93bb563d447d9852036
+size 1334467889

l_context/checkpoint-586/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:02fb5630d7730234c36bdb4fb7e880dcb58367c0f810d19ba2082d8485b09c7c
+size 14575

l_context/checkpoint-586/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f99ebd2ec61759520f0786a379b7aa2b000e3a0998709cfd6554185df948834c
+size 627

l_context/checkpoint-586/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

l_context/checkpoint-586/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

l_context/checkpoint-586/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

l_context/checkpoint-586/trainer_state.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "best_metric": 1.117621898651123,
+  "best_model_checkpoint": "clean_output/bert-large-cased/l_context/checkpoint-586",
+  "epoch": 2.0,
+  "global_step": 586,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.49786324786324787,
+      "eval_loss": 1.1456269025802612,
+      "eval_runtime": 10.4236,
+      "eval_samples_per_second": 224.491,
+      "eval_steps_per_second": 28.109,
+      "step": 293
+    },
+    {
+      "epoch": 1.71,
+      "learning_rate": 7.680097680097681e-06,
+      "loss": 1.2045,
+      "step": 500
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.5205128205128206,
+      "eval_loss": 1.117621898651123,
+      "eval_runtime": 10.4232,
+      "eval_samples_per_second": 224.499,
+      "eval_steps_per_second": 28.11,
+      "step": 586
+    }
+  ],
+  "max_steps": 1758,
+  "num_train_epochs": 6,
+  "total_flos": 6812609916643200.0,
+  "trial_name": null,
+  "trial_params": null
+}

l_context/checkpoint-586/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:38d41b07860c38688aa574373cb58e67ae3cae813d8b9e26d4b717ab98c7e820
+size 4027

l_context/checkpoint-586/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff