Training in progress, epoch 1

Files changed (13) hide show

config.json ADDED Viewed

+{
+  "architectures": [
+    "BertModel"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "LABEL_0": 0
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.51.3",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

eval/Information-Retrieval_evaluation_dim_128_results.csv ADDED Viewed


1	+ epoch,steps,cosine-Accuracy@1,cosine-Accuracy@3,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@10,cosine-NDCG@10,cosine-MAP@100
2	+ 1.0,2,0.30392156862745096,0.4411764705882353,0.5392156862745098,0.6078431372549019,0.30392156862745096,0.30392156862745096,0.14705882352941177,0.4411764705882353,0.10784313725490192,0.5392156862745098,0.060784313725490174,0.6078431372549019,0.39530034235916583,0.44634475989899486,0.40970204787491

eval/Information-Retrieval_evaluation_dim_256_results.csv ADDED Viewed


1	+ epoch,steps,cosine-Accuracy@1,cosine-Accuracy@3,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@10,cosine-NDCG@10,cosine-MAP@100
2	+ 1.0,2,0.38235294117647056,0.5490196078431373,0.6372549019607843,0.7156862745098039,0.38235294117647056,0.38235294117647056,0.18300653594771235,0.5490196078431373,0.12745098039215683,0.6372549019607843,0.07156862745098037,0.7156862745098039,0.4888149704326176,0.54335681809196,0.4995675194986066

eval/Information-Retrieval_evaluation_dim_512_results.csv ADDED Viewed


1	+ epoch,steps,cosine-Accuracy@1,cosine-Accuracy@3,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@10,cosine-NDCG@10,cosine-MAP@100
2	+ 1.0,2,0.4019607843137255,0.5490196078431373,0.6862745098039216,0.7745098039215687,0.4019607843137255,0.4019607843137255,0.18300653594771235,0.5490196078431373,0.13725490196078427,0.6862745098039216,0.07745098039215684,0.7745098039215687,0.512180983504513,0.5747623594698829,0.5205335935305102

eval/Information-Retrieval_evaluation_dim_64_results.csv ADDED Viewed


1	+ epoch,steps,cosine-Accuracy@1,cosine-Accuracy@3,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@10,cosine-NDCG@10,cosine-MAP@100
2	+ 1.0,2,0.24509803921568626,0.3333333333333333,0.4019607843137255,0.5392156862745098,0.24509803921568626,0.24509803921568626,0.11111111111111113,0.3333333333333333,0.08039215686274509,0.4019607843137255,0.05392156862745096,0.5392156862745098,0.31789993775287884,0.3694701009449219,0.33007283175656127

eval/Information-Retrieval_evaluation_dim_768_results.csv ADDED Viewed

+epoch,steps,cosine-Accuracy@1,cosine-Accuracy@3,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@10,cosine-NDCG@10,cosine-MAP@100
+1.0,2,0.4019607843137255,0.5784313725490197,0.7058823529411765,0.7843137254901961,0.4019607843137255,0.4019607843137255,0.19281045751633982,0.5784313725490197,0.14117647058823524,0.7058823529411765,0.07843137254901959,0.7843137254901961,0.5180944600062248,0.5817103636294029,0.5254064096528579
+2.0,4,0.4019607843137255,0.5686274509803921,0.7156862745098039,0.7843137254901961,0.4019607843137255,0.4019607843137255,0.18954248366013068,0.5686274509803921,0.14313725490196072,0.7156862745098039,0.07843137254901959,0.7843137254901961,0.5188958916900095,0.5825071579190789,0.5270476353988504

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:36018bef8f9420c1c36a3733587ecdbe6154cd398ac654b4806ac6d1b5f04fef
+size 437951328

runs/May01_03-32-52_modal/events.out.tfevents.1746070374.modal.2.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:afb60fca89541a9b5c408ebeb7163453cfce315b21ec10a13e5729bfb31704ef
+size 9635

special_tokens_map.json ADDED Viewed

+{
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

training_args.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:34f68e7249fafb5ae74934a63872dcbfd14151f53ec177488285b9e6ad59c16f
+size 6033

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff