dd123 committed on
Commit
5c547c9
·
1 Parent(s): 2f0af45

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,14 +1,13 @@
1
  {
2
- "_name_or_path": "bert-base-uncased",
 
3
  "architectures": [
4
- "BertForSequenceClassification"
5
  ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "classifier_dropout": null,
8
- "gradient_checkpointing": false,
9
- "hidden_act": "gelu",
10
- "hidden_dropout_prob": 0.1,
11
- "hidden_size": 768,
12
  "id2label": {
13
  "0": "none",
14
  "1": "like",
@@ -23,7 +22,6 @@
23
  "9": "meme"
24
  },
25
  "initializer_range": 0.02,
26
- "intermediate_size": 3072,
27
  "label2id": {
28
  "express_abashed": "10",
29
  "express_sad": "7",
@@ -37,17 +35,17 @@
37
  "tease": "8",
38
  "unlike": "2"
39
  },
40
- "layer_norm_eps": 1e-12,
41
  "max_position_embeddings": 512,
42
- "model_type": "bert",
43
- "num_attention_heads": 12,
44
- "num_hidden_layers": 12,
45
  "pad_token_id": 0,
46
- "position_embedding_type": "absolute",
47
  "problem_type": "single_label_classification",
 
 
 
 
48
  "torch_dtype": "float32",
49
  "transformers_version": "4.27.1",
50
- "type_vocab_size": 2,
51
- "use_cache": true,
52
  "vocab_size": 30522
53
  }
 
1
  {
2
+ "_name_or_path": "distilbert-base-uncased",
3
+ "activation": "gelu",
4
  "architectures": [
5
+ "DistilBertForSequenceClassification"
6
  ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
 
 
11
  "id2label": {
12
  "0": "none",
13
  "1": "like",
 
22
  "9": "meme"
23
  },
24
  "initializer_range": 0.02,
 
25
  "label2id": {
26
  "express_abashed": "10",
27
  "express_sad": "7",
 
35
  "tease": "8",
36
  "unlike": "2"
37
  },
 
38
  "max_position_embeddings": 512,
39
+ "model_type": "distilbert",
40
+ "n_heads": 12,
41
+ "n_layers": 6,
42
  "pad_token_id": 0,
 
43
  "problem_type": "single_label_classification",
44
+ "qa_dropout": 0.1,
45
+ "seq_classif_dropout": 0.2,
46
+ "sinusoidal_pos_embds": false,
47
+ "tie_weights_": true,
48
  "torch_dtype": "float32",
49
  "transformers_version": "4.27.1",
 
 
50
  "vocab_size": 30522
51
  }
logs/1686801026.404191/events.out.tfevents.1686801026.ls.3972074.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bceeded2f3cc2c22040449bcc63184fa4f013a75257e040e4edd1037c379712e
3
+ size 5791
logs/events.out.tfevents.1686801026.ls.3972074.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53cd8c3f5c180664aa990e93928bb3977d60ae745795dd953828bd0b16baf501
3
+ size 4808
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e06cceef3eefe5e21831011c8afabb789e5584ff3feccfa1c6b5c87067e09b5
3
- size 438035573
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:408571547fd9b95d791961eea5cd4b63ca25fb0aa8621ec82223d02f0a42a012
3
+ size 267883181
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2006d2b8b6d65831100ae61207fc0c767eab5baf2f7791488cb5c789b93cf22d
3
  size 3579
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:758effd6e8891c593a864281f10a42e9c315404096144e88f495c543577d6278
3
  size 3579