willwade committed on
Commit
4864cd6
·
verified ·
1 Parent(s): d867a64

Upload 2 files

Browse files

From https://drive.google.com/file/d/1g31HGxJnnOwYl17b70ObFQZ1TSnPvRQv/view

Files changed (2) hide show
  1. model.json +45 -0
  2. model.pth +3 -0
model.json ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "accum_grad": 1,
3
+ "att_dropout_rate": 0.0,
4
+ "att_unit": 512,
5
+ "backend": "pytorch",
6
+ "beta1": 0.9,
7
+ "beta2": 0.999,
8
+ "config2": null,
9
+ "config3": null,
10
+ "debugmode": 1,
11
+ "dropout_rate": 0.0,
12
+ "dump_hdf5_path": null,
13
+ "early_stop_criterion": "validation/main/loss",
14
+ "emb_dropout_rate": 0.0,
15
+ "embed_unit": 128,
16
+ "epoch": 50,
17
+ "gradclip": 1.0,
18
+ "head": 8,
19
+ "layer": 16,
20
+ "lr": 0.0008,
21
+ "lr_cosine_total": 100000,
22
+ "lr_cosine_warmup": 1000,
23
+ "maxlen": 60,
24
+ "model_module": "transformer",
25
+ "n_vocab": 5049,
26
+ "ngpu": 8,
27
+ "opt": "adam",
28
+ "patience": 0,
29
+ "pos_enc": "none",
30
+ "report_interval_iters": 100,
31
+ "schedulers": [
32
+ [
33
+ "lr",
34
+ "cosine"
35
+ ]
36
+ ],
37
+ "seed": 1,
38
+ "sortagrad": 0,
39
+ "test_label": null,
40
+ "tie_weights": false,
41
+ "train_dtype": "float32",
42
+ "unit": 2048,
43
+ "verbose": 1,
44
+ "weight_decay": 0.0
45
+ }
model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c75aa39020dec98f432c8689b145d3f4cc407d4daa90a0c64202386c34f83c18
3
+ size 215076928