diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..211f9478428c6be3d133406b0d33d64b0138c4ea --- /dev/null +++ b/config.json @@ -0,0 +1,15 @@ +{ + "vocab_size": 86583, + "dim_model": 4096, + "dim_ff" : 1024, + "num_layers" : 48, + "num_heads": 32, + "dim_head" : 40, + "dropout_p" : 0.0, + "position_bias_num_buckets" : 256, + "position_bias_num_segment_buckets": 256, + "position_bias_max_distance" : 2048, + "eps" : 1e-6, + "half" : true, + "mask_modules": [[false, false], [true, false], [false, false], [true, false], [true, true], [true, false], [true, true], [true, true], [false, false], [false, false], [true, true], [true, false], [true, false], [true, true], [false, false], [true, true], [false, false], [false, true], [true, false], [true, true], [false, false], [false, true], [true, true], [true, true], [false, false], [true, true], [false, false], [true, true], [true, true], [false, false], [true, true], [false, false], [true, true], [false, false], [true, true], [true, false], [true, true], [true, true], [true, true], [false, false], [true, true], [false, false], [true, true], [true, true], [false, false], [true, true], [false, false], [false, false]] +} diff --git a/pytorch_model.bin b/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..2d3e134b3618fa81233683fe619a575b39affdfe --- /dev/null +++ b/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4900eb67843181959ea77043a59a7d7e78fb688bd9ee61858658c10823c1b33 +size 2110668093 diff --git a/vocab.txt b/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..b977bdaf9898e679a19e338be19321bc1d6f7ede --- /dev/null +++ b/vocab.txt @@ -0,0 +1,86583 @@ + + + + + + + + + + +