Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- aggregator_config.json +1 -0
- projector_0.json +20 -0
- projector_0.pt +3 -0
- projector_1.json +20 -0
- projector_1.pt +3 -0
- projector_10.json +20 -0
- projector_10.pt +3 -0
- projector_11.json +20 -0
- projector_11.pt +3 -0
- projector_12.json +20 -0
- projector_12.pt +3 -0
- projector_13.json +20 -0
- projector_13.pt +3 -0
- projector_14.json +20 -0
- projector_14.pt +3 -0
- projector_15.json +20 -0
- projector_15.pt +3 -0
- projector_16.json +20 -0
- projector_16.pt +3 -0
- projector_17.json +20 -0
- projector_17.pt +3 -0
- projector_18.json +20 -0
- projector_18.pt +3 -0
- projector_19.json +20 -0
- projector_19.pt +3 -0
- projector_2.json +20 -0
- projector_2.pt +3 -0
- projector_20.json +20 -0
- projector_20.pt +3 -0
- projector_21.json +20 -0
- projector_21.pt +3 -0
- projector_22.json +20 -0
- projector_22.pt +3 -0
- projector_23.json +20 -0
- projector_23.pt +3 -0
- projector_24.json +20 -0
- projector_24.pt +3 -0
- projector_25.json +20 -0
- projector_25.pt +3 -0
- projector_26.json +20 -0
- projector_26.pt +3 -0
- projector_27.json +20 -0
- projector_27.pt +3 -0
- projector_3.json +20 -0
- projector_3.pt +3 -0
- projector_4.json +20 -0
- projector_4.pt +3 -0
- projector_5.json +20 -0
- projector_5.pt +3 -0
- projector_6.json +20 -0
aggregator_config.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{}
|
projector_0.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3ffcb1bcafd9595b3cd42c01e50fc1f812a04aa54e7804b7fb2dbe67ef36462
|
| 3 |
+
size 34145223
|
projector_1.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81830bc38f9d8600e30cc91ef23657c14201659eb68985342fc0d99f4b2288c8
|
| 3 |
+
size 34145223
|
projector_10.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_10.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50fd2c2caf3bae0c61b110e67f07ec98ff8619d5c3e2c11fb33ce0c3dc53f886
|
| 3 |
+
size 34145260
|
projector_11.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_11.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:17558797306549f27317d41ff5b73f74a59db34d7503bc62e854c35df8e2315e
|
| 3 |
+
size 34145260
|
projector_12.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_12.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2623ea8cac3f49063b9f78bff9a73f6f63afceecba854b246fa1d4d9fb533f1
|
| 3 |
+
size 34145260
|
projector_13.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_13.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:927f645ecd97b2a39b681d21197def470ceab26265703e8134ca3a7693debf9a
|
| 3 |
+
size 34145260
|
projector_14.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_14.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d11efdf54b2c3e9e7cef8036f98d7814bbdb3260b8701b0efbcb1d0f104f4c7
|
| 3 |
+
size 34145260
|
projector_15.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_15.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa38d18285736700f298357079b05338224959d74606e3ac7586b3167e424aad
|
| 3 |
+
size 34145260
|
projector_16.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_16.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d58bda06c5f9f241ef0bba45a2f8f05a67a0794bf013989d4aea0e01765ba16
|
| 3 |
+
size 34145260
|
projector_17.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_17.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb2ea53b60eef83b8eddc2419b40cf9c8042a5eb04c8aa6c3f6b2aed38a8c64f
|
| 3 |
+
size 34145260
|
projector_18.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_18.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba5ccbad02cb564cc419ac2894da70f523270e9f66fcab76524def7a80c78c2f
|
| 3 |
+
size 34145260
|
projector_19.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_19.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5ee9c7b28a77a3c93d00382015f122e5d2e508c36a13ab960a015e0aa241cfd
|
| 3 |
+
size 34145260
|
projector_2.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:abb288aa8a7f6a1631d1f257950a4375287518b227ac09a98f674de84aa6d5a9
|
| 3 |
+
size 34145223
|
projector_20.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_20.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a762579f0b6362a4df71b4d04c63191d4443762fe1e44611298be7475da9ce1
|
| 3 |
+
size 34145260
|
projector_21.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_21.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e3c97f05d6d18e4d81d2e86bc5a0516f3f004786c8afaf9c0026f36b317c3f5
|
| 3 |
+
size 34145260
|
projector_22.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_22.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4191d257f1392ff6a1040337f7fcf51168e1aed06103e92ab195a581752935c6
|
| 3 |
+
size 34145260
|
projector_23.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_23.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2784f88e57a9460cca8f2c1059e4070673137c83bbfac27ec2e38c599cfd5ecd
|
| 3 |
+
size 34145260
|
projector_24.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_24.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ebdffd4b8c2112bd64043ea23a0f05ac5ce4ebe70bfe1302bc61743cc4d0f444
|
| 3 |
+
size 34145260
|
projector_25.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_25.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e058b5e22d39a240f6f016dad0ceb314a40887c7c47006fd45b883e1d6218559
|
| 3 |
+
size 34145260
|
projector_26.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_26.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09e0fe14b7a05602f01a4d299ac39f8adac7dd4f2f729ad5f81a318647bfd14f
|
| 3 |
+
size 34145260
|
projector_27.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_27.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e04e43fee29dda4eb5cdca463aa67a4cf9b8d076e3dcfed18ae1bebed3883e2
|
| 3 |
+
size 34145260
|
projector_3.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:412f4da6bb70e3314b6f82b05279018a1cf8e4ba7028f76206b31b4b17d499f6
|
| 3 |
+
size 34145223
|
projector_4.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4a277663d1a631b60f28b04a09f1c8cd450c1d16cd9b9444f71feb25f9cd9ca8
|
| 3 |
+
size 34145223
|
projector_5.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|
projector_5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45806b09dbfe7f4cadcead2897b4da4f269f1b13ad1edc8cd8a44d309e16cbe8
|
| 3 |
+
size 34145223
|
projector_6.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"class": "C2CProjector",
|
| 3 |
+
"init_args": {
|
| 4 |
+
"source_dim": 64,
|
| 5 |
+
"target_dim": 128,
|
| 6 |
+
"source_num_heads": 2,
|
| 7 |
+
"target_num_heads": 8,
|
| 8 |
+
"hidden_dim": 1024,
|
| 9 |
+
"intermediate_dim": 1024,
|
| 10 |
+
"num_layers": 3,
|
| 11 |
+
"dropout": 0.1,
|
| 12 |
+
"initial_temperature": 1.0,
|
| 13 |
+
"final_temperature": 0.001,
|
| 14 |
+
"anneal_steps": 1929,
|
| 15 |
+
"dtype": {
|
| 16 |
+
"__type__": "torch.dtype",
|
| 17 |
+
"value": "bfloat16"
|
| 18 |
+
}
|
| 19 |
+
}
|
| 20 |
+
}
|