Preliminary state
This commit is contained in:
+3
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:aa6e12899b0d9f2fc819ce141dc1d43f9e29f4aebafb3b690b61c3a95537b322
|
||||
size 384
|
||||
+3
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:1dfaa4971d98dcc0b9cefe1f59b5d83bdb15300aba3851d8bb2117567321600e
|
||||
size 384
|
||||
+3
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:cf6482c376ff2dee008e3277a0b87bd034e85e96d0b5959b319c1af0cab8dfff
|
||||
size 6583
|
||||
@@ -0,0 +1,12 @@
|
||||
{
|
||||
"command": "grad",
|
||||
"network": "resources/transformer_single_block_network.mininn",
|
||||
"inputs": [
|
||||
"resources/input_0.bin"
|
||||
],
|
||||
"expected_outputs": [
|
||||
"expected_grad_0.bin"
|
||||
],
|
||||
"description": "single-head transformer block (pre-norm): LN\u2192attention(Q/K/V dot+softmax)\u2192residual\u2192LN\u2192FFN(gelu)\u2192residual\u2192gelu; seq=6, d_model=8, d_head=4, d_ff=16; softmax via exp+reduce_sum+reciprocal; upsampling matrix via dot",
|
||||
"points": 3
|
||||
}
|
||||
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:e9687215d2ac36923bd0dbbfe01a513adbd7cd9cd7cd553477cc6cf2a7c038b4
|
||||
size 384
|
||||
+3
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:1dfaa4971d98dcc0b9cefe1f59b5d83bdb15300aba3851d8bb2117567321600e
|
||||
size 384
|
||||
+3
@@ -0,0 +1,3 @@
|
||||
version https://git-lfs.github.com/spec/v1
|
||||
oid sha256:a3e418b35d338902d487e4a67d3ccbbe4ad408b69d478953f62021b40ad71042
|
||||
size 13102
|
||||
@@ -0,0 +1,12 @@
|
||||
{
|
||||
"command": "grad",
|
||||
"network": "resources/transformer_two_blocks_network.mininn",
|
||||
"inputs": [
|
||||
"resources/input_0.bin"
|
||||
],
|
||||
"expected_outputs": [
|
||||
"expected_grad_0.bin"
|
||||
],
|
||||
"description": "two stacked pre-norm single-head transformer blocks; each block has independent Q/K/V/O/FFN weights; seq=6, d_model=8, d_head=4, d_ff=16",
|
||||
"points": 3
|
||||
}
|
||||
Reference in New Issue
Block a user