Variable decoder/block_000/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_000/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_000/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_000/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_000/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_000/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_000/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_000/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_000/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_000/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_000/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_001/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_001/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_001/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_001/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_001/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_001/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_001/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_001/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_001/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_001/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_001/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_002/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_002/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_002/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_002/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_002/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_002/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_002/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_002/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_002/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_002/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_002/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_003/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_003/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_003/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_003/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_003/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_003/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_003/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_003/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_003/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_003/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_003/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_004/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_004/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_004/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_004/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_004/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_004/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_004/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_004/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_004/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_004/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_004/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_005/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_005/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_005/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_005/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_005/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_005/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_005/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_005/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_005/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_005/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_005/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_006/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_006/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_006/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_006/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_006/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_006/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_006/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_006/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_006/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_006/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_006/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_007/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_007/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_007/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_007/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_007/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_007/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_007/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_007/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_007/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_007/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_007/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_008/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_008/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_008/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_008/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_008/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_008/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_008/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_008/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_008/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_008/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_008/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_009/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_009/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_009/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_009/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_009/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_009/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_009/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_009/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_009/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_009/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_009/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_010/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_010/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_010/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_010/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_010/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_010/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_010/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_010/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_010/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_010/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_010/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_011/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_011/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_011/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_011/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_011/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_011/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_011/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_011/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_011/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_011/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_011/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_012/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_012/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_012/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_012/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_012/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_012/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_012/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_012/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_012/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_012/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_012/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_013/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_013/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_013/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_013/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_013/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_013/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_013/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_013/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_013/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_013/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_013/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_014/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_014/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_014/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_014/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_014/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_014/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_014/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_014/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_014/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_014/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_014/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_015/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_015/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_015/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_015/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_015/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_015/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_015/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_015/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_015/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_015/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_015/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_016/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_016/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_016/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_016/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_016/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_016/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_016/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_016/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_016/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_016/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_016/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_017/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_017/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_017/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_017/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_017/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_017/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_017/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_017/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_017/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_017/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_017/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_018/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_018/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_018/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_018/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_018/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_018/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_018/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_018/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_018/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_018/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_018/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_019/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_019/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_019/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_019/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_019/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_019/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_019/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_019/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_019/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_019/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_019/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_020/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_020/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_020/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_020/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_020/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_020/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_020/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_020/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_020/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_020/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_020/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_021/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_021/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_021/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_021/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_021/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_021/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_021/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_021/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_021/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_021/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_021/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_022/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_022/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_022/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_022/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_022/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_022/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_022/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_022/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_022/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_022/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_022/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/block_023/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_023/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_023/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_023/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_023/layer_001/EncDecAttention/k                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_023/layer_001/EncDecAttention/o                size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable decoder/block_023/layer_001/EncDecAttention/q                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_023/layer_001/EncDecAttention/v                size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable decoder/block_023/layer_002/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_023/layer_002/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable decoder/block_023/layer_002/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable decoder/logits/kernel                                        size 32899072     slice_size 16449536     Shape[d_model=1024, vocab=32128]                            
Variable encoder/block_000/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_000/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_000/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_000/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_000/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_000/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_000/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_001/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_001/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_001/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_001/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_001/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_001/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_001/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_002/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_002/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_002/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_002/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_002/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_002/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_002/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_003/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_003/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_003/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_003/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_003/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_003/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_003/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_004/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_004/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_004/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_004/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_004/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_004/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_004/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_005/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_005/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_005/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_005/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_005/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_005/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_005/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_006/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_006/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_006/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_006/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_006/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_006/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_006/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_007/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_007/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_007/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_007/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_007/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_007/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_007/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_008/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_008/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_008/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_008/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_008/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_008/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_008/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_009/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_009/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_009/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_009/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_009/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_009/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_009/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_010/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_010/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_010/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_010/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_010/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_010/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_010/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_011/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_011/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_011/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_011/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_011/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_011/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_011/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_012/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_012/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_012/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_012/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_012/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_012/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_012/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_013/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_013/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_013/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_013/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_013/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_013/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_013/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_014/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_014/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_014/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_014/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_014/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_014/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_014/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_015/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_015/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_015/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_015/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_015/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_015/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_015/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_016/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_016/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_016/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_016/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_016/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_016/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_016/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_017/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_017/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_017/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_017/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_017/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_017/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_017/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_018/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_018/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_018/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_018/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_018/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_018/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_018/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_019/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_019/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_019/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_019/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_019/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_019/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_019/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_020/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_020/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_020/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_020/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_020/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_020/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_020/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_021/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_021/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_021/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_021/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_021/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_021/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_021/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_022/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_022/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_022/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_022/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_022/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_022/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_022/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable encoder/block_023/layer_000/SelfAttention/k                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_023/layer_000/SelfAttention/o                  size 1048576      slice_size 524288       Shape[heads=1024, d_model=1024]                             
Variable encoder/block_023/layer_000/SelfAttention/q                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_023/layer_000/SelfAttention/v                  size 1048576      slice_size 524288       Shape[d_model=1024, heads=1024]                             
Variable encoder/block_023/layer_001/DenseReluDense/wi_0/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_023/layer_001/DenseReluDense/wi_1/kernel       size 2883584      slice_size 1441792      Shape[d_model=1024, d_ff=2816]                              
Variable encoder/block_023/layer_001/DenseReluDense/wo/kernel         size 2883584      slice_size 1441792      Shape[d_ff=2816, d_model=1024]                              
Variable shared/embedding                                             size 32899072     slice_size 16449536     Shape[vocab=32128, d_model=1024]                            
Variable stacked/decoder/block_005/layer_000/layer_norm/scale         size 59392        slice_size 59392        Shape[stacked=58, d_model=1024]                             
    decoder/block_005/layer_000/layer_norm/scale
    decoder/block_005/layer_001/layer_norm/scale
    decoder/block_005/layer_002/layer_norm/scale
    decoder/block_006/layer_000/layer_norm/scale
    decoder/block_006/layer_001/layer_norm/scale
    decoder/block_006/layer_002/layer_norm/scale
    decoder/block_007/layer_000/layer_norm/scale
    decoder/block_007/layer_001/layer_norm/scale
    decoder/block_007/layer_002/layer_norm/scale
    decoder/block_008/layer_000/layer_norm/scale
    decoder/block_008/layer_001/layer_norm/scale
    decoder/block_008/layer_002/layer_norm/scale
    decoder/block_009/layer_000/layer_norm/scale
    decoder/block_009/layer_001/layer_norm/scale
    decoder/block_009/layer_002/layer_norm/scale
    decoder/block_010/layer_000/layer_norm/scale
    decoder/block_010/layer_001/layer_norm/scale
    decoder/block_010/layer_002/layer_norm/scale
    decoder/block_011/layer_000/layer_norm/scale
    decoder/block_011/layer_001/layer_norm/scale
    decoder/block_011/layer_002/layer_norm/scale
    decoder/block_012/layer_000/layer_norm/scale
    decoder/block_012/layer_001/layer_norm/scale
    decoder/block_012/layer_002/layer_norm/scale
    decoder/block_013/layer_000/layer_norm/scale
    decoder/block_013/layer_001/layer_norm/scale
    decoder/block_013/layer_002/layer_norm/scale
    decoder/block_014/layer_000/layer_norm/scale
    decoder/block_014/layer_001/layer_norm/scale
    decoder/block_014/layer_002/layer_norm/scale
    decoder/block_015/layer_000/layer_norm/scale
    decoder/block_015/layer_001/layer_norm/scale
    decoder/block_015/layer_002/layer_norm/scale
    decoder/block_016/layer_000/layer_norm/scale
    decoder/block_016/layer_001/layer_norm/scale
    decoder/block_016/layer_002/layer_norm/scale
    decoder/block_017/layer_000/layer_norm/scale
    decoder/block_017/layer_001/layer_norm/scale
    decoder/block_017/layer_002/layer_norm/scale
    decoder/block_018/layer_000/layer_norm/scale
    decoder/block_018/layer_001/layer_norm/scale
    decoder/block_018/layer_002/layer_norm/scale
    decoder/block_019/layer_000/layer_norm/scale
    decoder/block_019/layer_001/layer_norm/scale
    decoder/block_019/layer_002/layer_norm/scale
    decoder/block_020/layer_000/layer_norm/scale
    decoder/block_020/layer_001/layer_norm/scale
    decoder/block_020/layer_002/layer_norm/scale
    decoder/block_021/layer_000/layer_norm/scale
    decoder/block_021/layer_001/layer_norm/scale
    decoder/block_021/layer_002/layer_norm/scale
    decoder/block_022/layer_000/layer_norm/scale
    decoder/block_022/layer_001/layer_norm/scale
    decoder/block_022/layer_002/layer_norm/scale
    decoder/block_023/layer_000/layer_norm/scale
    decoder/block_023/layer_001/layer_norm/scale
    decoder/block_023/layer_002/layer_norm/scale
    decoder/final_layer_norm/scale
Variable stacked/encoder/block_000/layer_000/SelfAttention/relative_attention_bias size 1024         slice_size 512          Shape[stacked=2, heads=16, buckets=32]                      
    encoder/block_000/layer_000/SelfAttention/relative_attention_bias
    decoder/block_000/layer_000/SelfAttention/relative_attention_bias
Variable stacked/encoder/block_000/layer_000/layer_norm/scale         size 65536        slice_size 65536        Shape[stacked=64, d_model=1024]                             
    encoder/block_000/layer_000/layer_norm/scale
    encoder/block_000/layer_001/layer_norm/scale
    encoder/block_001/layer_000/layer_norm/scale
    encoder/block_001/layer_001/layer_norm/scale
    encoder/block_002/layer_000/layer_norm/scale
    encoder/block_002/layer_001/layer_norm/scale
    encoder/block_003/layer_000/layer_norm/scale
    encoder/block_003/layer_001/layer_norm/scale
    encoder/block_004/layer_000/layer_norm/scale
    encoder/block_004/layer_001/layer_norm/scale
    encoder/block_005/layer_000/layer_norm/scale
    encoder/block_005/layer_001/layer_norm/scale
    encoder/block_006/layer_000/layer_norm/scale
    encoder/block_006/layer_001/layer_norm/scale
    encoder/block_007/layer_000/layer_norm/scale
    encoder/block_007/layer_001/layer_norm/scale
    encoder/block_008/layer_000/layer_norm/scale
    encoder/block_008/layer_001/layer_norm/scale
    encoder/block_009/layer_000/layer_norm/scale
    encoder/block_009/layer_001/layer_norm/scale
    encoder/block_010/layer_000/layer_norm/scale
    encoder/block_010/layer_001/layer_norm/scale
    encoder/block_011/layer_000/layer_norm/scale
    encoder/block_011/layer_001/layer_norm/scale
    encoder/block_012/layer_000/layer_norm/scale
    encoder/block_012/layer_001/layer_norm/scale
    encoder/block_013/layer_000/layer_norm/scale
    encoder/block_013/layer_001/layer_norm/scale
    encoder/block_014/layer_000/layer_norm/scale
    encoder/block_014/layer_001/layer_norm/scale
    encoder/block_015/layer_000/layer_norm/scale
    encoder/block_015/layer_001/layer_norm/scale
    encoder/block_016/layer_000/layer_norm/scale
    encoder/block_016/layer_001/layer_norm/scale
    encoder/block_017/layer_000/layer_norm/scale
    encoder/block_017/layer_001/layer_norm/scale
    encoder/block_018/layer_000/layer_norm/scale
    encoder/block_018/layer_001/layer_norm/scale
    encoder/block_019/layer_000/layer_norm/scale
    encoder/block_019/layer_001/layer_norm/scale
    encoder/block_020/layer_000/layer_norm/scale
    encoder/block_020/layer_001/layer_norm/scale
    encoder/block_021/layer_000/layer_norm/scale
    encoder/block_021/layer_001/layer_norm/scale
    encoder/block_022/layer_000/layer_norm/scale
    encoder/block_022/layer_001/layer_norm/scale
    encoder/block_023/layer_000/layer_norm/scale
    encoder/block_023/layer_001/layer_norm/scale
    encoder/final_layer_norm/scale
    decoder/block_000/layer_000/layer_norm/scale
    decoder/block_000/layer_001/layer_norm/scale
    decoder/block_000/layer_002/layer_norm/scale
    decoder/block_001/layer_000/layer_norm/scale
    decoder/block_001/layer_001/layer_norm/scale
    decoder/block_001/layer_002/layer_norm/scale
    decoder/block_002/layer_000/layer_norm/scale
    decoder/block_002/layer_001/layer_norm/scale
    decoder/block_002/layer_002/layer_norm/scale
    decoder/block_003/layer_000/layer_norm/scale
    decoder/block_003/layer_001/layer_norm/scale
    decoder/block_003/layer_002/layer_norm/scale
    decoder/block_004/layer_000/layer_norm/scale
    decoder/block_004/layer_001/layer_norm/scale
    decoder/block_004/layer_002/layer_norm/scale
Trainable Variables            count: 437     Total size: 783150080        Total slice_size: 391637504      
All Variables                  count: 455     Total size: 784485120        Total slice_size: 392589696      
Counters:
allreduce: 4.82e+10
 allreduce/[0]: 1.42e+10
  allreduce/[0]/einsum_op: 1.25e+10
  allreduce/[0]/reduce_op: 1.67e+09
 allreduce/[1]: 3.4e+10
  allreduce/[1]/einsum_op: 3.4e+10
  allreduce/[1]/reduce_op: 1.45e+07
einsum: 2e+14
einsum_unique: 1.99e+14
output: 1.51e+11
 output/AddOperation: 3.05e+07
 output/Constant: 32
 output/EinsumOperation: 5.01e+10
 output/ImportOperation: 1.2e+08
 output/MinMaxOperation: 3.57e+04
 output/ReduceOperation: 2.65e+07
 output/ReshapeOperation: 7.52e+06
 output/ScalarAddOperation: 1.25e+10
 output/ScalarMultiplyOperation: 8.75e+07
 output/SlicewiseOperation: 6.27e+10
 output/StackOperation: 3.45e+07
 output/StackedVariable: 3.45e+07
 output/UnstackOperation: 3.45e+07
 output/Variable: 1.25e+10
 output/WhileLoopOperation: 1.25e+10
output_unique: 9.42e+09
 output_unique/AddOperation: 1.34e+06
 output_unique/Constant: 1
 output_unique/EinsumOperation: 3.13e+09
 output_unique/ImportOperation: 3.76e+06
 output_unique/MinMaxOperation: 1.12e+03
 output_unique/ReduceOperation: 1.21e+06
 output_unique/ReshapeOperation: 3.76e+06
 output_unique/ScalarAddOperation: 7.83e+08
 output_unique/ScalarMultiplyOperation: 3.88e+06
 output_unique/SlicewiseOperation: 3.92e+09
 output_unique/StackOperation: 1.46e+06
 output_unique/StackedVariable: 1.46e+06
 output_unique/UnstackOperation: 1.46e+06
 output_unique/Variable: 7.83e+08
 output_unique/WhileLoopOperation: 7.83e+08
variables: 7.84e+08
 variables/trainable: 7.83e+08
 variables/untrainable: 1.34e+06
