bsz=1
input_len8000: 35.428616000000005 ms
input_len16000: 35.646415000000005 ms
input_len32000: 37.589977 ms
input_len64000: 43.910373 ms
input_len128000: 56.096137 ms

overlap
input_len8000: 34.355629 ms
input_len16000: 38.263941 ms
input_len32000: 36.361567 ms
input_len64000: 38.482003 ms
input_len128000: 47.545507 ms

bsz=4
input_len10240: 57.740753000000005 ms
input_len20480: 72.634816 ms
input_len36120: 79.891092 ms

overlap

input_len10240: 57.780038999999995 ms
input_len20480: 39.760764 ms
input_len36120: 46.388686 ms

input_len32000: 39.365274 ms
input_len8000: 37.602398 ms
input_len16000: 38.189326 ms
input_len32000: 39.321833999999996 ms
input_len64000: 41.70580700000001 ms
input_len128000: 47.886360999999994 ms
input_len60000: 109.923547 ms
input_len90000: 92.998627 ms
input_len128000: 97.787567 ms
input_len60000: 89.60024600000001 ms
input_len90000: 91.083353 ms
input_len128000: 96.131484 ms
input_len10000: 550.820692 ms
input_len20000: 547.66707 ms
input_len30000: 552.7096319999999 ms


input_len32000: 37.96298 ms
input_len32000: 48.597992999999995 ms
input_len32000: 63.631053 ms
input_len32000: 63.019977 ms
input_len32000: 74.692739 ms
input_len32000: 183.638766 ms
