14-10:
  model.blocks.0.attn.k: 4
  model.blocks.0.attn.proj: 4
  model.blocks.0.attn.q: 4
  model.blocks.0.attn.v: 4
  model.blocks.0.attn_temp.k: 4
  model.blocks.0.attn_temp.proj: 4
  model.blocks.0.attn_temp.q: 4
  model.blocks.0.attn_temp.v: 4
  model.blocks.0.cross_attn.kv_linear: 4
  model.blocks.0.cross_attn.proj: 4
  model.blocks.0.cross_attn.q_linear: 4
  model.blocks.0.mlp.fc1: 8
  model.blocks.0.mlp.fc2: 8
  model.blocks.1.attn.k: 4
  model.blocks.1.attn.proj: 4
  model.blocks.1.attn.q: 4
  model.blocks.1.attn.v: 4
  model.blocks.1.attn_temp.k: 4
  model.blocks.1.attn_temp.proj: 4
  model.blocks.1.attn_temp.q: 4
  model.blocks.1.attn_temp.v: 4
  model.blocks.1.cross_attn.kv_linear: 4
  model.blocks.1.cross_attn.proj: 4
  model.blocks.1.cross_attn.q_linear: 4
  model.blocks.1.mlp.fc1: 8
  model.blocks.1.mlp.fc2: 8
  model.blocks.10.attn.k: 4
  model.blocks.10.attn.proj: 4
  model.blocks.10.attn.q: 4
  model.blocks.10.attn.v: 4
  model.blocks.10.attn_temp.k: 4
  model.blocks.10.attn_temp.proj: 4
  model.blocks.10.attn_temp.q: 4
  model.blocks.10.attn_temp.v: 4
  model.blocks.10.cross_attn.kv_linear: 4
  model.blocks.10.cross_attn.proj: 4
  model.blocks.10.cross_attn.q_linear: 4
  model.blocks.10.mlp.fc1: 8
  model.blocks.10.mlp.fc2: 8
  model.blocks.11.attn.k: 4
  model.blocks.11.attn.proj: 4
  model.blocks.11.attn.q: 4
  model.blocks.11.attn.v: 4
  model.blocks.11.attn_temp.k: 4
  model.blocks.11.attn_temp.proj: 4
  model.blocks.11.attn_temp.q: 4
  model.blocks.11.attn_temp.v: 4
  model.blocks.11.cross_attn.kv_linear: 4
  model.blocks.11.cross_attn.proj: 4
  model.blocks.11.cross_attn.q_linear: 4
  model.blocks.11.mlp.fc1: 8
  model.blocks.11.mlp.fc2: 8
  model.blocks.12.attn.k: 4
  model.blocks.12.attn.proj: 4
  model.blocks.12.attn.q: 4
  model.blocks.12.attn.v: 4
  model.blocks.12.attn_temp.k: 4
  model.blocks.12.attn_temp.proj: 4
  model.blocks.12.attn_temp.q: 4
  model.blocks.12.attn_temp.v: 4
  model.blocks.12.cross_attn.kv_linear: 4
  model.blocks.12.cross_attn.proj: 4
  model.blocks.12.cross_attn.q_linear: 4
  model.blocks.12.mlp.fc1: 8
  model.blocks.12.mlp.fc2: 8
  model.blocks.13.attn.k: 4
  model.blocks.13.attn.proj: 4
  model.blocks.13.attn.q: 4
  model.blocks.13.attn.v: 4
  model.blocks.13.attn_temp.k: 4
  model.blocks.13.attn_temp.proj: 4
  model.blocks.13.attn_temp.q: 4
  model.blocks.13.attn_temp.v: 4
  model.blocks.13.cross_attn.kv_linear: 4
  model.blocks.13.cross_attn.proj: 4
  model.blocks.13.cross_attn.q_linear: 4
  model.blocks.13.mlp.fc1: 8
  model.blocks.13.mlp.fc2: 8
  model.blocks.14.attn.k: 4
  model.blocks.14.attn.proj: 4
  model.blocks.14.attn.q: 4
  model.blocks.14.attn.v: 4
  model.blocks.14.attn_temp.k: 4
  model.blocks.14.attn_temp.proj: 4
  model.blocks.14.attn_temp.q: 4
  model.blocks.14.attn_temp.v: 4
  model.blocks.14.cross_attn.kv_linear: 4
  model.blocks.14.cross_attn.proj: 4
  model.blocks.14.cross_attn.q_linear: 4
  model.blocks.14.mlp.fc1: 8
  model.blocks.14.mlp.fc2: 8
  model.blocks.15.attn.k: 4
  model.blocks.15.attn.proj: 4
  model.blocks.15.attn.q: 4
  model.blocks.15.attn.v: 4
  model.blocks.15.attn_temp.k: 4
  model.blocks.15.attn_temp.proj: 4
  model.blocks.15.attn_temp.q: 4
  model.blocks.15.attn_temp.v: 4
  model.blocks.15.cross_attn.kv_linear: 4
  model.blocks.15.cross_attn.proj: 4
  model.blocks.15.cross_attn.q_linear: 4
  model.blocks.15.mlp.fc1: 8
  model.blocks.15.mlp.fc2: 8
  model.blocks.16.attn.k: 4
  model.blocks.16.attn.proj: 4
  model.blocks.16.attn.q: 4
  model.blocks.16.attn.v: 4
  model.blocks.16.attn_temp.k: 4
  model.blocks.16.attn_temp.proj: 4
  model.blocks.16.attn_temp.q: 4
  model.blocks.16.attn_temp.v: 4
  model.blocks.16.cross_attn.kv_linear: 4
  model.blocks.16.cross_attn.proj: 4
  model.blocks.16.cross_attn.q_linear: 4
  model.blocks.16.mlp.fc1: 8
  model.blocks.16.mlp.fc2: 8
  model.blocks.17.attn.k: 4
  model.blocks.17.attn.proj: 4
  model.blocks.17.attn.q: 4
  model.blocks.17.attn.v: 4
  model.blocks.17.attn_temp.k: 4
  model.blocks.17.attn_temp.proj: 4
  model.blocks.17.attn_temp.q: 4
  model.blocks.17.attn_temp.v: 4
  model.blocks.17.cross_attn.kv_linear: 4
  model.blocks.17.cross_attn.proj: 4
  model.blocks.17.cross_attn.q_linear: 4
  model.blocks.17.mlp.fc1: 8
  model.blocks.17.mlp.fc2: 8
  model.blocks.18.attn.k: 4
  model.blocks.18.attn.proj: 4
  model.blocks.18.attn.q: 4
  model.blocks.18.attn.v: 4
  model.blocks.18.attn_temp.k: 4
  model.blocks.18.attn_temp.proj: 4
  model.blocks.18.attn_temp.q: 4
  model.blocks.18.attn_temp.v: 4
  model.blocks.18.cross_attn.kv_linear: 4
  model.blocks.18.cross_attn.proj: 4
  model.blocks.18.cross_attn.q_linear: 4
  model.blocks.18.mlp.fc1: 8
  model.blocks.18.mlp.fc2: 8
  model.blocks.19.attn.k: 4
  model.blocks.19.attn.proj: 4
  model.blocks.19.attn.q: 4
  model.blocks.19.attn.v: 4
  model.blocks.19.attn_temp.k: 4
  model.blocks.19.attn_temp.proj: 4
  model.blocks.19.attn_temp.q: 4
  model.blocks.19.attn_temp.v: 4
  model.blocks.19.cross_attn.kv_linear: 4
  model.blocks.19.cross_attn.proj: 4
  model.blocks.19.cross_attn.q_linear: 4
  model.blocks.19.mlp.fc1: 8
  model.blocks.19.mlp.fc2: 8
  model.blocks.2.attn.k: 4
  model.blocks.2.attn.proj: 4
  model.blocks.2.attn.q: 4
  model.blocks.2.attn.v: 4
  model.blocks.2.attn_temp.k: 4
  model.blocks.2.attn_temp.proj: 4
  model.blocks.2.attn_temp.q: 4
  model.blocks.2.attn_temp.v: 4
  model.blocks.2.cross_attn.kv_linear: 4
  model.blocks.2.cross_attn.proj: 4
  model.blocks.2.cross_attn.q_linear: 4
  model.blocks.2.mlp.fc1: 8
  model.blocks.2.mlp.fc2: 8
  model.blocks.20.attn.k: 4
  model.blocks.20.attn.proj: 4
  model.blocks.20.attn.q: 4
  model.blocks.20.attn.v: 4
  model.blocks.20.attn_temp.k: 4
  model.blocks.20.attn_temp.proj: 4
  model.blocks.20.attn_temp.q: 4
  model.blocks.20.attn_temp.v: 4
  model.blocks.20.cross_attn.kv_linear: 4
  model.blocks.20.cross_attn.proj: 4
  model.blocks.20.cross_attn.q_linear: 4
  model.blocks.20.mlp.fc1: 8
  model.blocks.20.mlp.fc2: 8
  model.blocks.21.attn.k: 4
  model.blocks.21.attn.proj: 4
  model.blocks.21.attn.q: 4
  model.blocks.21.attn.v: 4
  model.blocks.21.attn_temp.k: 4
  model.blocks.21.attn_temp.proj: 4
  model.blocks.21.attn_temp.q: 4
  model.blocks.21.attn_temp.v: 4
  model.blocks.21.cross_attn.kv_linear: 4
  model.blocks.21.cross_attn.proj: 4
  model.blocks.21.cross_attn.q_linear: 4
  model.blocks.21.mlp.fc1: 8
  model.blocks.21.mlp.fc2: 8
  model.blocks.22.attn.k: 4
  model.blocks.22.attn.proj: 4
  model.blocks.22.attn.q: 4
  model.blocks.22.attn.v: 4
  model.blocks.22.attn_temp.k: 4
  model.blocks.22.attn_temp.proj: 4
  model.blocks.22.attn_temp.q: 4
  model.blocks.22.attn_temp.v: 4
  model.blocks.22.cross_attn.kv_linear: 4
  model.blocks.22.cross_attn.proj: 4
  model.blocks.22.cross_attn.q_linear: 4
  model.blocks.22.mlp.fc1: 8
  model.blocks.22.mlp.fc2: 8
  model.blocks.23.attn.k: 4
  model.blocks.23.attn.proj: 4
  model.blocks.23.attn.q: 4
  model.blocks.23.attn.v: 4
  model.blocks.23.attn_temp.k: 4
  model.blocks.23.attn_temp.proj: 4
  model.blocks.23.attn_temp.q: 4
  model.blocks.23.attn_temp.v: 4
  model.blocks.23.cross_attn.kv_linear: 4
  model.blocks.23.cross_attn.proj: 4
  model.blocks.23.cross_attn.q_linear: 4
  model.blocks.23.mlp.fc1: 8
  model.blocks.23.mlp.fc2: 8
  model.blocks.24.attn.k: 4
  model.blocks.24.attn.proj: 4
  model.blocks.24.attn.q: 4
  model.blocks.24.attn.v: 4
  model.blocks.24.attn_temp.k: 4
  model.blocks.24.attn_temp.proj: 4
  model.blocks.24.attn_temp.q: 4
  model.blocks.24.attn_temp.v: 4
  model.blocks.24.cross_attn.kv_linear: 4
  model.blocks.24.cross_attn.proj: 4
  model.blocks.24.cross_attn.q_linear: 4
  model.blocks.24.mlp.fc1: 8
  model.blocks.24.mlp.fc2: 8
  model.blocks.25.attn.k: 4
  model.blocks.25.attn.proj: 4
  model.blocks.25.attn.q: 4
  model.blocks.25.attn.v: 4
  model.blocks.25.attn_temp.k: 4
  model.blocks.25.attn_temp.proj: 4
  model.blocks.25.attn_temp.q: 4
  model.blocks.25.attn_temp.v: 4
  model.blocks.25.cross_attn.kv_linear: 4
  model.blocks.25.cross_attn.proj: 4
  model.blocks.25.cross_attn.q_linear: 4
  model.blocks.25.mlp.fc1: 8
  model.blocks.25.mlp.fc2: 8
  model.blocks.26.attn.k: 4
  model.blocks.26.attn.proj: 4
  model.blocks.26.attn.q: 4
  model.blocks.26.attn.v: 4
  model.blocks.26.attn_temp.k: 4
  model.blocks.26.attn_temp.proj: 4
  model.blocks.26.attn_temp.q: 4
  model.blocks.26.attn_temp.v: 4
  model.blocks.26.cross_attn.kv_linear: 4
  model.blocks.26.cross_attn.proj: 4
  model.blocks.26.cross_attn.q_linear: 4
  model.blocks.26.mlp.fc1: 8
  model.blocks.26.mlp.fc2: 8
  model.blocks.27.attn.k: 4
  model.blocks.27.attn.proj: 4
  model.blocks.27.attn.q: 4
  model.blocks.27.attn.v: 4
  model.blocks.27.attn_temp.k: 4
  model.blocks.27.attn_temp.proj: 4
  model.blocks.27.attn_temp.q: 4
  model.blocks.27.attn_temp.v: 4
  model.blocks.27.cross_attn.kv_linear: 4
  model.blocks.27.cross_attn.proj: 4
  model.blocks.27.cross_attn.q_linear: 4
  model.blocks.27.mlp.fc1: 8
  model.blocks.27.mlp.fc2: 8
  model.blocks.3.attn.k: 4
  model.blocks.3.attn.proj: 4
  model.blocks.3.attn.q: 4
  model.blocks.3.attn.v: 4
  model.blocks.3.attn_temp.k: 4
  model.blocks.3.attn_temp.proj: 4
  model.blocks.3.attn_temp.q: 4
  model.blocks.3.attn_temp.v: 4
  model.blocks.3.cross_attn.kv_linear: 4
  model.blocks.3.cross_attn.proj: 4
  model.blocks.3.cross_attn.q_linear: 4
  model.blocks.3.mlp.fc1: 8
  model.blocks.3.mlp.fc2: 8
  model.blocks.4.attn.k: 4
  model.blocks.4.attn.proj: 4
  model.blocks.4.attn.q: 4
  model.blocks.4.attn.v: 4
  model.blocks.4.attn_temp.k: 4
  model.blocks.4.attn_temp.proj: 4
  model.blocks.4.attn_temp.q: 4
  model.blocks.4.attn_temp.v: 4
  model.blocks.4.cross_attn.kv_linear: 4
  model.blocks.4.cross_attn.proj: 4
  model.blocks.4.cross_attn.q_linear: 4
  model.blocks.4.mlp.fc1: 8
  model.blocks.4.mlp.fc2: 8
  model.blocks.5.attn.k: 4
  model.blocks.5.attn.proj: 4
  model.blocks.5.attn.q: 4
  model.blocks.5.attn.v: 4
  model.blocks.5.attn_temp.k: 4
  model.blocks.5.attn_temp.proj: 4
  model.blocks.5.attn_temp.q: 4
  model.blocks.5.attn_temp.v: 4
  model.blocks.5.cross_attn.kv_linear: 4
  model.blocks.5.cross_attn.proj: 4
  model.blocks.5.cross_attn.q_linear: 4
  model.blocks.5.mlp.fc1: 8
  model.blocks.5.mlp.fc2: 8
  model.blocks.6.attn.k: 4
  model.blocks.6.attn.proj: 4
  model.blocks.6.attn.q: 4
  model.blocks.6.attn.v: 4
  model.blocks.6.attn_temp.k: 4
  model.blocks.6.attn_temp.proj: 4
  model.blocks.6.attn_temp.q: 4
  model.blocks.6.attn_temp.v: 4
  model.blocks.6.cross_attn.kv_linear: 4
  model.blocks.6.cross_attn.proj: 4
  model.blocks.6.cross_attn.q_linear: 4
  model.blocks.6.mlp.fc1: 8
  model.blocks.6.mlp.fc2: 8
  model.blocks.7.attn.k: 4
  model.blocks.7.attn.proj: 4
  model.blocks.7.attn.q: 4
  model.blocks.7.attn.v: 4
  model.blocks.7.attn_temp.k: 4
  model.blocks.7.attn_temp.proj: 4
  model.blocks.7.attn_temp.q: 4
  model.blocks.7.attn_temp.v: 4
  model.blocks.7.cross_attn.kv_linear: 4
  model.blocks.7.cross_attn.proj: 4
  model.blocks.7.cross_attn.q_linear: 4
  model.blocks.7.mlp.fc1: 8
  model.blocks.7.mlp.fc2: 8
  model.blocks.8.attn.k: 4
  model.blocks.8.attn.proj: 4
  model.blocks.8.attn.q: 4
  model.blocks.8.attn.v: 4
  model.blocks.8.attn_temp.k: 4
  model.blocks.8.attn_temp.proj: 4
  model.blocks.8.attn_temp.q: 4
  model.blocks.8.attn_temp.v: 4
  model.blocks.8.cross_attn.kv_linear: 4
  model.blocks.8.cross_attn.proj: 4
  model.blocks.8.cross_attn.q_linear: 4
  model.blocks.8.mlp.fc1: 8
  model.blocks.8.mlp.fc2: 8
  model.blocks.9.attn.k: 4
  model.blocks.9.attn.proj: 4
  model.blocks.9.attn.q: 4
  model.blocks.9.attn.v: 4
  model.blocks.9.attn_temp.k: 4
  model.blocks.9.attn_temp.proj: 4
  model.blocks.9.attn_temp.q: 4
  model.blocks.9.attn_temp.v: 4
  model.blocks.9.cross_attn.kv_linear: 4
  model.blocks.9.cross_attn.proj: 4
  model.blocks.9.cross_attn.q_linear: 4
  model.blocks.9.mlp.fc1: 8
  model.blocks.9.mlp.fc2: 8
19-15:
  model.blocks.0.attn.k: 8
  model.blocks.0.attn.proj: 8
  model.blocks.0.attn.q: 8
  model.blocks.0.attn.v: 8
  model.blocks.0.attn_temp.k: 8
  model.blocks.0.attn_temp.proj: 8
  model.blocks.0.attn_temp.q: 8
  model.blocks.0.attn_temp.v: 8
  model.blocks.0.cross_attn.kv_linear: 8
  model.blocks.0.cross_attn.proj: 8
  model.blocks.0.cross_attn.q_linear: 8
  model.blocks.0.mlp.fc1: 8
  model.blocks.0.mlp.fc2: 8
  model.blocks.1.attn.k: 8
  model.blocks.1.attn.proj: 8
  model.blocks.1.attn.q: 8
  model.blocks.1.attn.v: 8
  model.blocks.1.attn_temp.k: 8
  model.blocks.1.attn_temp.proj: 8
  model.blocks.1.attn_temp.q: 8
  model.blocks.1.attn_temp.v: 8
  model.blocks.1.cross_attn.kv_linear: 8
  model.blocks.1.cross_attn.proj: 8
  model.blocks.1.cross_attn.q_linear: 8
  model.blocks.1.mlp.fc1: 8
  model.blocks.1.mlp.fc2: 8
  model.blocks.10.attn.k: 8
  model.blocks.10.attn.proj: 8
  model.blocks.10.attn.q: 8
  model.blocks.10.attn.v: 8
  model.blocks.10.attn_temp.k: 8
  model.blocks.10.attn_temp.proj: 8
  model.blocks.10.attn_temp.q: 8
  model.blocks.10.attn_temp.v: 8
  model.blocks.10.cross_attn.kv_linear: 8
  model.blocks.10.cross_attn.proj: 8
  model.blocks.10.cross_attn.q_linear: 8
  model.blocks.10.mlp.fc1: 8
  model.blocks.10.mlp.fc2: 8
  model.blocks.11.attn.k: 8
  model.blocks.11.attn.proj: 8
  model.blocks.11.attn.q: 8
  model.blocks.11.attn.v: 8
  model.blocks.11.attn_temp.k: 8
  model.blocks.11.attn_temp.proj: 8
  model.blocks.11.attn_temp.q: 8
  model.blocks.11.attn_temp.v: 8
  model.blocks.11.cross_attn.kv_linear: 8
  model.blocks.11.cross_attn.proj: 8
  model.blocks.11.cross_attn.q_linear: 8
  model.blocks.11.mlp.fc1: 8
  model.blocks.11.mlp.fc2: 8
  model.blocks.12.attn.k: 8
  model.blocks.12.attn.proj: 8
  model.blocks.12.attn.q: 8
  model.blocks.12.attn.v: 8
  model.blocks.12.attn_temp.k: 8
  model.blocks.12.attn_temp.proj: 8
  model.blocks.12.attn_temp.q: 8
  model.blocks.12.attn_temp.v: 8
  model.blocks.12.cross_attn.kv_linear: 8
  model.blocks.12.cross_attn.proj: 8
  model.blocks.12.cross_attn.q_linear: 8
  model.blocks.12.mlp.fc1: 8
  model.blocks.12.mlp.fc2: 8
  model.blocks.13.attn.k: 8
  model.blocks.13.attn.proj: 8
  model.blocks.13.attn.q: 8
  model.blocks.13.attn.v: 8
  model.blocks.13.attn_temp.k: 8
  model.blocks.13.attn_temp.proj: 8
  model.blocks.13.attn_temp.q: 8
  model.blocks.13.attn_temp.v: 8
  model.blocks.13.cross_attn.kv_linear: 8
  model.blocks.13.cross_attn.proj: 8
  model.blocks.13.cross_attn.q_linear: 8
  model.blocks.13.mlp.fc1: 8
  model.blocks.13.mlp.fc2: 8
  model.blocks.14.attn.k: 8
  model.blocks.14.attn.proj: 8
  model.blocks.14.attn.q: 8
  model.blocks.14.attn.v: 8
  model.blocks.14.attn_temp.k: 8
  model.blocks.14.attn_temp.proj: 8
  model.blocks.14.attn_temp.q: 8
  model.blocks.14.attn_temp.v: 8
  model.blocks.14.cross_attn.kv_linear: 8
  model.blocks.14.cross_attn.proj: 8
  model.blocks.14.cross_attn.q_linear: 8
  model.blocks.14.mlp.fc1: 8
  model.blocks.14.mlp.fc2: 8
  model.blocks.15.attn.k: 8
  model.blocks.15.attn.proj: 8
  model.blocks.15.attn.q: 8
  model.blocks.15.attn.v: 8
  model.blocks.15.attn_temp.k: 8
  model.blocks.15.attn_temp.proj: 8
  model.blocks.15.attn_temp.q: 8
  model.blocks.15.attn_temp.v: 8
  model.blocks.15.cross_attn.kv_linear: 8
  model.blocks.15.cross_attn.proj: 8
  model.blocks.15.cross_attn.q_linear: 8
  model.blocks.15.mlp.fc1: 8
  model.blocks.15.mlp.fc2: 8
  model.blocks.16.attn.k: 8
  model.blocks.16.attn.proj: 8
  model.blocks.16.attn.q: 8
  model.blocks.16.attn.v: 8
  model.blocks.16.attn_temp.k: 8
  model.blocks.16.attn_temp.proj: 8
  model.blocks.16.attn_temp.q: 8
  model.blocks.16.attn_temp.v: 8
  model.blocks.16.cross_attn.kv_linear: 8
  model.blocks.16.cross_attn.proj: 8
  model.blocks.16.cross_attn.q_linear: 8
  model.blocks.16.mlp.fc1: 8
  model.blocks.16.mlp.fc2: 8
  model.blocks.17.attn.k: 8
  model.blocks.17.attn.proj: 8
  model.blocks.17.attn.q: 8
  model.blocks.17.attn.v: 8
  model.blocks.17.attn_temp.k: 8
  model.blocks.17.attn_temp.proj: 8
  model.blocks.17.attn_temp.q: 8
  model.blocks.17.attn_temp.v: 8
  model.blocks.17.cross_attn.kv_linear: 8
  model.blocks.17.cross_attn.proj: 8
  model.blocks.17.cross_attn.q_linear: 8
  model.blocks.17.mlp.fc1: 8
  model.blocks.17.mlp.fc2: 8
  model.blocks.18.attn.k: 8
  model.blocks.18.attn.proj: 8
  model.blocks.18.attn.q: 8
  model.blocks.18.attn.v: 8
  model.blocks.18.attn_temp.k: 8
  model.blocks.18.attn_temp.proj: 8
  model.blocks.18.attn_temp.q: 8
  model.blocks.18.attn_temp.v: 8
  model.blocks.18.cross_attn.kv_linear: 8
  model.blocks.18.cross_attn.proj: 8
  model.blocks.18.cross_attn.q_linear: 8
  model.blocks.18.mlp.fc1: 8
  model.blocks.18.mlp.fc2: 8
  model.blocks.19.attn.k: 8
  model.blocks.19.attn.proj: 8
  model.blocks.19.attn.q: 8
  model.blocks.19.attn.v: 8
  model.blocks.19.attn_temp.k: 8
  model.blocks.19.attn_temp.proj: 8
  model.blocks.19.attn_temp.q: 8
  model.blocks.19.attn_temp.v: 8
  model.blocks.19.cross_attn.kv_linear: 8
  model.blocks.19.cross_attn.proj: 8
  model.blocks.19.cross_attn.q_linear: 8
  model.blocks.19.mlp.fc1: 8
  model.blocks.19.mlp.fc2: 8
  model.blocks.2.attn.k: 8
  model.blocks.2.attn.proj: 8
  model.blocks.2.attn.q: 8
  model.blocks.2.attn.v: 8
  model.blocks.2.attn_temp.k: 8
  model.blocks.2.attn_temp.proj: 8
  model.blocks.2.attn_temp.q: 8
  model.blocks.2.attn_temp.v: 8
  model.blocks.2.cross_attn.kv_linear: 8
  model.blocks.2.cross_attn.proj: 8
  model.blocks.2.cross_attn.q_linear: 8
  model.blocks.2.mlp.fc1: 8
  model.blocks.2.mlp.fc2: 8
  model.blocks.20.attn.k: 8
  model.blocks.20.attn.proj: 8
  model.blocks.20.attn.q: 8
  model.blocks.20.attn.v: 8
  model.blocks.20.attn_temp.k: 8
  model.blocks.20.attn_temp.proj: 8
  model.blocks.20.attn_temp.q: 8
  model.blocks.20.attn_temp.v: 8
  model.blocks.20.cross_attn.kv_linear: 8
  model.blocks.20.cross_attn.proj: 8
  model.blocks.20.cross_attn.q_linear: 8
  model.blocks.20.mlp.fc1: 8
  model.blocks.20.mlp.fc2: 8
  model.blocks.21.attn.k: 8
  model.blocks.21.attn.proj: 8
  model.blocks.21.attn.q: 8
  model.blocks.21.attn.v: 8
  model.blocks.21.attn_temp.k: 8
  model.blocks.21.attn_temp.proj: 8
  model.blocks.21.attn_temp.q: 8
  model.blocks.21.attn_temp.v: 8
  model.blocks.21.cross_attn.kv_linear: 8
  model.blocks.21.cross_attn.proj: 8
  model.blocks.21.cross_attn.q_linear: 8
  model.blocks.21.mlp.fc1: 8
  model.blocks.21.mlp.fc2: 8
  model.blocks.22.attn.k: 8
  model.blocks.22.attn.proj: 8
  model.blocks.22.attn.q: 8
  model.blocks.22.attn.v: 8
  model.blocks.22.attn_temp.k: 8
  model.blocks.22.attn_temp.proj: 8
  model.blocks.22.attn_temp.q: 8
  model.blocks.22.attn_temp.v: 8
  model.blocks.22.cross_attn.kv_linear: 8
  model.blocks.22.cross_attn.proj: 8
  model.blocks.22.cross_attn.q_linear: 8
  model.blocks.22.mlp.fc1: 8
  model.blocks.22.mlp.fc2: 8
  model.blocks.23.attn.k: 8
  model.blocks.23.attn.proj: 8
  model.blocks.23.attn.q: 8
  model.blocks.23.attn.v: 8
  model.blocks.23.attn_temp.k: 8
  model.blocks.23.attn_temp.proj: 8
  model.blocks.23.attn_temp.q: 8
  model.blocks.23.attn_temp.v: 8
  model.blocks.23.cross_attn.kv_linear: 8
  model.blocks.23.cross_attn.proj: 8
  model.blocks.23.cross_attn.q_linear: 8
  model.blocks.23.mlp.fc1: 8
  model.blocks.23.mlp.fc2: 8
  model.blocks.24.attn.k: 8
  model.blocks.24.attn.proj: 8
  model.blocks.24.attn.q: 8
  model.blocks.24.attn.v: 8
  model.blocks.24.attn_temp.k: 8
  model.blocks.24.attn_temp.proj: 8
  model.blocks.24.attn_temp.q: 8
  model.blocks.24.attn_temp.v: 8
  model.blocks.24.cross_attn.kv_linear: 8
  model.blocks.24.cross_attn.proj: 8
  model.blocks.24.cross_attn.q_linear: 8
  model.blocks.24.mlp.fc1: 8
  model.blocks.24.mlp.fc2: 8
  model.blocks.25.attn.k: 8
  model.blocks.25.attn.proj: 8
  model.blocks.25.attn.q: 8
  model.blocks.25.attn.v: 8
  model.blocks.25.attn_temp.k: 8
  model.blocks.25.attn_temp.proj: 8
  model.blocks.25.attn_temp.q: 8
  model.blocks.25.attn_temp.v: 8
  model.blocks.25.cross_attn.kv_linear: 8
  model.blocks.25.cross_attn.proj: 8
  model.blocks.25.cross_attn.q_linear: 8
  model.blocks.25.mlp.fc1: 8
  model.blocks.25.mlp.fc2: 8
  model.blocks.26.attn.k: 8
  model.blocks.26.attn.proj: 8
  model.blocks.26.attn.q: 8
  model.blocks.26.attn.v: 8
  model.blocks.26.attn_temp.k: 8
  model.blocks.26.attn_temp.proj: 8
  model.blocks.26.attn_temp.q: 8
  model.blocks.26.attn_temp.v: 8
  model.blocks.26.cross_attn.kv_linear: 8
  model.blocks.26.cross_attn.proj: 8
  model.blocks.26.cross_attn.q_linear: 8
  model.blocks.26.mlp.fc1: 8
  model.blocks.26.mlp.fc2: 8
  model.blocks.27.attn.k: 8
  model.blocks.27.attn.proj: 8
  model.blocks.27.attn.q: 8
  model.blocks.27.attn.v: 8
  model.blocks.27.attn_temp.k: 8
  model.blocks.27.attn_temp.proj: 8
  model.blocks.27.attn_temp.q: 8
  model.blocks.27.attn_temp.v: 8
  model.blocks.27.cross_attn.kv_linear: 8
  model.blocks.27.cross_attn.proj: 8
  model.blocks.27.cross_attn.q_linear: 8
  model.blocks.27.mlp.fc1: 8
  model.blocks.27.mlp.fc2: 8
  model.blocks.3.attn.k: 8
  model.blocks.3.attn.proj: 8
  model.blocks.3.attn.q: 8
  model.blocks.3.attn.v: 8
  model.blocks.3.attn_temp.k: 8
  model.blocks.3.attn_temp.proj: 8
  model.blocks.3.attn_temp.q: 8
  model.blocks.3.attn_temp.v: 8
  model.blocks.3.cross_attn.kv_linear: 8
  model.blocks.3.cross_attn.proj: 8
  model.blocks.3.cross_attn.q_linear: 8
  model.blocks.3.mlp.fc1: 8
  model.blocks.3.mlp.fc2: 8
  model.blocks.4.attn.k: 8
  model.blocks.4.attn.proj: 8
  model.blocks.4.attn.q: 8
  model.blocks.4.attn.v: 8
  model.blocks.4.attn_temp.k: 8
  model.blocks.4.attn_temp.proj: 8
  model.blocks.4.attn_temp.q: 8
  model.blocks.4.attn_temp.v: 8
  model.blocks.4.cross_attn.kv_linear: 8
  model.blocks.4.cross_attn.proj: 8
  model.blocks.4.cross_attn.q_linear: 8
  model.blocks.4.mlp.fc1: 8
  model.blocks.4.mlp.fc2: 8
  model.blocks.5.attn.k: 8
  model.blocks.5.attn.proj: 8
  model.blocks.5.attn.q: 8
  model.blocks.5.attn.v: 8
  model.blocks.5.attn_temp.k: 8
  model.blocks.5.attn_temp.proj: 8
  model.blocks.5.attn_temp.q: 8
  model.blocks.5.attn_temp.v: 8
  model.blocks.5.cross_attn.kv_linear: 8
  model.blocks.5.cross_attn.proj: 8
  model.blocks.5.cross_attn.q_linear: 8
  model.blocks.5.mlp.fc1: 8
  model.blocks.5.mlp.fc2: 8
  model.blocks.6.attn.k: 8
  model.blocks.6.attn.proj: 8
  model.blocks.6.attn.q: 8
  model.blocks.6.attn.v: 8
  model.blocks.6.attn_temp.k: 8
  model.blocks.6.attn_temp.proj: 8
  model.blocks.6.attn_temp.q: 8
  model.blocks.6.attn_temp.v: 8
  model.blocks.6.cross_attn.kv_linear: 8
  model.blocks.6.cross_attn.proj: 8
  model.blocks.6.cross_attn.q_linear: 8
  model.blocks.6.mlp.fc1: 8
  model.blocks.6.mlp.fc2: 8
  model.blocks.7.attn.k: 8
  model.blocks.7.attn.proj: 8
  model.blocks.7.attn.q: 8
  model.blocks.7.attn.v: 8
  model.blocks.7.attn_temp.k: 8
  model.blocks.7.attn_temp.proj: 8
  model.blocks.7.attn_temp.q: 8
  model.blocks.7.attn_temp.v: 8
  model.blocks.7.cross_attn.kv_linear: 8
  model.blocks.7.cross_attn.proj: 8
  model.blocks.7.cross_attn.q_linear: 8
  model.blocks.7.mlp.fc1: 8
  model.blocks.7.mlp.fc2: 8
  model.blocks.8.attn.k: 8
  model.blocks.8.attn.proj: 8
  model.blocks.8.attn.q: 8
  model.blocks.8.attn.v: 8
  model.blocks.8.attn_temp.k: 8
  model.blocks.8.attn_temp.proj: 8
  model.blocks.8.attn_temp.q: 8
  model.blocks.8.attn_temp.v: 8
  model.blocks.8.cross_attn.kv_linear: 8
  model.blocks.8.cross_attn.proj: 8
  model.blocks.8.cross_attn.q_linear: 8
  model.blocks.8.mlp.fc1: 8
  model.blocks.8.mlp.fc2: 8
  model.blocks.9.attn.k: 8
  model.blocks.9.attn.proj: 8
  model.blocks.9.attn.q: 8
  model.blocks.9.attn.v: 8
  model.blocks.9.attn_temp.k: 8
  model.blocks.9.attn_temp.proj: 8
  model.blocks.9.attn_temp.q: 8
  model.blocks.9.attn_temp.v: 8
  model.blocks.9.cross_attn.kv_linear: 8
  model.blocks.9.cross_attn.proj: 8
  model.blocks.9.cross_attn.q_linear: 8
  model.blocks.9.mlp.fc1: 8
  model.blocks.9.mlp.fc2: 8
4-0:
  model.blocks.0.attn.k: 4
  model.blocks.0.attn.proj: 4
  model.blocks.0.attn.q: 4
  model.blocks.0.attn.v: 4
  model.blocks.0.attn_temp.k: 4
  model.blocks.0.attn_temp.proj: 4
  model.blocks.0.attn_temp.q: 4
  model.blocks.0.attn_temp.v: 4
  model.blocks.0.cross_attn.kv_linear: 4
  model.blocks.0.cross_attn.proj: 4
  model.blocks.0.cross_attn.q_linear: 4
  model.blocks.0.mlp.fc1: 8
  model.blocks.0.mlp.fc2: 8
  model.blocks.1.attn.k: 4
  model.blocks.1.attn.proj: 4
  model.blocks.1.attn.q: 4
  model.blocks.1.attn.v: 4
  model.blocks.1.attn_temp.k: 4
  model.blocks.1.attn_temp.proj: 4
  model.blocks.1.attn_temp.q: 4
  model.blocks.1.attn_temp.v: 4
  model.blocks.1.cross_attn.kv_linear: 4
  model.blocks.1.cross_attn.proj: 4
  model.blocks.1.cross_attn.q_linear: 4
  model.blocks.1.mlp.fc1: 8
  model.blocks.1.mlp.fc2: 8
  model.blocks.10.attn.k: 4
  model.blocks.10.attn.proj: 4
  model.blocks.10.attn.q: 4
  model.blocks.10.attn.v: 4
  model.blocks.10.attn_temp.k: 4
  model.blocks.10.attn_temp.proj: 4
  model.blocks.10.attn_temp.q: 4
  model.blocks.10.attn_temp.v: 4
  model.blocks.10.cross_attn.kv_linear: 4
  model.blocks.10.cross_attn.proj: 4
  model.blocks.10.cross_attn.q_linear: 4
  model.blocks.10.mlp.fc1: 8
  model.blocks.10.mlp.fc2: 8
  model.blocks.11.attn.k: 4
  model.blocks.11.attn.proj: 4
  model.blocks.11.attn.q: 4
  model.blocks.11.attn.v: 4
  model.blocks.11.attn_temp.k: 4
  model.blocks.11.attn_temp.proj: 4
  model.blocks.11.attn_temp.q: 4
  model.blocks.11.attn_temp.v: 4
  model.blocks.11.cross_attn.kv_linear: 4
  model.blocks.11.cross_attn.proj: 4
  model.blocks.11.cross_attn.q_linear: 4
  model.blocks.11.mlp.fc1: 8
  model.blocks.11.mlp.fc2: 8
  model.blocks.12.attn.k: 4
  model.blocks.12.attn.proj: 4
  model.blocks.12.attn.q: 4
  model.blocks.12.attn.v: 4
  model.blocks.12.attn_temp.k: 4
  model.blocks.12.attn_temp.proj: 4
  model.blocks.12.attn_temp.q: 4
  model.blocks.12.attn_temp.v: 4
  model.blocks.12.cross_attn.kv_linear: 4
  model.blocks.12.cross_attn.proj: 4
  model.blocks.12.cross_attn.q_linear: 4
  model.blocks.12.mlp.fc1: 8
  model.blocks.12.mlp.fc2: 8
  model.blocks.13.attn.k: 4
  model.blocks.13.attn.proj: 4
  model.blocks.13.attn.q: 4
  model.blocks.13.attn.v: 4
  model.blocks.13.attn_temp.k: 4
  model.blocks.13.attn_temp.proj: 4
  model.blocks.13.attn_temp.q: 4
  model.blocks.13.attn_temp.v: 4
  model.blocks.13.cross_attn.kv_linear: 4
  model.blocks.13.cross_attn.proj: 4
  model.blocks.13.cross_attn.q_linear: 4
  model.blocks.13.mlp.fc1: 8
  model.blocks.13.mlp.fc2: 8
  model.blocks.14.attn.k: 4
  model.blocks.14.attn.proj: 4
  model.blocks.14.attn.q: 4
  model.blocks.14.attn.v: 4
  model.blocks.14.attn_temp.k: 4
  model.blocks.14.attn_temp.proj: 4
  model.blocks.14.attn_temp.q: 4
  model.blocks.14.attn_temp.v: 4
  model.blocks.14.cross_attn.kv_linear: 4
  model.blocks.14.cross_attn.proj: 4
  model.blocks.14.cross_attn.q_linear: 4
  model.blocks.14.mlp.fc1: 8
  model.blocks.14.mlp.fc2: 8
  model.blocks.15.attn.k: 4
  model.blocks.15.attn.proj: 4
  model.blocks.15.attn.q: 4
  model.blocks.15.attn.v: 4
  model.blocks.15.attn_temp.k: 4
  model.blocks.15.attn_temp.proj: 4
  model.blocks.15.attn_temp.q: 4
  model.blocks.15.attn_temp.v: 4
  model.blocks.15.cross_attn.kv_linear: 4
  model.blocks.15.cross_attn.proj: 4
  model.blocks.15.cross_attn.q_linear: 4
  model.blocks.15.mlp.fc1: 8
  model.blocks.15.mlp.fc2: 8
  model.blocks.16.attn.k: 4
  model.blocks.16.attn.proj: 4
  model.blocks.16.attn.q: 4
  model.blocks.16.attn.v: 4
  model.blocks.16.attn_temp.k: 4
  model.blocks.16.attn_temp.proj: 4
  model.blocks.16.attn_temp.q: 4
  model.blocks.16.attn_temp.v: 4
  model.blocks.16.cross_attn.kv_linear: 4
  model.blocks.16.cross_attn.proj: 4
  model.blocks.16.cross_attn.q_linear: 4
  model.blocks.16.mlp.fc1: 8
  model.blocks.16.mlp.fc2: 8
  model.blocks.17.attn.k: 4
  model.blocks.17.attn.proj: 4
  model.blocks.17.attn.q: 4
  model.blocks.17.attn.v: 4
  model.blocks.17.attn_temp.k: 4
  model.blocks.17.attn_temp.proj: 4
  model.blocks.17.attn_temp.q: 4
  model.blocks.17.attn_temp.v: 4
  model.blocks.17.cross_attn.kv_linear: 4
  model.blocks.17.cross_attn.proj: 4
  model.blocks.17.cross_attn.q_linear: 4
  model.blocks.17.mlp.fc1: 8
  model.blocks.17.mlp.fc2: 8
  model.blocks.18.attn.k: 4
  model.blocks.18.attn.proj: 4
  model.blocks.18.attn.q: 4
  model.blocks.18.attn.v: 4
  model.blocks.18.attn_temp.k: 4
  model.blocks.18.attn_temp.proj: 4
  model.blocks.18.attn_temp.q: 4
  model.blocks.18.attn_temp.v: 4
  model.blocks.18.cross_attn.kv_linear: 4
  model.blocks.18.cross_attn.proj: 4
  model.blocks.18.cross_attn.q_linear: 4
  model.blocks.18.mlp.fc1: 8
  model.blocks.18.mlp.fc2: 8
  model.blocks.19.attn.k: 4
  model.blocks.19.attn.proj: 4
  model.blocks.19.attn.q: 4
  model.blocks.19.attn.v: 4
  model.blocks.19.attn_temp.k: 4
  model.blocks.19.attn_temp.proj: 4
  model.blocks.19.attn_temp.q: 4
  model.blocks.19.attn_temp.v: 4
  model.blocks.19.cross_attn.kv_linear: 4
  model.blocks.19.cross_attn.proj: 4
  model.blocks.19.cross_attn.q_linear: 4
  model.blocks.19.mlp.fc1: 8
  model.blocks.19.mlp.fc2: 8
  model.blocks.2.attn.k: 4
  model.blocks.2.attn.proj: 4
  model.blocks.2.attn.q: 4
  model.blocks.2.attn.v: 4
  model.blocks.2.attn_temp.k: 4
  model.blocks.2.attn_temp.proj: 4
  model.blocks.2.attn_temp.q: 4
  model.blocks.2.attn_temp.v: 4
  model.blocks.2.cross_attn.kv_linear: 4
  model.blocks.2.cross_attn.proj: 4
  model.blocks.2.cross_attn.q_linear: 4
  model.blocks.2.mlp.fc1: 8
  model.blocks.2.mlp.fc2: 8
  model.blocks.20.attn.k: 4
  model.blocks.20.attn.proj: 4
  model.blocks.20.attn.q: 4
  model.blocks.20.attn.v: 4
  model.blocks.20.attn_temp.k: 4
  model.blocks.20.attn_temp.proj: 4
  model.blocks.20.attn_temp.q: 4
  model.blocks.20.attn_temp.v: 4
  model.blocks.20.cross_attn.kv_linear: 4
  model.blocks.20.cross_attn.proj: 4
  model.blocks.20.cross_attn.q_linear: 4
  model.blocks.20.mlp.fc1: 8
  model.blocks.20.mlp.fc2: 8
  model.blocks.21.attn.k: 4
  model.blocks.21.attn.proj: 4
  model.blocks.21.attn.q: 4
  model.blocks.21.attn.v: 4
  model.blocks.21.attn_temp.k: 4
  model.blocks.21.attn_temp.proj: 4
  model.blocks.21.attn_temp.q: 4
  model.blocks.21.attn_temp.v: 4
  model.blocks.21.cross_attn.kv_linear: 4
  model.blocks.21.cross_attn.proj: 4
  model.blocks.21.cross_attn.q_linear: 4
  model.blocks.21.mlp.fc1: 8
  model.blocks.21.mlp.fc2: 8
  model.blocks.22.attn.k: 4
  model.blocks.22.attn.proj: 4
  model.blocks.22.attn.q: 4
  model.blocks.22.attn.v: 4
  model.blocks.22.attn_temp.k: 4
  model.blocks.22.attn_temp.proj: 4
  model.blocks.22.attn_temp.q: 4
  model.blocks.22.attn_temp.v: 4
  model.blocks.22.cross_attn.kv_linear: 4
  model.blocks.22.cross_attn.proj: 4
  model.blocks.22.cross_attn.q_linear: 4
  model.blocks.22.mlp.fc1: 8
  model.blocks.22.mlp.fc2: 8
  model.blocks.23.attn.k: 4
  model.blocks.23.attn.proj: 4
  model.blocks.23.attn.q: 4
  model.blocks.23.attn.v: 4
  model.blocks.23.attn_temp.k: 8
  model.blocks.23.attn_temp.proj: 8
  model.blocks.23.attn_temp.q: 8
  model.blocks.23.attn_temp.v: 8
  model.blocks.23.cross_attn.kv_linear: 4
  model.blocks.23.cross_attn.proj: 4
  model.blocks.23.cross_attn.q_linear: 4
  model.blocks.23.mlp.fc1: 8
  model.blocks.23.mlp.fc2: 8
  model.blocks.24.attn.k: 4
  model.blocks.24.attn.proj: 4
  model.blocks.24.attn.q: 4
  model.blocks.24.attn.v: 4
  model.blocks.24.attn_temp.k: 4
  model.blocks.24.attn_temp.proj: 4
  model.blocks.24.attn_temp.q: 4
  model.blocks.24.attn_temp.v: 4
  model.blocks.24.cross_attn.kv_linear: 4
  model.blocks.24.cross_attn.proj: 4
  model.blocks.24.cross_attn.q_linear: 4
  model.blocks.24.mlp.fc1: 8
  model.blocks.24.mlp.fc2: 8
  model.blocks.25.attn.k: 4
  model.blocks.25.attn.proj: 4
  model.blocks.25.attn.q: 4
  model.blocks.25.attn.v: 4
  model.blocks.25.attn_temp.k: 4
  model.blocks.25.attn_temp.proj: 4
  model.blocks.25.attn_temp.q: 4
  model.blocks.25.attn_temp.v: 4
  model.blocks.25.cross_attn.kv_linear: 4
  model.blocks.25.cross_attn.proj: 4
  model.blocks.25.cross_attn.q_linear: 4
  model.blocks.25.mlp.fc1: 8
  model.blocks.25.mlp.fc2: 8
  model.blocks.26.attn.k: 4
  model.blocks.26.attn.proj: 4
  model.blocks.26.attn.q: 4
  model.blocks.26.attn.v: 4
  model.blocks.26.attn_temp.k: 4
  model.blocks.26.attn_temp.proj: 4
  model.blocks.26.attn_temp.q: 4
  model.blocks.26.attn_temp.v: 4
  model.blocks.26.cross_attn.kv_linear: 4
  model.blocks.26.cross_attn.proj: 4
  model.blocks.26.cross_attn.q_linear: 4
  model.blocks.26.mlp.fc1: 8
  model.blocks.26.mlp.fc2: 8
  model.blocks.27.attn.k: 4
  model.blocks.27.attn.proj: 4
  model.blocks.27.attn.q: 4
  model.blocks.27.attn.v: 4
  model.blocks.27.attn_temp.k: 4
  model.blocks.27.attn_temp.proj: 4
  model.blocks.27.attn_temp.q: 4
  model.blocks.27.attn_temp.v: 4
  model.blocks.27.cross_attn.kv_linear: 4
  model.blocks.27.cross_attn.proj: 4
  model.blocks.27.cross_attn.q_linear: 4
  model.blocks.27.mlp.fc1: 8
  model.blocks.27.mlp.fc2: 8
  model.blocks.3.attn.k: 4
  model.blocks.3.attn.proj: 4
  model.blocks.3.attn.q: 4
  model.blocks.3.attn.v: 4
  model.blocks.3.attn_temp.k: 4
  model.blocks.3.attn_temp.proj: 4
  model.blocks.3.attn_temp.q: 4
  model.blocks.3.attn_temp.v: 4
  model.blocks.3.cross_attn.kv_linear: 4
  model.blocks.3.cross_attn.proj: 4
  model.blocks.3.cross_attn.q_linear: 4
  model.blocks.3.mlp.fc1: 8
  model.blocks.3.mlp.fc2: 8
  model.blocks.4.attn.k: 4
  model.blocks.4.attn.proj: 4
  model.blocks.4.attn.q: 4
  model.blocks.4.attn.v: 4
  model.blocks.4.attn_temp.k: 4
  model.blocks.4.attn_temp.proj: 4
  model.blocks.4.attn_temp.q: 4
  model.blocks.4.attn_temp.v: 4
  model.blocks.4.cross_attn.kv_linear: 4
  model.blocks.4.cross_attn.proj: 4
  model.blocks.4.cross_attn.q_linear: 4
  model.blocks.4.mlp.fc1: 8
  model.blocks.4.mlp.fc2: 8
  model.blocks.5.attn.k: 4
  model.blocks.5.attn.proj: 4
  model.blocks.5.attn.q: 4
  model.blocks.5.attn.v: 4
  model.blocks.5.attn_temp.k: 4
  model.blocks.5.attn_temp.proj: 4
  model.blocks.5.attn_temp.q: 4
  model.blocks.5.attn_temp.v: 4
  model.blocks.5.cross_attn.kv_linear: 4
  model.blocks.5.cross_attn.proj: 4
  model.blocks.5.cross_attn.q_linear: 4
  model.blocks.5.mlp.fc1: 8
  model.blocks.5.mlp.fc2: 8
  model.blocks.6.attn.k: 4
  model.blocks.6.attn.proj: 4
  model.blocks.6.attn.q: 4
  model.blocks.6.attn.v: 4
  model.blocks.6.attn_temp.k: 4
  model.blocks.6.attn_temp.proj: 4
  model.blocks.6.attn_temp.q: 4
  model.blocks.6.attn_temp.v: 4
  model.blocks.6.cross_attn.kv_linear: 4
  model.blocks.6.cross_attn.proj: 4
  model.blocks.6.cross_attn.q_linear: 4
  model.blocks.6.mlp.fc1: 8
  model.blocks.6.mlp.fc2: 8
  model.blocks.7.attn.k: 4
  model.blocks.7.attn.proj: 4
  model.blocks.7.attn.q: 4
  model.blocks.7.attn.v: 4
  model.blocks.7.attn_temp.k: 4
  model.blocks.7.attn_temp.proj: 4
  model.blocks.7.attn_temp.q: 4
  model.blocks.7.attn_temp.v: 4
  model.blocks.7.cross_attn.kv_linear: 4
  model.blocks.7.cross_attn.proj: 4
  model.blocks.7.cross_attn.q_linear: 4
  model.blocks.7.mlp.fc1: 8
  model.blocks.7.mlp.fc2: 8
  model.blocks.8.attn.k: 4
  model.blocks.8.attn.proj: 4
  model.blocks.8.attn.q: 4
  model.blocks.8.attn.v: 4
  model.blocks.8.attn_temp.k: 4
  model.blocks.8.attn_temp.proj: 4
  model.blocks.8.attn_temp.q: 4
  model.blocks.8.attn_temp.v: 4
  model.blocks.8.cross_attn.kv_linear: 4
  model.blocks.8.cross_attn.proj: 4
  model.blocks.8.cross_attn.q_linear: 4
  model.blocks.8.mlp.fc1: 8
  model.blocks.8.mlp.fc2: 8
  model.blocks.9.attn.k: 4
  model.blocks.9.attn.proj: 4
  model.blocks.9.attn.q: 4
  model.blocks.9.attn.v: 4
  model.blocks.9.attn_temp.k: 4
  model.blocks.9.attn_temp.proj: 4
  model.blocks.9.attn_temp.q: 4
  model.blocks.9.attn_temp.v: 4
  model.blocks.9.cross_attn.kv_linear: 4
  model.blocks.9.cross_attn.proj: 4
  model.blocks.9.cross_attn.q_linear: 4
  model.blocks.9.mlp.fc1: 8
  model.blocks.9.mlp.fc2: 8
# Per-layer integer settings for the group keyed "9-5".
# NOTE(review): the values look like quantization bit-widths and the group key
# like a step/index range -- confirm against the code that loads this file.
# Within this group every attn, attn_temp and cross_attn entry of
# model.blocks.0 through model.blocks.27 is 4, and every mlp.fc1 / mlp.fc2
# entry is 8. Entries are ordered by string sort of the block index
# (0, 1, 10, ..., 19, 2, 20, ..., 27, 3, ..., 9), not numerically.
9-5:
  model.blocks.0.attn.k: 4
  model.blocks.0.attn.proj: 4
  model.blocks.0.attn.q: 4
  model.blocks.0.attn.v: 4
  model.blocks.0.attn_temp.k: 4
  model.blocks.0.attn_temp.proj: 4
  model.blocks.0.attn_temp.q: 4
  model.blocks.0.attn_temp.v: 4
  model.blocks.0.cross_attn.kv_linear: 4
  model.blocks.0.cross_attn.proj: 4
  model.blocks.0.cross_attn.q_linear: 4
  model.blocks.0.mlp.fc1: 8
  model.blocks.0.mlp.fc2: 8
  model.blocks.1.attn.k: 4
  model.blocks.1.attn.proj: 4
  model.blocks.1.attn.q: 4
  model.blocks.1.attn.v: 4
  model.blocks.1.attn_temp.k: 4
  model.blocks.1.attn_temp.proj: 4
  model.blocks.1.attn_temp.q: 4
  model.blocks.1.attn_temp.v: 4
  model.blocks.1.cross_attn.kv_linear: 4
  model.blocks.1.cross_attn.proj: 4
  model.blocks.1.cross_attn.q_linear: 4
  model.blocks.1.mlp.fc1: 8
  model.blocks.1.mlp.fc2: 8
  model.blocks.10.attn.k: 4
  model.blocks.10.attn.proj: 4
  model.blocks.10.attn.q: 4
  model.blocks.10.attn.v: 4
  model.blocks.10.attn_temp.k: 4
  model.blocks.10.attn_temp.proj: 4
  model.blocks.10.attn_temp.q: 4
  model.blocks.10.attn_temp.v: 4
  model.blocks.10.cross_attn.kv_linear: 4
  model.blocks.10.cross_attn.proj: 4
  model.blocks.10.cross_attn.q_linear: 4
  model.blocks.10.mlp.fc1: 8
  model.blocks.10.mlp.fc2: 8
  model.blocks.11.attn.k: 4
  model.blocks.11.attn.proj: 4
  model.blocks.11.attn.q: 4
  model.blocks.11.attn.v: 4
  model.blocks.11.attn_temp.k: 4
  model.blocks.11.attn_temp.proj: 4
  model.blocks.11.attn_temp.q: 4
  model.blocks.11.attn_temp.v: 4
  model.blocks.11.cross_attn.kv_linear: 4
  model.blocks.11.cross_attn.proj: 4
  model.blocks.11.cross_attn.q_linear: 4
  model.blocks.11.mlp.fc1: 8
  model.blocks.11.mlp.fc2: 8
  model.blocks.12.attn.k: 4
  model.blocks.12.attn.proj: 4
  model.blocks.12.attn.q: 4
  model.blocks.12.attn.v: 4
  model.blocks.12.attn_temp.k: 4
  model.blocks.12.attn_temp.proj: 4
  model.blocks.12.attn_temp.q: 4
  model.blocks.12.attn_temp.v: 4
  model.blocks.12.cross_attn.kv_linear: 4
  model.blocks.12.cross_attn.proj: 4
  model.blocks.12.cross_attn.q_linear: 4
  model.blocks.12.mlp.fc1: 8
  model.blocks.12.mlp.fc2: 8
  model.blocks.13.attn.k: 4
  model.blocks.13.attn.proj: 4
  model.blocks.13.attn.q: 4
  model.blocks.13.attn.v: 4
  model.blocks.13.attn_temp.k: 4
  model.blocks.13.attn_temp.proj: 4
  model.blocks.13.attn_temp.q: 4
  model.blocks.13.attn_temp.v: 4
  model.blocks.13.cross_attn.kv_linear: 4
  model.blocks.13.cross_attn.proj: 4
  model.blocks.13.cross_attn.q_linear: 4
  model.blocks.13.mlp.fc1: 8
  model.blocks.13.mlp.fc2: 8
  model.blocks.14.attn.k: 4
  model.blocks.14.attn.proj: 4
  model.blocks.14.attn.q: 4
  model.blocks.14.attn.v: 4
  model.blocks.14.attn_temp.k: 4
  model.blocks.14.attn_temp.proj: 4
  model.blocks.14.attn_temp.q: 4
  model.blocks.14.attn_temp.v: 4
  model.blocks.14.cross_attn.kv_linear: 4
  model.blocks.14.cross_attn.proj: 4
  model.blocks.14.cross_attn.q_linear: 4
  model.blocks.14.mlp.fc1: 8
  model.blocks.14.mlp.fc2: 8
  model.blocks.15.attn.k: 4
  model.blocks.15.attn.proj: 4
  model.blocks.15.attn.q: 4
  model.blocks.15.attn.v: 4
  model.blocks.15.attn_temp.k: 4
  model.blocks.15.attn_temp.proj: 4
  model.blocks.15.attn_temp.q: 4
  model.blocks.15.attn_temp.v: 4
  model.blocks.15.cross_attn.kv_linear: 4
  model.blocks.15.cross_attn.proj: 4
  model.blocks.15.cross_attn.q_linear: 4
  model.blocks.15.mlp.fc1: 8
  model.blocks.15.mlp.fc2: 8
  model.blocks.16.attn.k: 4
  model.blocks.16.attn.proj: 4
  model.blocks.16.attn.q: 4
  model.blocks.16.attn.v: 4
  model.blocks.16.attn_temp.k: 4
  model.blocks.16.attn_temp.proj: 4
  model.blocks.16.attn_temp.q: 4
  model.blocks.16.attn_temp.v: 4
  model.blocks.16.cross_attn.kv_linear: 4
  model.blocks.16.cross_attn.proj: 4
  model.blocks.16.cross_attn.q_linear: 4
  model.blocks.16.mlp.fc1: 8
  model.blocks.16.mlp.fc2: 8
  model.blocks.17.attn.k: 4
  model.blocks.17.attn.proj: 4
  model.blocks.17.attn.q: 4
  model.blocks.17.attn.v: 4
  model.blocks.17.attn_temp.k: 4
  model.blocks.17.attn_temp.proj: 4
  model.blocks.17.attn_temp.q: 4
  model.blocks.17.attn_temp.v: 4
  model.blocks.17.cross_attn.kv_linear: 4
  model.blocks.17.cross_attn.proj: 4
  model.blocks.17.cross_attn.q_linear: 4
  model.blocks.17.mlp.fc1: 8
  model.blocks.17.mlp.fc2: 8
  model.blocks.18.attn.k: 4
  model.blocks.18.attn.proj: 4
  model.blocks.18.attn.q: 4
  model.blocks.18.attn.v: 4
  model.blocks.18.attn_temp.k: 4
  model.blocks.18.attn_temp.proj: 4
  model.blocks.18.attn_temp.q: 4
  model.blocks.18.attn_temp.v: 4
  model.blocks.18.cross_attn.kv_linear: 4
  model.blocks.18.cross_attn.proj: 4
  model.blocks.18.cross_attn.q_linear: 4
  model.blocks.18.mlp.fc1: 8
  model.blocks.18.mlp.fc2: 8
  model.blocks.19.attn.k: 4
  model.blocks.19.attn.proj: 4
  model.blocks.19.attn.q: 4
  model.blocks.19.attn.v: 4
  model.blocks.19.attn_temp.k: 4
  model.blocks.19.attn_temp.proj: 4
  model.blocks.19.attn_temp.q: 4
  model.blocks.19.attn_temp.v: 4
  model.blocks.19.cross_attn.kv_linear: 4
  model.blocks.19.cross_attn.proj: 4
  model.blocks.19.cross_attn.q_linear: 4
  model.blocks.19.mlp.fc1: 8
  model.blocks.19.mlp.fc2: 8
  model.blocks.2.attn.k: 4
  model.blocks.2.attn.proj: 4
  model.blocks.2.attn.q: 4
  model.blocks.2.attn.v: 4
  model.blocks.2.attn_temp.k: 4
  model.blocks.2.attn_temp.proj: 4
  model.blocks.2.attn_temp.q: 4
  model.blocks.2.attn_temp.v: 4
  model.blocks.2.cross_attn.kv_linear: 4
  model.blocks.2.cross_attn.proj: 4
  model.blocks.2.cross_attn.q_linear: 4
  model.blocks.2.mlp.fc1: 8
  model.blocks.2.mlp.fc2: 8
  model.blocks.20.attn.k: 4
  model.blocks.20.attn.proj: 4
  model.blocks.20.attn.q: 4
  model.blocks.20.attn.v: 4
  model.blocks.20.attn_temp.k: 4
  model.blocks.20.attn_temp.proj: 4
  model.blocks.20.attn_temp.q: 4
  model.blocks.20.attn_temp.v: 4
  model.blocks.20.cross_attn.kv_linear: 4
  model.blocks.20.cross_attn.proj: 4
  model.blocks.20.cross_attn.q_linear: 4
  model.blocks.20.mlp.fc1: 8
  model.blocks.20.mlp.fc2: 8
  model.blocks.21.attn.k: 4
  model.blocks.21.attn.proj: 4
  model.blocks.21.attn.q: 4
  model.blocks.21.attn.v: 4
  model.blocks.21.attn_temp.k: 4
  model.blocks.21.attn_temp.proj: 4
  model.blocks.21.attn_temp.q: 4
  model.blocks.21.attn_temp.v: 4
  model.blocks.21.cross_attn.kv_linear: 4
  model.blocks.21.cross_attn.proj: 4
  model.blocks.21.cross_attn.q_linear: 4
  model.blocks.21.mlp.fc1: 8
  model.blocks.21.mlp.fc2: 8
  model.blocks.22.attn.k: 4
  model.blocks.22.attn.proj: 4
  model.blocks.22.attn.q: 4
  model.blocks.22.attn.v: 4
  model.blocks.22.attn_temp.k: 4
  model.blocks.22.attn_temp.proj: 4
  model.blocks.22.attn_temp.q: 4
  model.blocks.22.attn_temp.v: 4
  model.blocks.22.cross_attn.kv_linear: 4
  model.blocks.22.cross_attn.proj: 4
  model.blocks.22.cross_attn.q_linear: 4
  model.blocks.22.mlp.fc1: 8
  model.blocks.22.mlp.fc2: 8
  model.blocks.23.attn.k: 4
  model.blocks.23.attn.proj: 4
  model.blocks.23.attn.q: 4
  model.blocks.23.attn.v: 4
  model.blocks.23.attn_temp.k: 4
  model.blocks.23.attn_temp.proj: 4
  model.blocks.23.attn_temp.q: 4
  model.blocks.23.attn_temp.v: 4
  model.blocks.23.cross_attn.kv_linear: 4
  model.blocks.23.cross_attn.proj: 4
  model.blocks.23.cross_attn.q_linear: 4
  model.blocks.23.mlp.fc1: 8
  model.blocks.23.mlp.fc2: 8
  model.blocks.24.attn.k: 4
  model.blocks.24.attn.proj: 4
  model.blocks.24.attn.q: 4
  model.blocks.24.attn.v: 4
  model.blocks.24.attn_temp.k: 4
  model.blocks.24.attn_temp.proj: 4
  model.blocks.24.attn_temp.q: 4
  model.blocks.24.attn_temp.v: 4
  model.blocks.24.cross_attn.kv_linear: 4
  model.blocks.24.cross_attn.proj: 4
  model.blocks.24.cross_attn.q_linear: 4
  model.blocks.24.mlp.fc1: 8
  model.blocks.24.mlp.fc2: 8
  model.blocks.25.attn.k: 4
  model.blocks.25.attn.proj: 4
  model.blocks.25.attn.q: 4
  model.blocks.25.attn.v: 4
  model.blocks.25.attn_temp.k: 4
  model.blocks.25.attn_temp.proj: 4
  model.blocks.25.attn_temp.q: 4
  model.blocks.25.attn_temp.v: 4
  model.blocks.25.cross_attn.kv_linear: 4
  model.blocks.25.cross_attn.proj: 4
  model.blocks.25.cross_attn.q_linear: 4
  model.blocks.25.mlp.fc1: 8
  model.blocks.25.mlp.fc2: 8
  model.blocks.26.attn.k: 4
  model.blocks.26.attn.proj: 4
  model.blocks.26.attn.q: 4
  model.blocks.26.attn.v: 4
  model.blocks.26.attn_temp.k: 4
  model.blocks.26.attn_temp.proj: 4
  model.blocks.26.attn_temp.q: 4
  model.blocks.26.attn_temp.v: 4
  model.blocks.26.cross_attn.kv_linear: 4
  model.blocks.26.cross_attn.proj: 4
  model.blocks.26.cross_attn.q_linear: 4
  model.blocks.26.mlp.fc1: 8
  model.blocks.26.mlp.fc2: 8
  model.blocks.27.attn.k: 4
  model.blocks.27.attn.proj: 4
  model.blocks.27.attn.q: 4
  model.blocks.27.attn.v: 4
  model.blocks.27.attn_temp.k: 4
  model.blocks.27.attn_temp.proj: 4
  model.blocks.27.attn_temp.q: 4
  model.blocks.27.attn_temp.v: 4
  model.blocks.27.cross_attn.kv_linear: 4
  model.blocks.27.cross_attn.proj: 4
  model.blocks.27.cross_attn.q_linear: 4
  model.blocks.27.mlp.fc1: 8
  model.blocks.27.mlp.fc2: 8
  model.blocks.3.attn.k: 4
  model.blocks.3.attn.proj: 4
  model.blocks.3.attn.q: 4
  model.blocks.3.attn.v: 4
  model.blocks.3.attn_temp.k: 4
  model.blocks.3.attn_temp.proj: 4
  model.blocks.3.attn_temp.q: 4
  model.blocks.3.attn_temp.v: 4
  model.blocks.3.cross_attn.kv_linear: 4
  model.blocks.3.cross_attn.proj: 4
  model.blocks.3.cross_attn.q_linear: 4
  model.blocks.3.mlp.fc1: 8
  model.blocks.3.mlp.fc2: 8
  model.blocks.4.attn.k: 4
  model.blocks.4.attn.proj: 4
  model.blocks.4.attn.q: 4
  model.blocks.4.attn.v: 4
  model.blocks.4.attn_temp.k: 4
  model.blocks.4.attn_temp.proj: 4
  model.blocks.4.attn_temp.q: 4
  model.blocks.4.attn_temp.v: 4
  model.blocks.4.cross_attn.kv_linear: 4
  model.blocks.4.cross_attn.proj: 4
  model.blocks.4.cross_attn.q_linear: 4
  model.blocks.4.mlp.fc1: 8
  model.blocks.4.mlp.fc2: 8
  model.blocks.5.attn.k: 4
  model.blocks.5.attn.proj: 4
  model.blocks.5.attn.q: 4
  model.blocks.5.attn.v: 4
  model.blocks.5.attn_temp.k: 4
  model.blocks.5.attn_temp.proj: 4
  model.blocks.5.attn_temp.q: 4
  model.blocks.5.attn_temp.v: 4
  model.blocks.5.cross_attn.kv_linear: 4
  model.blocks.5.cross_attn.proj: 4
  model.blocks.5.cross_attn.q_linear: 4
  model.blocks.5.mlp.fc1: 8
  model.blocks.5.mlp.fc2: 8
  model.blocks.6.attn.k: 4
  model.blocks.6.attn.proj: 4
  model.blocks.6.attn.q: 4
  model.blocks.6.attn.v: 4
  model.blocks.6.attn_temp.k: 4
  model.blocks.6.attn_temp.proj: 4
  model.blocks.6.attn_temp.q: 4
  model.blocks.6.attn_temp.v: 4
  model.blocks.6.cross_attn.kv_linear: 4
  model.blocks.6.cross_attn.proj: 4
  model.blocks.6.cross_attn.q_linear: 4
  model.blocks.6.mlp.fc1: 8
  model.blocks.6.mlp.fc2: 8
  model.blocks.7.attn.k: 4
  model.blocks.7.attn.proj: 4
  model.blocks.7.attn.q: 4
  model.blocks.7.attn.v: 4
  model.blocks.7.attn_temp.k: 4
  model.blocks.7.attn_temp.proj: 4
  model.blocks.7.attn_temp.q: 4
  model.blocks.7.attn_temp.v: 4
  model.blocks.7.cross_attn.kv_linear: 4
  model.blocks.7.cross_attn.proj: 4
  model.blocks.7.cross_attn.q_linear: 4
  model.blocks.7.mlp.fc1: 8
  model.blocks.7.mlp.fc2: 8
  model.blocks.8.attn.k: 4
  model.blocks.8.attn.proj: 4
  model.blocks.8.attn.q: 4
  model.blocks.8.attn.v: 4
  model.blocks.8.attn_temp.k: 4
  model.blocks.8.attn_temp.proj: 4
  model.blocks.8.attn_temp.q: 4
  model.blocks.8.attn_temp.v: 4
  model.blocks.8.cross_attn.kv_linear: 4
  model.blocks.8.cross_attn.proj: 4
  model.blocks.8.cross_attn.q_linear: 4
  model.blocks.8.mlp.fc1: 8
  model.blocks.8.mlp.fc2: 8
  model.blocks.9.attn.k: 4
  model.blocks.9.attn.proj: 4
  model.blocks.9.attn.q: 4
  model.blocks.9.attn.v: 4
  model.blocks.9.attn_temp.k: 4
  model.blocks.9.attn_temp.proj: 4
  model.blocks.9.attn_temp.q: 4
  model.blocks.9.attn_temp.v: 4
  model.blocks.9.cross_attn.kv_linear: 4
  model.blocks.9.cross_attn.proj: 4
  model.blocks.9.cross_attn.q_linear: 4
  model.blocks.9.mlp.fc1: 8
  model.blocks.9.mlp.fc2: 8
# One list of layer-name fragments per group key (14-10, 19-15, 4-0, 9-5).
# NOTE(review): presumably layers whose names match a fragment are kept in
# floating point instead of using the per-layer integer settings -- confirm
# against the code that reads fp_layers.
# The active fragments "fc1_" / "fc2_" end in an underscore, whereas the
# per-layer keys elsewhere in this file end in ".mlp.fc1" / ".mlp.fc2";
# TODO confirm how the consumer matches these fragments.
# Lines of the form "# - blocks.N.attn" are disabled entries: they are YAML
# comments and are not part of the parsed lists.
fp_layers:
  14-10:
  - fc1_
  - fc2_
  # Disabled entries for 14-10:
  # - blocks.4.attn
  # - blocks.11.attn
  19-15:
  - fc1_
  - fc2_
  # Disabled entries for 19-15.
  # NOTE(review): both entries below are identical (blocks.11.attn twice);
  # verify whether a different block was intended before re-enabling.
  # - blocks.11.attn
  # - blocks.11.attn
  4-0:
  - fc1_
  - fc2_
  # Disabled entries for 4-0:
  # - blocks.1.attn
  # - blocks.25.attn
  9-5:
  - fc1_
  - fc2_
  # Disabled entries for 9-5:
  # - blocks.26.attn
  # - blocks.10.attn
