diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..2774f33dc79ddbfd36956e55e757b716db91b6cc 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,2439 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.bias.value/0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_0.kernel.value/0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.1 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.10 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.100 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.101 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.102 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.103 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.104 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.105 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.106 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.107 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.108 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.109 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.11 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.110 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.111 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.112 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.113 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.114 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.115 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.116 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.117 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.118 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.119 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.12 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.120 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.121 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.122 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.123 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.124 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.125 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.126 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.127 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.13 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.14 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.15 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.16 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.17 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.18 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.19 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.2 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.20 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.21 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.22 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.23 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.24 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.25 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.26 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.27 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.28 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.29 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.3 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.30 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.31 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.32 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.33 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.34 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.35 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.36 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.37 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.38 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.39 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.4 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.40 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.41 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.42 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.43 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.44 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.45 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.46 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.47 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.48 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.49 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.5 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.50 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.51 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.52 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.53 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.54 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.55 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.56 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.57 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.58 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.59 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.6 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.60 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.61 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.62 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.63 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.64 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.65 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.66 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.67 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.68 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.69 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.7 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.70 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.71 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.72 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.73 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.74 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.75 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.76 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.77 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.78 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.79 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.8 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.80 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.81 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.82 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.83 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.84 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.85 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.86 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.87 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.88 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.89 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.9 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.90 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.91 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.92 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.93 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.94 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.95 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.96 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.97 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.98 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MlpBlock_0.Dense_1.kernel.value/0.0.99 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.bias.value/0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.1.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.10.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.100.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.101.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.102.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.103.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.104.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.105.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.106.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.107.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.108.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.109.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.11.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.110.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.111.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.112.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.113.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.114.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.115.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.116.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.117.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.118.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.119.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.12.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.120.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.121.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.122.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.123.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.124.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.125.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.126.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.127.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.13.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.14.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.15.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.16.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.17.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.18.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.19.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.2.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.20.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.21.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.22.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.23.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.24.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.25.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.26.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.27.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.28.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.29.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.3.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.30.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.31.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.32.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.33.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.34.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.35.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.36.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.37.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.38.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.39.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.4.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.40.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.41.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.42.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.43.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.44.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.45.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.46.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.47.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.48.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.49.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.5.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.50.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.51.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.52.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.53.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.54.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.55.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.56.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.57.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.58.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.59.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.6.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.60.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.61.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.62.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.63.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.64.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.65.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.66.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.67.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.68.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.69.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.7.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.70.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.71.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.72.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.73.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.74.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.75.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.76.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.77.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.78.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.79.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.8.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.80.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.81.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.82.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.83.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.84.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.85.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.86.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.87.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.88.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.89.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.9.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.90.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.91.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.92.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.93.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.94.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.95.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.96.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.97.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.98.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.key.kernel.value/0.99.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.1 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.10 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.100 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.101 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.102 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.103 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.104 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.105 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.106 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.107 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.108 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.109 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.11 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.110 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.111 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.112 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.113 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.114 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.115 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.116 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.117 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.118 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.119 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.12 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.120 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.121 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.122 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.123 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.124 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.125 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.126 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.127 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.13 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.14 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.15 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.16 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.17 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.18 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.19 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.2 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.20 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.21 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.22 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.23 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.24 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.25 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.26 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.27 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.28 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.29 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.3 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.30 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.31 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.32 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.33 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.34 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.35 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.36 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.37 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.38 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.39 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.4 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.40 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.41 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.42 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.43 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.44 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.45 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.46 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.47 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.48 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.49 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.5 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.50 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.51 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.52 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.53 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.54 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.55 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.56 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.57 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.58 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.59 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.6 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.60 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.61 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.62 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.63 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.64 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.65 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.66 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.67 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.68 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.69 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.7 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.70 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.71 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.72 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.73 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.74 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.75 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.76 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.77 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.78 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.79 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.8 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.80 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.81 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.82 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.83 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.84 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.85 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.86 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.87 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.88 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.89 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.9 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.90 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.91 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.92 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.93 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.94 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.95 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.96 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.97 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.98 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.out.kernel.value/0.0.0.99 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.bias.value/0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.1.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.10.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.100.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.101.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.102.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.103.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.104.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.105.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.106.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.107.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.108.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.109.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.11.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.110.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.111.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.112.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.113.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.114.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.115.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.116.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.117.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.118.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.119.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.12.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.120.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.121.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.122.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.123.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.124.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.125.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.126.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.127.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.13.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.14.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.15.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.16.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.17.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.18.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.19.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.2.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.20.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.21.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.22.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.23.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.24.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.25.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.26.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.27.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.28.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.29.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.3.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.30.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.31.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.32.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.33.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.34.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.35.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.36.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.37.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.38.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.39.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.4.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.40.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.41.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.42.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.43.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.44.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.45.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.46.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.47.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.48.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.49.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.5.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.50.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.51.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.52.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.53.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.54.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.55.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.56.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.57.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.58.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.59.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.6.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.60.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.61.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.62.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.63.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.64.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.65.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.66.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.67.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.68.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.69.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.7.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.70.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.71.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.72.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.73.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.74.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.75.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.76.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.77.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.78.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.79.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.8.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.80.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.81.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.82.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.83.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.84.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.85.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.86.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.87.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.88.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.89.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.9.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.90.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.91.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.92.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.93.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.94.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.95.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.96.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.97.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.98.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.query.kernel.value/0.99.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.bias.value/0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.1.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.10.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.100.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.101.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.102.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.103.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.104.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.105.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.106.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.107.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.108.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.109.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.11.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.110.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.111.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.112.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.113.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.114.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.115.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.116.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.117.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.118.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.119.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.12.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.120.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.121.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.122.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.123.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.124.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.125.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.126.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.127.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.13.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.14.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.15.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.16.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.17.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.18.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.19.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.2.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.20.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.21.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.22.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.23.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.24.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.25.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.26.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.27.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.28.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.29.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.3.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.30.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.31.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.32.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.33.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.34.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.35.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.36.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.37.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.38.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.39.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.4.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.40.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.41.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.42.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.43.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.44.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.45.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.46.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.47.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.48.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.49.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.5.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.50.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.51.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.52.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.53.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.54.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.55.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.56.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.57.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.58.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.59.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.6.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.60.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.61.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.62.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.63.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.64.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.65.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.66.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.67.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.68.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.69.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.7.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.70.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.71.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.72.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.73.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.74.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.75.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.76.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.77.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.78.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.79.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.8.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.80.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.81.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.82.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.83.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.84.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.85.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.86.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.87.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.88.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.89.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.9.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.90.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.91.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.92.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.93.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.94.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.95.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.96.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.97.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.98.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoderblock.MultiHeadDotProductAttention_0.value.kernel.value/0.99.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.embedder.input_embedding.value/99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum.w.value/0.0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.attn_vec_einsum_1.w.value/0.0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum.w.value/0.0.0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.kv_einsum_1.w.value/0.0.0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum.w.value/0.0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.attn.q_einsum_1.w.value/0.0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.gating_einsum.value/0.0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp.linear.value/0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.gating_einsum.value/0.0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.mlp_1.linear.value/0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_attention_norm_1.Dense_0.kernel.value/0.99.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.0.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.1.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.10.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.100.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.101.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.102.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.103.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.104.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.105.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.106.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.107.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.108.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.109.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.11.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.110.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.111.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.112.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.113.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.114.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.115.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.116.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.117.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.118.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.119.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.12.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.120.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.121.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.122.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.123.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.124.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.125.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.126.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.127.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.13.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.14.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.15.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.16.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.17.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.18.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.19.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.2.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.20.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.21.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.22.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.23.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.24.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.25.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.26.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.27.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.28.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.29.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.3.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.30.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.31.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.32.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.33.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.34.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.35.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.36.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.37.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.38.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.39.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.4.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.40.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.41.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.42.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.43.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.44.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.45.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.46.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.47.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.48.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.49.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.5.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.50.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.51.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.52.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.53.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.54.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.55.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.56.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.57.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.58.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.59.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.6.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.60.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.61.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.62.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.63.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.64.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.65.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.66.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.67.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.68.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.69.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.7.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.70.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.71.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.72.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.73.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.74.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.75.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.76.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.77.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.78.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.79.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.8.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.80.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.81.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.82.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.83.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.84.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.85.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.86.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.87.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.88.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.89.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.9.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.90.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.91.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.92.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.93.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.94.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.95.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.96.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.97.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.98.0 filter=lfs diff=lfs merge=lfs -text +pi05-b1kpt12-cs32/params/params.PaliGemma.llm.layers.pre_ffw_norm_1.Dense_0.kernel.value/0.99.0 filter=lfs diff=lfs merge=lfs -text diff --git a/pi05-b1kpt12-cs32/_CHECKPOINT_METADATA b/pi05-b1kpt12-cs32/_CHECKPOINT_METADATA new file mode 100644 index 0000000000000000000000000000000000000000..b1ad20b876da4154895b37ea79c5f676cb6b0451 --- /dev/null +++ b/pi05-b1kpt12-cs32/_CHECKPOINT_METADATA @@ -0,0 +1 @@ +{"item_handlers": {"assets": "openpi.training.checkpoints_dist.CallbackHandler", "params": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler", "train_state": "orbax.checkpoint._src.handlers.pytree_checkpoint_handler.PyTreeCheckpointHandler"}, "metrics": {}, "performance_metrics": {}, "init_timestamp_nsecs": 1767229799528496481, "commit_timestamp_nsecs": 1767229802728609275, "custom_metadata": {}} \ No newline at end of file diff --git a/pi05-b1kpt12-cs32/assets/behavior-1k/2025-challenge-demos/norm_stats.json b/pi05-b1kpt12-cs32/assets/behavior-1k/2025-challenge-demos/norm_stats.json new file mode 100644 index 0000000000000000000000000000000000000000..fefcaf18ff6a0ed252f90c5d44deea7896633042 --- /dev/null +++ b/pi05-b1kpt12-cs32/assets/behavior-1k/2025-challenge-demos/norm_stats.json @@ -0,0 +1,280 @@ +{ + "norm_stats": { + "state": { + "mean": [ + -0.00005846144354851098, + 0.00004309547299772801, + 1.87934179853968e-6, + 0.9309465947766095, + -1.2725443969951074, + -0.49766999210309626, + 1.942999814430757e-6, + -0.4158380201614152, + 0.04024515114955109, + -0.07453817193179028, + -0.594127535939615, + 0.31868265162070325, + 0.11388705850720614, + -0.05640597927522259, + -0.4669532543297629, + -0.05248480201419137, + 0.05701159751817017, + -0.6318098552799045, + -0.19042700845828708, + 0.13961942843285158, + 0.04829387427794492, + 0.08463827622965639, + 0.07941574332132866, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "std": [ + 0.0073260674368166145, + 0.006824090883079344, + 0.010712973796184456, + 0.442045850335985, + 0.7984148593179322, + 0.44361891874599685, + 0.00013675557574358197, + 0.43882239648902227, + 0.15635028019966846, + 0.4415431635427401, + 0.5225676751868289, + 0.5451061475740472, + 0.5257572044197384, + 0.4812971265544686, + 0.4183356509452899, + 0.16286194001261475, + 0.3981727014724286, + 0.5389020848022247, + 0.5424428796172592, + 0.5290570416795007, + 0.468644092644503, + 0.029892546801102766, + 0.03394196803560625, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "q01": [ + -0.23693275068700315, + -0.2203868911638856, + -0.282214498847723, + 0.44817109262943267, + -2.56078554391861, + -1.832590900182724, + -0.000603372776764445, + -2.2558812255859375, + -0.17450004816055298, + -2.298614817261696, + -1.6374141297340392, + -1.70578418469429, + -1.0471981763839722, + -1.5708000659942627, + -2.2236741222143173, + -1.1826500248908998, + -1.8255017410516738, + -1.6310564013123512, + -2.3159839910268785, + -1.0471978187561035, + -1.5707999467849731, + 5.3140223088207984e-11, + 4.113015408258036e-9, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "q99": [ + 0.22272354944050343, + 0.22707138995826218, + 0.2740946335345507, + 1.7174573242664337, + -0.39724056361615656, + 0.2502449731826779, + 0.0005501750274852384, + 0.4865392913520338, + 1.057918763875961, + 1.8702061723470693, + 0.09817898899316788, + 2.3561959266662598, + 1.0471981763839722, + 1.5656513550281526, + 0.3981790454536678, + 0.17450004816055298, + 2.1624921292066577, + 0.08283200771734119, + 2.187388210654259, + 1.0471981763839722, + 1.5707989931106567, + 0.10000000149011612, + 0.10000000149011612, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + }, + "actions": { + "mean": [ + 0.04893109266375809, + 0.0006245477533399661, + -0.0011740326839283477, + 0.9310451754144458, + -1.2729174177854237, + -0.49817541274017557, + 0.0, + -0.4161416368262307, + 0.04028842801120399, + -0.07512601234020208, + -0.5943173639491, + 0.32049573491580646, + 0.11449833148934463, + -0.055707589426407134, + 0.37810974451379986, + -0.46734652490351297, + -0.05252230497908911, + 0.057440953368954065, + -0.6319079902279605, + -0.19209668236034977, + 0.1400963262097964, + 0.04803503401809413, + 0.26497314649715065, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "std": [ + 0.13478765489848302, + 0.07874567256492745, + 0.12131280149054482, + 0.4419347796935527, + 0.798239592324256, + 0.44357783906871456, + 0.0, + 0.4389106302489066, + 0.15646820569544165, + 0.44319416228404, + 0.5226811432028959, + 0.5466780423732988, + 0.5272938230878158, + 0.4831235608098808, + 0.9257610744303914, + 0.4183771095337573, + 0.16297654493115837, + 0.39953061767050524, + 0.5392108370671137, + 0.5444271798241045, + 0.5305801543217454, + 0.47021922602431293, + 0.9642559210645204, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "q01": [ + -0.34999446114897725, + -0.34999996423721313, + -0.2999999523162842, + 0.44999998807907104, + -2.5608972549438476, + -1.8325998783111572, + 0.0, + -2.2566190130710604, + -0.1745000034570694, + -2.3041425182819366, + -1.6380093373060227, + -1.714489839732647, + -1.0471980571746826, + -1.5707999467849731, + -1.0, + -2.224471002697945, + -1.1824695777893066, + -1.8292457363605499, + -1.6290890508890152, + -2.3186697664260865, + -1.0471980571746826, + -1.5707999467849731, + -1.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "q99": [ + 0.6491305756568931, + 0.34999996423721313, + 0.2999999523162842, + 1.7174445390701294, + -0.4000000059604645, + 0.24981330260634432, + 0.0, + 0.4862977035939694, + 1.0588124077320096, + 1.8737776160240187, + 0.09817477315664291, + 2.3561956882476807, + 1.0471980571746826, + 1.5692623853683472, + 1.0, + 0.39837483105063465, + 0.1745000034570694, + 2.1637151706218734, + 0.08434060472249988, + 2.187532807230951, + 1.0471980571746826, + 1.5707999467849731, + 1.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ] + } + } +} \ No newline at end of file diff --git a/pi05-b1kpt12-cs32/params/_METADATA b/pi05-b1kpt12-cs32/params/_METADATA new file mode 100644 index 0000000000000000000000000000000000000000..b808bf84255c340512b8575000aafb3da4694a57 --- /dev/null +++ b/pi05-b1kpt12-cs32/params/_METADATA @@ -0,0 +1 @@ +{"tree_metadata": {"('params', 'PaliGemma', 'img', 'Transformer', 'encoder_norm', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoder_norm", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoder_norm', 'scale', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoder_norm", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'LayerNorm_0', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'LayerNorm_0', 'scale', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "LayerNorm_0", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'LayerNorm_1', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'LayerNorm_1', 'scale', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "LayerNorm_1", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MlpBlock_0', 'Dense_0', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MlpBlock_0', 'Dense_0', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MlpBlock_0', 'Dense_1', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MlpBlock_0', 'Dense_1', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MlpBlock_0", "key_type": 2}, {"key": "Dense_1", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MultiHeadDotProductAttention_0', 'key', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MultiHeadDotProductAttention_0', 'key', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "key", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MultiHeadDotProductAttention_0', 'out', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MultiHeadDotProductAttention_0', 'out', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "out", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MultiHeadDotProductAttention_0', 'query', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MultiHeadDotProductAttention_0', 'query', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "query", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MultiHeadDotProductAttention_0', 'value', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'Transformer', 'encoderblock', 'MultiHeadDotProductAttention_0', 'value', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "Transformer", "key_type": 2}, {"key": "encoderblock", "key_type": 2}, {"key": "MultiHeadDotProductAttention_0", "key_type": 2}, {"key": "value", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'embedding', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "embedding", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'embedding', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "embedding", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'head', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "head", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'head', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "head", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'img', 'pos_embedding', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "img", "key_type": 2}, {"key": "pos_embedding", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'embedder', 'input_embedding', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "embedder", "key_type": 2}, {"key": "input_embedding", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'final_norm', 'scale', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "final_norm", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'final_norm_1', 'Dense_0', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "final_norm_1", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'final_norm_1', 'Dense_0', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "final_norm_1", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'attn', 'attn_vec_einsum', 'w', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "attn_vec_einsum", "key_type": 2}, {"key": "w", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'attn', 'attn_vec_einsum_1', 'w', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "attn_vec_einsum_1", "key_type": 2}, {"key": "w", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'attn', 'kv_einsum', 'w', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "kv_einsum", "key_type": 2}, {"key": "w", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'attn', 'kv_einsum_1', 'w', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "kv_einsum_1", "key_type": 2}, {"key": "w", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'attn', 'q_einsum', 'w', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "q_einsum", "key_type": 2}, {"key": "w", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'attn', 'q_einsum_1', 'w', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "attn", "key_type": 2}, {"key": "q_einsum_1", "key_type": 2}, {"key": "w", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'mlp', 'gating_einsum', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "mlp", "key_type": 2}, {"key": "gating_einsum", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'mlp', 'linear', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "mlp", "key_type": 2}, {"key": "linear", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'mlp_1', 'gating_einsum', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "mlp_1", "key_type": 2}, {"key": "gating_einsum", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'mlp_1', 'linear', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "mlp_1", "key_type": 2}, {"key": "linear", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'pre_attention_norm', 'scale', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "pre_attention_norm", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'pre_attention_norm_1', 'Dense_0', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "pre_attention_norm_1", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'pre_attention_norm_1', 'Dense_0', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "pre_attention_norm_1", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'pre_ffw_norm', 'scale', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "pre_ffw_norm", "key_type": 2}, {"key": "scale", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'pre_ffw_norm_1', 'Dense_0', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "pre_ffw_norm_1", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'PaliGemma', 'llm', 'layers', 'pre_ffw_norm_1', 'Dense_0', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "PaliGemma", "key_type": 2}, {"key": "llm", "key_type": 2}, {"key": "layers", "key_type": 2}, {"key": "pre_ffw_norm_1", "key_type": 2}, {"key": "Dense_0", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'action_in_proj', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "action_in_proj", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'action_in_proj', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "action_in_proj", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'action_out_proj', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "action_out_proj", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'action_out_proj', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "action_out_proj", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'time_mlp_in', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "time_mlp_in", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'time_mlp_in', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "time_mlp_in", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'time_mlp_out', 'bias', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "time_mlp_out", "key_type": 2}, {"key": "bias", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}, "('params', 'time_mlp_out', 'kernel', 'value')": {"key_metadata": [{"key": "params", "key_type": 2}, {"key": "time_mlp_out", "key_type": 2}, {"key": "kernel", "key_type": 2}, {"key": "value", "key_type": 2}], "value_metadata": {"value_type": "jax.Array", "skip_deserialize": false}}}, "use_zarr3": false, "store_array_data_equal_to_fill_value": true, "custom_metadata": null} \ No newline at end of file diff --git a/pi05-b1kpt12-cs32/params/_sharding b/pi05-b1kpt12-cs32/params/_sharding new file mode 100644 index 0000000000000000000000000000000000000000..7e37724a87bbb27fdaef0a1ac768b1c46ef8d72e --- /dev/null +++ b/pi05-b1kpt12-cs32/params/_sharding @@ -0,0 +1 @@ +{"cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2Rlcl9ub3JtLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2Rlcl9ub3JtLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk11bHRpSGVhZERvdFByb2R1Y3RBdHRlbnRpb25fMC52YWx1ZS5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk11bHRpSGVhZERvdFByb2R1Y3RBdHRlbnRpb25fMC52YWx1ZS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk11bHRpSGVhZERvdFByb2R1Y3RBdHRlbnRpb25fMC5rZXkuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk11bHRpSGVhZERvdFByb2R1Y3RBdHRlbnRpb25fMC5rZXkua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk11bHRpSGVhZERvdFByb2R1Y3RBdHRlbnRpb25fMC5vdXQuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk11bHRpSGVhZERvdFByb2R1Y3RBdHRlbnRpb25fMC5vdXQua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk11bHRpSGVhZERvdFByb2R1Y3RBdHRlbnRpb25fMC5xdWVyeS5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk11bHRpSGVhZERvdFByb2R1Y3RBdHRlbnRpb25fMC5xdWVyeS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk1scEJsb2NrXzAuRGVuc2VfMC5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk1scEJsb2NrXzAuRGVuc2VfMC5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk1scEJsb2NrXzAuRGVuc2VfMS5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLk1scEJsb2NrXzAuRGVuc2VfMS5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLkxheWVyTm9ybV8wLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLkxheWVyTm9ybV8wLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLkxheWVyTm9ybV8xLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuVHJhbnNmb3JtZXIuZW5jb2RlcmJsb2NrLkxheWVyTm9ybV8xLnNjYWxlLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuZW1iZWRkaW5nLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuZW1iZWRkaW5nLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuaGVhZC5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcuaGVhZC5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5pbWcucG9zX2VtYmVkZGluZy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0uZW1iZWRkZXIuaW5wdXRfZW1iZWRkaW5nLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0uZmluYWxfbm9ybS5zY2FsZS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0uZmluYWxfbm9ybV8xLkRlbnNlXzAuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0uZmluYWxfbm9ybV8xLkRlbnNlXzAua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLm1scC5nYXRpbmdfZWluc3VtLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLm1scC5saW5lYXIudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLm1scF8xLmdhdGluZ19laW5zdW0udmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLm1scF8xLmxpbmVhci52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLmF0dG4uYXR0bl92ZWNfZWluc3VtLncudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLmF0dG4uYXR0bl92ZWNfZWluc3VtXzEudy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLmF0dG4ua3ZfZWluc3VtLncudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLmF0dG4ua3ZfZWluc3VtXzEudy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLmF0dG4ucV9laW5zdW0udy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLmF0dG4ucV9laW5zdW1fMS53LnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLnByZV9hdHRlbnRpb25fbm9ybS5zY2FsZS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLnByZV9hdHRlbnRpb25fbm9ybV8xLkRlbnNlXzAuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLnByZV9hdHRlbnRpb25fbm9ybV8xLkRlbnNlXzAua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLnByZV9mZndfbm9ybS5zY2FsZS52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLnByZV9mZndfbm9ybV8xLkRlbnNlXzAuYmlhcy52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLlBhbGlHZW1tYS5sbG0ubGF5ZXJzLnByZV9mZndfbm9ybV8xLkRlbnNlXzAua2VybmVsLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLmFjdGlvbl9pbl9wcm9qLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLmFjdGlvbl9pbl9wcm9qLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLmFjdGlvbl9vdXRfcHJvai5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLmFjdGlvbl9vdXRfcHJvai5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLnRpbWVfbWxwX291dC5iaWFzLnZhbHVl":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLnRpbWVfbWxwX291dC5rZXJuZWwudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLnRpbWVfbWxwX2luLmJpYXMudmFsdWU=":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}","cGFyYW1zLnRpbWVfbWxwX2luLmtlcm5lbC52YWx1ZQ==":"{\"sharding_type\": \"NamedSharding\", \"shape\": [128, 1], \"axis_names\": [\"batch\", \"fsdp\"], \"partition_spec\": [], \"device_mesh\": {\"mesh\": [[{\"id\": 0}], [{\"id\": 1}], [{\"id\": 2}], [{\"id\": 3}], [{\"id\": 4}], [{\"id\": 5}], [{\"id\": 6}], [{\"id\": 7}], [{\"id\": 8}], [{\"id\": 9}], [{\"id\": 10}], [{\"id\": 11}], [{\"id\": 12}], [{\"id\": 13}], [{\"id\": 14}], [{\"id\": 15}], [{\"id\": 16}], [{\"id\": 17}], [{\"id\": 18}], [{\"id\": 19}], [{\"id\": 20}], [{\"id\": 21}], [{\"id\": 22}], [{\"id\": 23}], [{\"id\": 24}], [{\"id\": 25}], [{\"id\": 26}], [{\"id\": 27}], [{\"id\": 28}], [{\"id\": 29}], [{\"id\": 30}], [{\"id\": 31}], [{\"id\": 32}], [{\"id\": 33}], [{\"id\": 34}], [{\"id\": 35}], [{\"id\": 36}], [{\"id\": 37}], [{\"id\": 38}], [{\"id\": 39}], [{\"id\": 40}], [{\"id\": 41}], [{\"id\": 42}], [{\"id\": 43}], [{\"id\": 44}], [{\"id\": 45}], [{\"id\": 46}], [{\"id\": 47}], [{\"id\": 48}], [{\"id\": 49}], [{\"id\": 50}], [{\"id\": 51}], [{\"id\": 52}], [{\"id\": 53}], [{\"id\": 54}], [{\"id\": 55}], [{\"id\": 56}], [{\"id\": 57}], [{\"id\": 58}], [{\"id\": 59}], [{\"id\": 60}], [{\"id\": 61}], [{\"id\": 62}], [{\"id\": 63}], [{\"id\": 64}], [{\"id\": 65}], [{\"id\": 66}], [{\"id\": 67}], [{\"id\": 68}], [{\"id\": 69}], [{\"id\": 70}], [{\"id\": 71}], [{\"id\": 72}], [{\"id\": 73}], [{\"id\": 74}], [{\"id\": 75}], [{\"id\": 76}], [{\"id\": 77}], [{\"id\": 78}], [{\"id\": 79}], [{\"id\": 80}], [{\"id\": 81}], [{\"id\": 82}], [{\"id\": 83}], [{\"id\": 84}], [{\"id\": 85}], [{\"id\": 86}], [{\"id\": 87}], [{\"id\": 88}], [{\"id\": 89}], [{\"id\": 90}], [{\"id\": 91}], [{\"id\": 92}], [{\"id\": 93}], [{\"id\": 94}], [{\"id\": 95}], [{\"id\": 96}], [{\"id\": 97}], [{\"id\": 98}], [{\"id\": 99}], [{\"id\": 100}], [{\"id\": 101}], [{\"id\": 102}], [{\"id\": 103}], [{\"id\": 104}], [{\"id\": 105}], [{\"id\": 106}], [{\"id\": 107}], [{\"id\": 108}], [{\"id\": 109}], [{\"id\": 110}], [{\"id\": 111}], [{\"id\": 112}], [{\"id\": 113}], [{\"id\": 114}], [{\"id\": 115}], [{\"id\": 116}], [{\"id\": 117}], [{\"id\": 118}], [{\"id\": 119}], [{\"id\": 120}], [{\"id\": 121}], [{\"id\": 122}], [{\"id\": 123}], [{\"id\": 124}], [{\"id\": 125}], [{\"id\": 126}], [{\"id\": 127}]]}}"} \ No newline at end of file diff --git a/pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoder_norm.bias.value/.zarray b/pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoder_norm.bias.value/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..21863bc65ef5e814e44ba92ab8ae2656065bc316 --- /dev/null +++ b/pi05-b1kpt12-cs32/params/params.PaliGemma.img.Transformer.encoder_norm.bias.value/.zarray @@ -0,0 +1 @@ +{"chunks":[9],"compressor":{"id":"zstd","level":1},"dimension_separator":".","dtype":"