diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..e6872cfabee5f5114d606fb9a989b675a417fd20 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,651 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.4.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.5.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.6.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.7.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.1 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.2 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.3 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.embedding.word_embeddings.weight/0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.embedding.word_embeddings.weight/1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.embedding.word_embeddings.weight/2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.embedding.word_embeddings.weight/3.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.output_layer.weight/0.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.output_layer.weight/1.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.output_layer.weight/2.0 filter=lfs diff=lfs merge=lfs -text +nemo_model/model_weights/model.output_layer.weight/3.0 filter=lfs diff=lfs merge=lfs -text diff --git a/nemo_model/model_config.yaml b/nemo_model/model_config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..2ee745462902404d0ff2630deefa52da04e31ee3 --- /dev/null +++ b/nemo_model/model_config.yaml @@ -0,0 +1,119 @@ +mcore_gpt: true +micro_batch_size: 1 +global_batch_size: 8 +tensor_model_parallel_size: 1 +pipeline_model_parallel_size: 1 +virtual_pipeline_model_parallel_size: null +encoder_seq_length: 131072 +max_position_embeddings: 131072 +num_layers: 32 +hidden_size: 4096 +ffn_hidden_size: 14336 +num_attention_heads: 32 +init_method_std: 0.02 +use_scaled_init_method: true +hidden_dropout: 0.0 +attention_dropout: 0.0 +ffn_dropout: 0.0 +kv_channels: null +apply_query_key_layer_scaling: true +normalization: rmsnorm +layernorm_epsilon: 1.0e-05 +do_layer_norm_weight_decay: false +make_vocab_size_divisible_by: 128 +pre_process: true +post_process: true +persist_layer_norm: true +bias: false +activation: fast-swiglu +headscale: false +transformer_block_type: pre_ln +openai_gelu: false +normalize_attention_scores: true +position_embedding_type: rope +rotary_percentage: 1.0 +attention_type: multihead +share_embeddings_and_output_weights: false +overlap_p2p_comm: false +batch_p2p_comm: true +num_query_groups: 8 +tokenizer: + library: huggingface + type: meta-llama/Meta-Llama-3-8B + use_fast: true +native_amp_init_scale: 4294967296 +native_amp_growth_interval: 1000 +hysteresis: 2 +fp32_residual_connection: false +fp16_lm_cross_entropy: false +megatron_amp_O2: false +grad_allreduce_chunk_size_mb: 125 +grad_div_ar_fusion: true +gradient_accumulation_fusion: false +bias_activation_fusion: false +bias_dropout_add_fusion: false +masked_softmax_fusion: true +get_attention_mask_from_fusion: true +apply_rope_fusion: false +seed: 1234 +resume_from_checkpoint: null +use_cpu_initialization: false +onnx_safe: false +apex_transformer_log_level: 30 +gradient_as_bucket_view: true +sync_batch_comm: false +activations_checkpoint_granularity: null +activations_checkpoint_method: null +activations_checkpoint_num_layers: null +num_micro_batches_with_partial_activation_checkpoints: null +activations_checkpoint_layers_per_pipeline: null +sequence_parallel: false +transformer_engine: true +fp8: false +fp8_e4m3: false +fp8_hybrid: true +fp8_margin: 0 +fp8_interval: 1 +fp8_amax_history_len: 1024 +fp8_amax_compute_algo: max +reduce_amax: true +use_emha: false +data: + index_mapping_dir: null + data_impl: mmap + splits_string: 900,50,50 + seq_length: 131072 + skip_warmup: true + num_workers: 2 + dataloader_type: single + reset_position_ids: false + reset_attention_mask: false + eod_mask_loss: false + validation_drop_last: true + no_seqlen_plus_one_input_tokens: false + pad_samples_to_global_batch_size: false + shuffle_documents: true +nsys_profile: + enabled: false + start_step: 10 + end_step: 10 + ranks: + - 0 + gen_shape: false +optim: + name: fused_adam + lr: 0.0002 + weight_decay: 0.01 + betas: + - 0.9 + - 0.98 + sched: + name: CosineAnnealing + warmup_steps: 500 + constant_steps: 50000 + min_lr: 2.0e-05 +rotary_base: 500000.0 +scale_positional_embedding: true +precision: bf16 +target: nemo.collections.nlp.models.language_modeling.megatron_gpt_model.MegatronGPTModel +nemo_version: 2.0.0rc2 diff --git a/nemo_model/model_weights/common.pt b/nemo_model/model_weights/common.pt new file mode 100644 index 0000000000000000000000000000000000000000..06484c0f4f1c25cdfe5fc7c67ff47ab62ec8592f --- /dev/null +++ b/nemo_model/model_weights/common.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df9a7b9851ff64227ad087c9f4320f1654f2c9d1a14c5e9cd3bd9ecf10de814a +size 27700 diff --git a/nemo_model/model_weights/metadata.json b/nemo_model/model_weights/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..efdcae4b720b402ac0295007ff69eefab33a2e82 --- /dev/null +++ b/nemo_model/model_weights/metadata.json @@ -0,0 +1 @@ +{"sharded_backend": "zarr", "sharded_backend_version": 1, "common_backend": "torch", "common_backend_version": 1} \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.final_layernorm.weight/.zarray b/nemo_model/model_weights/model.decoder.final_layernorm.weight/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..5048bda89e8adc4d97badae725aec120d60c3868 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.final_layernorm.weight/.zarray @@ -0,0 +1,14 @@ +{ + "chunks": [ + 4096 + ], + "compressor": null, + "dtype": "bfloat16", + "fill_value": null, + "filters": null, + "order": "C", + "shape": [ + 4096 + ], + "zarr_format": 2 +} \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.final_layernorm.weight/0 b/nemo_model/model_weights/model.decoder.final_layernorm.weight/0 new file mode 100644 index 0000000000000000000000000000000000000000..9516e235e4a980a7d28623c84e6b8421c61f323b Binary files /dev/null and b/nemo_model/model_weights/model.decoder.final_layernorm.weight/0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_0_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_0_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..af093bc040b9bfdab9ffd67f2c1c213613e5c62d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_0_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfea882a79f2bdc6691f3abffbf42f72ea90a206a873ced4c23ba225be3a52b9 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_10_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_10_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c2ed0e50688a0cbc824eee6ed07b498871987e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_10_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce2fde5075677bd348eda3e8fec4edeb648738c9160fdf341ea4bd3d502a774 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_11_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_11_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4adb79a3b81eafad2ee0f6891a7bfedf0e64cb0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_11_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7570532fbe5a7308c0eab584375a11ea5447c53c0f37baa45d0151dd0eb3f64c +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_12_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_12_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f8d86274644c9610771ede40197ca9b8eac9f58 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_12_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f25e501e97cff7e8de02864772880ba25c1f94f3df6c49aaa0b4dfec3844b1b +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_13_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_13_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f39fac0eeb29a317efec3a08fad2c0ce215c5f4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_13_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1342c024e8d734dba993c1b2703152ac728b93923959bd96668f521c614ff6f0 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_14_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_14_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ca2e850efa96d6c00c6de5ea14f639fbf9f963a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_14_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87ac81f15e7ccca8037453d164f6b0a311df1c456912d5a5845243aa9a83107 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_15_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_15_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..437ea1fcfa2ab73eee7a898eec0997704e1b4304 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_15_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d6c29a320fc3bb7ca2177396a4d262d5bb686d6ee6695e957a5259707e910fc +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_16_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_16_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e61dfaa23975967270aad806dae065cdfaa7788 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_16_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e033d5985303a093052da5d9f4dea431c518af71c277a87f5a23bf3a6be39ad +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_17_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_17_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7bd56ed532e56a11558207a37763dbc872ce002 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_17_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9495d6607a34a2ee495c8ef1a9ef72a0c5276ada44355618992a56a7404df95 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_18_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_18_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bca5e5897d482f1f14aa7573e116d9e1f552e2d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_18_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8598da7e410942c77870b4e5bde6b7a9d28391ac318438c409c9ad8e6dca52da +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_19_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_19_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f13820fcf76e40258a06b4586e83498b826ad95 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_19_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06faf86285c4b17afd70ad266428a87834326e5cf2911a7a7f75acb12222e7bb +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_1_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_1_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..89ebbac9c03995272e3df2fa62675664d6f57716 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_1_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d595d940b7304a5515a42a13db5243328cf166c05d6b389dc38ba296f895b99c +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_20_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_20_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ea979f8b1e9e7529aacc0181479dc16e1e52a9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_20_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eccd309df2ac0d7db90c90896b13b0f798e8efc5614f96659dece819f797382 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_21_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_21_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6fb7faa6a94cfff6ebdf180a413828c987073e7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_21_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d1063001f00061025ff3b86b9b03e2d4b9890486ac0fd4dd52128a0b613c637 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_22_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_22_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c4c370ddc2282ed7983afa95d8df86c57a47bf5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_22_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dfbd9465298388f8614145b4a10caab9c7f8d0d55abe62ea7b8abfc8c47d2e8 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_23_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_23_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec750c20d7ea754b7060591fc68df51db2bb12d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_23_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc13cb8c15337279cabdcfeefa23321afde337b7b1284f19824c43a0863cf76 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_24_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_24_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ebd92dcb0d34b0bd690efd0bdc2da5180f6df6f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_24_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8f7582bb9b53cf1c5fa153cef9175621b3dad029679c33aaf345766500e4d3 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_25_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_25_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e690f65e8714beb7e4217d01a10ba7cb9bd2b82 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_25_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f4e6361c8a0592b80aa747c8a0fc6d1d51fcebc316a89af4a64697edf2c228 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_26_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_26_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..855bcdfd04112b915222fc86f67f147e9ae74c65 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_26_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35fc5ddb8b6a5e8173eff44a1a258649591b98faefeb4ae37df307cfde547a8a +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_27_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_27_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd33c1ed411dcd0ce6f8c814e30f0f76671b0325 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_27_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e7685fc01ba14be5ea09d5faeb559f569b52461fd2c0cad1c16694f2a250b9 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_28_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_28_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac35976cb5928a8da7e4ccdb5356ae7bb705f31a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_28_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95929b1933ba15aeb06cc40866fb9bc4849d315e5167854256cfbb604ef140f7 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_29_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_29_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..18b725d90b3e3fd1650d0b3f1d82e0fa29091f46 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_29_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19cc67352bf8ce0ded1ad8c89a8a7d1893620b64db012b54d1585e9983c90a8c +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_2_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_2_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eedcf274f79f2090967c28473e46e4a930f08b6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_2_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486d703cc7a816327e1b18018996059a23adf9177172614e860956333dd2eef0 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_30_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_30_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..c65f52a055b7e082e0cd65885d5c0deb922e9a06 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_30_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:182b1e32fa0c27a25cd6525d3fb451cacc43f098039497d197b8af232c17956f +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_31_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_31_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..560bcd57ffc8d169bccd69b8e291d213494f7214 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_31_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a0a2cf37407340f38545d83578fb11ba1cc31dd32ba53cb6c2ef01a94e8cc8 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_3_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_3_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..453a09b5b68dbe4520a1a34bc51220e4967b3ad3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_3_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4320cf77a3d24b17bb878df3147154cec3781c7998cba60a0040af04b5fc791 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_4_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_4_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd55ac98a7bc03e00d0e77cfe691a007e0f00feb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_4_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f48b20cd6ce31054bb776dc121e2d8c860805aba3290e19ae82d80372d0d4b4 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_5_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_5_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa4f904fc32ad2778bb130a79be99caf55f0a168 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_5_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c00d72ef6d697433831669aab19149eb06a9acd1b5dde8d9bddbffc239dd1d +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_6_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_6_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..36ce60eae9a820b281c5469e683029860a30d9f4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_6_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e4978cb21be48bbb69d8455cc10f6e5e076dc85878033e24e2a2602a8bd6ad +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_7_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_7_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a75133c7bf3a3a7788686658ab1f091f3dfad7a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_7_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b4ebcae96a9f703a9dbb76d7e0a9a4a8f1842cd879e739b92a40a11242f5f1 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_8_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_8_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa615aa0df41fd59c2241f1ac26cd10c64b24096 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_8_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c1c7068de4f865aa72c7521437552e1bf92c309441fc1ad65d305302200d5e +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_9_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_9_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7061341e4ce159a3311f6dee8ebf866a52101ec --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1._extra_state/shard_9_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e95d1a0f3a9880b886738863ad1d3e2200e21959610023c0382eb3f863b29f +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/.zarray b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9e424fcff6340323a44182d5f408a4370e2438c3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/.zarray @@ -0,0 +1,16 @@ +{ + "chunks": [ + 1, + 4096 + ], + "compressor": null, + "dtype": "bfloat16", + "fill_value": null, + "filters": null, + "order": "C", + "shape": [ + 32, + 4096 + ], + "zarr_format": 2 +} \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..45aea43b73ea2d547920c550a2752faf9bc442c0 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/0.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c52677cac2a4d5b4f40e1dd4508940b2aa0aedc3 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/1.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/10.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/10.0 new file mode 100644 index 0000000000000000000000000000000000000000..96f798c2b18102ce6e22d3644f341c3ef3a097d1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/10.0 @@ -0,0 +1 @@ +>™>¡>–>1>¥>£>¡>—>>€>¯>©>œ>©>œ>>¥>˜>§>˜>¤>£>x>‘>™>¥>[> >?>¨>£>> >œ>˜>©>‘>‘>œ>i>§>w>ˆ>¡>\>>ˆ>˜>Ÿ>>©>S>œ>¡>>œ>‡>¨>E>¦>™>Ÿ>¥>¡>¥>> >˜>¬>—>¤>¦>•>…>«>£>¥>§>£>}>>;>¡>§>¨>¨>=>£>¥>£>œ>>›>©>>£>¡>©>­>¤>³>;>5>§>£> >«>¦> >§>™>•>§>—>¡>¨>£>¡>œ>>£>>>¤>Ÿ>¢>¥>¥> >¡>°>›>D>£>‡>—>£>©>¤>w>>°>ˆ>—>§>s>‹>¨>¨>ƒ>«>•>—>¤>>£>§>”>œ>m>”>>‡>ž>W>}>¦>c>©>¡>µ>©>>q>0>£>£>›>>X>¡>«> >˜>¦>Ÿ>”>¦>­>€>£>§>“><>§>£>œ>¦>,> >¥>•>£> >‡>«>¤>¬>•>¥>Ÿ>>½>•>Ÿ>—>¡>£>©>¢>—>¥>”>¨>›>w>§>“> >>¤>¡>”>¥>«>¤>£>>Ÿ>¨>£>°>Ÿ>¥> >•>œ>>±>¬>…>¯>¥>l>™>¬>­>>«>>¦>©>—>š>«>a>¡>¦>—>œ>Ÿ>¥>©>¨>¡>™>¡>«>§>£>;>§>©>£>¡>¥>µ>>¥>÷=,>§>ª>Œ>>‘>©>Y>«>”>5>µ>˜>¬>¡>>§>…>¤>>¯>>¬>G>‡>”>>>¡>e>¥>Ÿ>Ÿ>>‰>£>¡>‘>>•>£>Ÿ>œ>¥>ª>{>¯>¨>>§>©>¥>Ÿ>”>¥>¥>‹>™>>>>£>œ>¨>“>«>œ>›>›>£>š>³>£>˜>—>Ÿ>x>•>£>§>>>A>§>¥>¯>”>“>“> >§>>¡>a>“>ˆ>¬>™>o>›>£>Ÿ>¥>£>š>‘>>•>“>«>¢>©>­>£>¡>’>¨>«>œ>?>‰> >§>‘>¡>˜>”>«>€>¡>§>…>£>‡>©>£>£>—>¥>˜>S>> >‡>¨>>¨>£>>¨>Ÿ>Œ>£>G> >Ÿ>¡>«>¡>œ>¡>§>¨>w>¥>‘>›>¯>™>¥>§>´>£>£>¤>­>¥>—>¥>X>¦>£>>¤>«>™>>•>Ÿ>¡>ª>0>„>¡>—>­>£>¢>´>>‹>˜>¤>ž>¥>˜>˜> >©>¡>¡>>“>«>«>£>œ>¤>->™>¥>¨>«>œ>¡>¥>¤>­>Y>Ÿ>§>>£>E>>>>˜>=>£>˜>›>¥>“>M>©>˜>£>œ>‡>5>£>•> >«>¥>›>¡>Ÿ>p>™>˜>”>£>˜>ˆ>§>‘>Y>£>9>£>•>“> >›>£>…>‘>¡>¥>•>¨>¦>£>¯>«>¤>Œ>¤>‹>¢>>­>¦>>>¥>§>>—>­>>§>£>Ž> >3>>ˆ>§>¥>«>˜>œ>¢>—>¦>¦>¦>¬>•>‹>§>©>§>¥>¥>q> >©>™>‡>œ>>y>¥>>¢>Q>¤>°>£>>›>¡>š>>‘> >³>¥>)>«>¯>¡>¥>>¯>‘>>£>¥>©>©>ž>œ>“> >¥>>˜>S>›>˜>”>u>>¬>£>¤>“>>>™>¡>o>°>>¡>£>e>£>£>¦>¨>o>>%>¬>¡>>£>{>>‘>Ÿ>¨>“>¥>¨>™>˜>­>¯>ž>Ÿ>•>…>¥>£>¤>£>©>{>œ>¦>©>›>Ÿ>£>˜>¥>­>S>S>¥>¤>˜> >§>œ>Ÿ>«>¨>¯> > >¥>©>L>¡>>€>•>›>©>¨>—>>³>‹>X>™>£>¡>£>>Ÿ> >¿>«>o>œ>q>;>›>ª>¡>>£>¨>Œ>¨> >°>Ÿ>«>£>¥>€>™>¡>¥>>¥>£>`>—>Ÿ>Ÿ>¨>>¥>•>©>¨>©>>”>£>£>£>­>©>>‘>¯>¦>›>>¡>”>°>£>¤> >«>¯>£>¨>Œ>>’>>>ª>>«>a>Y>¬> >£>…>œ>­>Ÿ>¥>¡>£>Ÿ>œ>>™>Ÿ>…>Œ>§>­>Ÿ>©>>¥>>¦> >¡> >•>¡>™>§>¯>ž>H>§>¨> >>¤>›>[>§>©>•>™>£>ª>¡>£>y>¡>³>•>¦>k>¥>¨>¢>M>£>¤>¬>¨>¥>°>–>>¨>¥>˜>«>¦>q>§> >§>¡>¡>/>_>¡>£>©>>™>£>§>Q>£>§>œ>•>™>ž>¨>¡>Ÿ>•>­>«>¤>§>«>‹>¨>>¥>‹>˜>o>ƒ>™>›>¯>›>“>¡>£>—>­>©>˜> >H>>¥>> >>>“>£>¡>Ÿ>˜>›>¬>>>€>°>d>>¡>œ>£>)>¤>¤> >ˆ>©>”>•>¡>T>­>ˆ>Q> >£>¥>±>™>ž>±>4>¡>`>‰>³>Ÿ>>°>>¡>¥>¥>©>¥>€>§>>¤>Ÿ> >>•>£>\>Ÿ>¨>U>©>˜>§>œ>£>§>>—>œ>•>š> >­>I>¡>Ÿ>­>£>©>£>›>˜>Œ>¡>o>©>¡>£>¥> >­>£>­>?>Ÿ>§>¡>­>¯>•>£>¨>§>©>¦>ª>t>>—>1>>¨>x>Ÿ>•>£>¡>š>™> >­>\>«>œ>¥>§>p> >©>>«>œ>”>­>¥>—>œ> >A>©>œ>£>‡>;>§>™>˜>ž>©>¢>©>>°>¡>‚>‰> >ƒ>­>>¥>]>™>“>¨>ˆ>·>S>¡>™> >«>–> >§>±>¨>›>³>¦>¦>°>‰>ˆ>`>•>”>¥>•>š>¯>£>«>¨>¨> >9>+>˜>¥>¥>‹>>˜>³>£>¥>…>¡>£>>œ>š>Ÿ>Œ>«>˜>i>˜>£>Ÿ>§>¨>q>£>¡>œ>˜>§>u>Ÿ>¤>¡>¬>©>ˆ>‘>¥>‹>£>¡>‰>“>›>Y>(>”>­>…>¢>°>­>­>œ>¥>¨>¥>>¥>£> > >£>]>¡>œ>«>K>Ÿ> >œ>œ>©>¡>µ>Ÿ>“>–>Ÿ>«>Ÿ>›>>£>™>>¥>•>§>©>…>˜>S>£>d>¥>w>¡>¯>ˆ>©>™>•>£>¡>‘>™>¬>‘>¡>¢>±>«> >>§>¥>«>£>¬>>>X>™>¡>ª>œ> >˜>°>>¯>->s>°> >‰>>­> >œ>¬>¦>§>•>£>ž>­>w>«>”>§>£>‘>£>§>Œ>¥>¡>§>£>¯>˜>˜>ˆ> >œ>•>›>­>§>—>c>œ>“>©>¥>¢>¯>£>£>•>Ÿ>›>>¨>°>›>§>œ>§>>¡>>>£>­>±>‘>§>„>¡>™>>]>Ÿ>—>Ÿ>‹>“>Ÿ>c>°>˜>£>¡>¥>Ÿ>k> >–>™>£>¢>£>£>¯>¦>š> >˜>¬>A>£>©>£>§>¡>œ>”>—>¥>•>>Ÿ>¡>Ÿ>>¡>˜>¥> >©>¤>£>ƒ>Ÿ>a>©>Ž>›>™>£>¥>«>>£>ª>£>™>Ÿ>u>>Ÿ>¢>£>©>œ>¢> >©>§>›>¨>¥>«>>>¨> > >«>>¡>§>§>q>”>Œ>›>‘>¡>š>•>y>]>S>‰>‹>£>L>¦>¨>˜>—>—>˜>¡>¤>>±>‚>”>¯>¥>š>G>>•>¡>{>Ÿ>¡>—>™>{>¡>c>­>«>«>[>§>¤>µ>«>Ÿ>§>£>A>­>œ>£>¥>Ÿ>š>¥>™>œ>±>¡>> >¡>¥>q>¡>©>>Ÿ>§>­>­>Ÿ>Ÿ>³>£>¡>§>>¡> >­>¡>ˆ>Ÿ>>«>¬>œ>¤>¬>©>™>>£>„>>£>s> >”>ƒ>£>©>>™>>¡>­>¤>§>­>¥>§>;>X> >¥>‘>£>¡>P>œ>§>ª>¦>¥>…>‹>ª>¨>—>[>ž> >£>›>”>G> >§>Ÿ>­>«>“>>­>«>¤>¡> >¥>œ>œ>¥>°> >‰>¥>«>>>œ>˜>«>Ž>£> >U>™>§>›>{>¯> >‡>‡>S>>£>¢>§>˜>°>|>>§>>ˆ>d> >¨>>@>¤>§>ª>°>‹>ˆ>°>Ÿ>0>©>”>˜>‡>£>¥>>>Ÿ>©>¯>ª>£>«>§>¡>G>>¥>°>‘>¡> >>>“>m>«>£>§>­>>•>¢>Ÿ>£>¤>‘>¡>­>§>>§>”>¤> >Ÿ>H>„>œ>§>˜>¨>”>ˆ>©>¡>¨>£>¦>˜>a>£>ª>§>“>ª>£>‹>£>‰>e>¡>˜>€>Ÿ>¤> >>£>¥>¡>«>>>¨>;>¡>œ>}>u>¥>>™>>—>£>ž>Ÿ>£>«>«>£>A>‰>©>>§>œ>˜>˜>—>Ÿ>©>˜>¨>> >­>«>¢>›>¯>Ÿ>¡>¤>œ>£>Ÿ>”>‰>¥>£>œ>§>¯>Ÿ>ž>£>§> > >T>¨>«>H>˜>Ž>¡>> >£>>>>¥>Ÿ>£>£>>s>¡>T>—>­>G>›>Ÿ>>­>W>…>ˆ>—>>©>a>–>¥>˜>­>>Š>Ž>•>“>D>>‘>¡>¦> >§>>‡>‹>›>«>Ÿ>S>¤>¦> >œ>£>˜>œ>¥>˜>‘>”>¡>>”>1>¬>«>”>£>”>•>Œ>™>™>>£>‡>£>¡>>˜>s>O>£> >¬>>Y>>›>>§>¨>°>¨> >¡>Ÿ>¨>¨>¥>©>>«>£>‘>¥>œ>©>Ÿ>£>£>'>›>©>™>£>«>‘>¡>¨>›>ž>¥>›>Ÿ>Ÿ>›>¥>>©>—>˜> >›>;>>Ÿ>”>¡>«>™>•>©>ž>­> >°>¡>µ>¯>¡>›>¥>,>§>Ÿ>¬>‘>›>ž>¢>¨>¡>«>)>•>–>£>Ÿ>>š>¦>y>˜>¡>œ>>§>§>K>‘>Œ>œ>£>->°>œ>¥>>X>¡>¤> >£>¯>“>§>­>­>˜>°>¦>ƒ>˜>¨>¥>©>°> >™>S>˜> >¤>>¡> >Ÿ>£>L>±>¥>™>˜>©>Ÿ>›>¤>§>>¡>¦>G>>™>™>>>¡>>ª>¡>˜>•>—>™>¡>¥>>‘>>›>­>§>›>¨>™>™>ª>¤>›>¥>Ÿ>’>>Ž>£>a>©>‘>>ª>“>s>§>¥>>±>«>§>›>¢>­>>>—> >>›>¯>§>£>©>¨>©>->«>¤>­>›>> > >‘>§>˜>¤>©>©>œ>¡>¡>©>‰>Ÿ>Š>£>¤>‹>T>§>˜>‘>«> >˜>§>”>>­>«>«>£>¨>©> >£>Ÿ>¢>‡>¡>«>¡>˜>“>£>¤>§>š>¢>Ÿ>w>˜> >–>£>—>§> >>¡>¸>a>P>>‰>Ÿ>£>©>±>œ>§>…>£> >™>œ>œ>›>£>¥> >˜>«>—>‡>|>>±>¡>§>±>¥>­>•>›>¥>›>”>§>u>>Ÿ>¥>§>‹> >>“>¤>‡>¥> >¥>©>¨>ª>£>µ> >¤>x>£>…>>>›>M>“>¹>‹>¡>K>¢>¨>“>¥>y>™>”>‹>£>ˆ>˜>L>­>­>«>ª>°>Ÿ>§>›>>£>¦>§>°>—>¦>¦>­>5>…>ƒ>›>£>œ>©>ˆ>ª>¥>©>ª>ˆ> >™>™>¥>(>›>›> > >Ÿ>>‘>³>¡>¡>g>¡>±>£>¨>œ>¦> >˜>¥>€>¥>>«>­>§>œ>œ>š>T>£>˜>y>8>“>>µ>™>•>£>ª>œ>ª>©>¤>Q>u>§>–>™>˜>4>›>§>©>£>¨>§>¤>Ÿ>¥>¥>¡>¥>¦>µ>°>”>©>”>¬>Ÿ>¡>š>¦>š>£>ž>‘>™>¯>‹>›>>–>¥>Ÿ>¥>5>™>š>§>§>¥>ž>§>¤>œ>¡>¤>¥>–>§>©>‹>£>¡>¥>¡>Ÿ>Ÿ>¥>‘>«> >§>ª>K>¡>œ>£>›>„>«>§>ˆ>£>¥>ž>¥> >“>ª>>Ÿ>Ÿ>¢>Ÿ>‹>³>s>‡>›>¥>£>œ>¢>>©>¥>£>ˆ>™>µ>©>5> >ˆ>—>Ÿ>9>”>“>§>> > >“>™>©>­>¡>„>¥>¥>¤>¡>‹>›>•>©>>§>¥>x>x>±>¥>¡>§>¨>¥>q>£>§> >™>ª>¯>³>¥>•>>§>“>a>Ÿ>¦>Ÿ> >q>¤>£> >¥>˜> >œ>§>°>>¥>­>Ÿ>¦>£>«>E>ž>¯>Ÿ>¥>>o>˜> >ª> >¡>¨>¢>s> > >¥>›>¡>§>¦>«>¡>…>>”>¡>”>Ÿ>£>™>8>Q>©>³>©>™>¢>¯> >Ÿ>¯>™>˜> >³>˜>š>”>>K>‰>H>>ž>¨>¡>€>¤>y>>¡>©>™>¡>>7>œ>«>ª>£>¥>>œ>•>¡>…>œ>Ÿ>—>¦>«>¤>¨>™>¡>ƒ>£>¨>I>§>«>œ>£>£>—>ª>¥>¨>—>‘>­>§>«>¡>­>ƒ>œ>£>™>h>> >™>˜>¬>˜>t>\>™>§>§>§> >¨>§>©>­>±>£>Ÿ>A> >¥>>¬> >«>­>§>§>¨>h>ƒ>¥>_>™>œ>¨>¥>>¥>­>©>Ÿ>¤>¨>¥>›>•>¡>¦>¢>5>œ>™>e>>Ÿ>™>„>­>¨>¥>£>£>©>§>›>˜>¥>£>Ÿ>§>§>§>…>¥>>™>¡>8>ž>™>¥>—>—>P>c>§>©> >‡>§>—>s>µ>¯>¢>¥>>Ÿ>©>§>´>¢>±>«>­>œ>Ÿ>…>¤>—>Ÿ>­>£>¡>«>H>©>¡>¡>™>¢>P>˜>˜>¬>>˜>ƒ>§>–>Ÿ>‚>m>§>¡>£>¡>˜> ><>¨>Œ>“>Y>>Ÿ>«>©>œ>¡>£>©>¥>ƒ>`>Œ>§>˜>Ÿ>§>ƒ>>¡> >¥>¡>£>˜>“>™>S>«>§>¤>©>’>£>—>¨>?>“>9> > >—>‘>©>‰>>›>¡>­>ž>Ÿ>£>§>E>©>>ƒ>¨>™>—>™>ˆ>§>¤>£>|>œ>‹>>•>—>©>¦> >¡>¨>§>¥>¨>¥>¥>°>•>¡>¨>”>¡>¡>µ>w>£>š>›>—>›>Ÿ>¢>¥>¡>š>¨>•>A>‹>©>¦>•>£>«>¥>¥>£>c>§> >©>§>¤>¦>> >«>£>>£>£>­>¥>‡>›>Ÿ>¨>£>œ>§>—>¨>§>£>§> >¡>§>¦>“>¤>H>˜>>«>h>¡>§>­>¥>£>|>8>>¡>—>«>›>K> >a>>°>œ>£>”>¬>§>> >³>™>ª>£>«>•>£>¡>\>k>¦>>3>™>­>Ÿ>0>‰>Ÿ>>§>˜> >¤>¥>¬>¡>›>Œ>±>—>‘>ƒ>>>>¸>”>¦>«>£>£>¨>©>­>…>>\>”>ª>¬>—>¡>¨>X>¯>“>™>­>¨>«>[>¨>”>§>«>ª>—>¬>£>•>¡>¨>†>°>“>£>˜>‡>¡>œ> >>«>¡>›>>©>e>™>˜>>­>”>¡>m>¨>•>«>Ÿ>¨>Ÿ>‰>”>Ÿ>•>¡>¨>>L>•>§>¥>”>s>›>>¯>«>”> > >ª>¢>•>¥>™>‹>Ÿ>­>¥>•>™>>¯>c>Ž>Ÿ>T>™>˜>œ>>­> >¢>™>>¡>¥>£>¢>°>¥> >†>©>¬>”> >°>ƒ>¥>˜>•>ª>Ÿ>œ>«>©>U>§>‰>°>>¨>¥>£>±>¢>©>S>Ÿ>Œ>™>«>¡>£>¥>•> >>°>¡>˜>™>£>‘>«>›>ƒ>>§>™>©>¬>w>¥> >¡>1>­>Ÿ>¤>£>ƒ>š>£>¤>§>¡>“>s>±>­>S> >E>©>¨>™>£>¦>£>˜>”>&>>{>>¡>…>Ÿ>›>>©>>™>œ>¡>ƒ>°>…>‚>–>«>£>š>©>¯> >­>¤>o>£>«>¥>¤>†>H>T>©>›>>¡>©>¢>£>¡>¨>£>‡>Ÿ>›>§>¡>>¡>¡>©>©>§>Œ>¨>ª> >™>•>§>¥>;>§>¤>™>«>U>¥>¯> >£>«>§>§>«>¡>¡>ˆ>œ>>©>>£>‘>§>£>¢>Ÿ>©>“>£>Q>¥>¨>‰>™>±>y>¨> >«>§>•>¥>>ª>>«>o>±>°>¥>>£>¡>•>W>¡>‘>¨>š>¥>©>¡>Ÿ>>>9>œ>­>¡>›>£>Ÿ>¥>“>•>˜>—>>©>£>K>¬>‹>—>¬>Œ>¦>¥>>>­>£>™>¥>“>¨>£>>Ÿ>3>¡>i>Ÿ>§>>¦>§> >¥>X>¡> >>¨>o>£>£>§>­>™>“>£>©>±>Ÿ>£>©>˜>›>§>¥>‘>“>¡>‡>›>‘>©>œ> >>¯>«>> >>«>¡>>¡>§> >¥>¤>¤>œ>§>Ÿ>‡>›>¥>•>˜>­>£>˜>«>§>¡>¡>¤>\>”>­>¥>>«>’>¡>œ>§>¥>«>›>¡>>3>›> >£>¦>¨>¬>¡>£>§>¡>Ÿ>˜>¡>¥>>>°> >§>£>Ÿ>¥>—> >³>Ÿ>#>=>>¦>>¬>—>˜>>¨>£>¥>™>=>¥>¡>_>’>¡>Ÿ>ª>“>›>¡>¬>­>¡>©>›>>©>Ÿ>›><>«>>™> >£>•>Y>0>œ>¥>ž>>>8>£>ž>§>«>™>‹>¤>¬>°>«>¡>¨>«>ž>˜>—>©>©>w>˜>¤>>¥>‡>«>¥>£>£> >±>>¤>¬>£>§>>¥>§>–>£>œ>¢>¤>—>>¤>£>Ÿ>œ>™>¡>™>£>§>£>¬>¢>˜>§>>>¡>L>¢>±>¡>§>§>¬> >œ>>@>8>¦>£>¥>> >œ>a>ž>©> >¥>Y>Œ>>ˆ>©>>œ>™>—>˜>”>¯>H>>Ž>—>£>ž>Ÿ>©>”>}>Ÿ>£>Q>>˜>‰>­>¢>­>q>•>°>¢>¨>§>¡>Ÿ>¨>•>—>G>•>™>…>>©>­>Ÿ>š>™>>1>>‘>”>£> >¨>§>­>œ>­>œ> >œ>£>…>µ>£>˜>—>‘>µ>ž>§>£>¥>±>©>¡>­> >­>™>¢>;>©>›>•>±>>£>“>«>x>>¡>§>£>™>”>•>¡>¡>¡>¡>£>©>›>§>¦>¡>>¡>™>Ÿ>›>“>d>Ÿ>>‘> >“>>—>±>£>­>­>h>¤>¥>¥>œ>7>¡> >£>¯>¥>9>>{>¡>>„>¢>>«>˜>§>›>¡>£>…>>§>™>«>±>§> >¢>—>Q>©>¥>°>—> >œ>>£>«>s>O>„>1>X>¤> >§>©>Ÿ>­>¡>§>©>ž>£>­>¨>¨> >©>£>¬>§>Ÿ>£>§>§>¡>•>¡>¨> >‡>¥>¢>•>£>Y>>™>¯> >œ>™>¦>“>“>¦>|>«>X>5>‹>£>©>¡>«>{>¡>£>™>p>¡>¥>«>¥>¥>q>µ>˜>>›>©>œ>…>«> >¯>>¥>>¦>™>E>™>¥>¤>x>«> >§>¥>}>¤>¯>O>”> >£>œ>·>•>¯>‘>—> >¯>§>«>¥>>­>ª>¢>­>›>‹> >¥>™>¥>…> >7>¬>«>£> >“>•>>>™>>§>Ÿ>©> >>¥>L>¥>›>£>¨>œ>K>§>¥>¥>™> >±>|>ž>¨>œ>©>Ÿ>€>¬>¯>¡> >m>«>˜>¨>™>ª>™>¥>£>¡>¦>£>œ>œ>‘>•>§>¡>Ÿ>¤>™>>˜>­> >—>¨>¡>­>¡>Ÿ>£>>©>£>£>£>©>>©>—>¦>§>>›>Œ>™>§>> >¨>>Ÿ>‘>‘>¡>§>ž>¥>—>>‘>§>«>y>«>•>œ> >˜>¤>«>š>­>«>«>›>£>W>>>¥>£>¨>¤>§>>¨>–>¡>³>£>¥>>>§>u>¡>£>œ>>¥>¦>7>œ>\=œ>¥>¨>¨>¡>¨>]>­>©>£>£>>¥>œ>š>©>™>¦>§>>£>¬>¡>>¡>“>¥>ª>Ÿ>‰>˜>¡>›>”>e>+>˜>ˆ>›>”> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/11.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/11.0 new file mode 100644 index 0000000000000000000000000000000000000000..6795576f2b400b39147728839ef3584a95feeb42 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/11.0 @@ -0,0 +1 @@ +¡>›>£>˜>X>©>§>£>œ>¥>ƒ>±>­>>«>Ÿ>Ÿ>­>•>§>˜>¨>¥>…>’>š>¥>d>£>Y>©>£>”>¢>›>>¬>˜>•> >t>«>‚>>¤>m>>>›>¡>…>­>d>ž>£>ž> >ˆ>«>e>ª>›>¤>©>£>¨>£> >˜>¯>™>©>­>˜>ˆ>°>©>§>§>§>ƒ>“>[>¦>£>«>«>x>«>«>¥>Ÿ>¡>Ÿ>°> >§>¢>­>±>§>¬>_>Q>«>¥> >±>¨>§>¥>>—>§>™>¥>¯>¥>¡>>>Ÿ> >£>¥>Ÿ>¥>¨>§> >©>³>Ÿ>H>§>‰>œ>©>«>¨>„>ž>°>‹>›>«>€>‘>©>ª>‡>ª>˜>—>©>Ÿ>§>«>—>¢>u>”>>‰> >i>€>«>s>¬>¦>¸>¯>œ>{>@>¥>§>>>e>£>¬>£>›>«>Ÿ>—>§>¯>‡>©>­>—>`>¨>§>ž>¯>G>£>©>—>¡>¥>‹>­>«>¯>˜>«>£>K>Ç>”>§>˜>£>¥>°>§>™>£>™>«>™>„>­>”>¥>“>¦>§>•>«>«>£>¤>>£>°>¢>­>¥>©>Ÿ>—> >>±>»>‰>´>©>{>›>°>±> >¯>œ>¨>­>˜>>­>t>¥>­>›>>£>§>¬>§>£>—>¡>­>«>¥>W>§>«>¥>¡>¥>¸>¥>©> >4>«>­>>‘>”>­>m>­>—>Y>µ>™>­>¡>>¨>‰>­>•>±>>±>i>>™>›>>¡>q>©>¤>> >‹>¡>¡>™>“>š>«>>œ>£>­>€>µ>¯>‘>©>­>©>Ÿ>”>ª>¨>>›>Ÿ>‘>>¤>Ÿ>ª>•>¯> >™> >§> >µ>§>™>—>¥>{>”>¥>©>‘>“>I>¨>¬>­>™>•>™>¡>¬>¤>£>h>’>‰>«>œ>{>£>£>£>¥>¬>›>“>Ÿ>—>–>­>«>¥>±>¤>«>—>«>¯>œ>S>‹>¥>¥>”>£>›>™>°>ƒ>¢>¦>‹>¥>Š>¯>¤>£>”>¦>œ>k>œ>¥>‰>ª>Ž>¨>§>¥>¨> >>¥>`>¥>¡>¤>­>¥>>£>§>­>ƒ>©>”>>±>>¥>¨>»>§>¨>­>±>¥>›>«>e>«>£>”>¥>­>›>‘>–>¡>§>©>S>ˆ>£>Ÿ>°>£>¥>»>“>>™>§> >¨>>›>¤>«>£>¤>‘>™>­>°>¥> >¨>M>>¦>©>±>Ÿ>§>§>«>°>h>¦>«>œ>¦>a>>¡>‘>›>W>¦>›>œ>¦>—>c>°>™>¥>Ÿ>‹>K>¤>˜>£>­>«>£>¥> >>›>›>“>§>š>‹>©>•>q>«>Y>£>›>˜>£>>§>‡>”>§>©>—>¯>±>¥>¯>­>«>’>¥>>¡>‘>µ>©>>Ÿ>«>©>˜>˜>µ> >©>£>>£>Q>‘>‹>­>«>°>™>Ÿ>§>™>©>¦>¨>±>•>>¬>«>­>£>¨>€> >ª>ž>‹>ž>¡>>¨>ž>£>l>­>µ>¥>‡>Ÿ>Ÿ>›>•>“>¡>´>«>S>­>±> >¨>˜>±>”>‘>£>©>°>­>£>£>—>¡>©>“>›>l>Ÿ>>˜>>¡>°>¥>¨>•>œ>£>œ>§>{>³>¥>£>§>l>§>©>¥>«>{> >G>±>£>>§>ƒ>>—>>©>”>§>«>>>±>´> >£>—>ƒ>ª>¥>§>§>ª>€>¡>«>­>>£>§>™>¯>°>]>c>­>§>Ÿ>Ÿ>ª>™>Ÿ>±>©>±>Ÿ>£>§>«>e>¢>“>ƒ>™>>«>«>>>µ>‘>g>›>£>¡>§>’>¢>¡>À>°>}>Ÿ>€>T>>«>«>“>¡>­>‘>§>¡>µ>¡>«>¥>¥>…>›>¥>§>ˆ>«>¥>i>™> > >­> >§>˜>­>©>«>¡>•>¤>¥>¥>±>©>Ÿ>–>°>«> >“>£>˜>±>¥>§>§>«>¸>¤>«>‘>¡>”>£>‘>­>ž>«>l>m>­>£>¥>> >±>Ÿ>¥>Ÿ>§>ž>¢>“>›>¢>Œ>‘>¬>¬>¡>­> >©>ˆ>§>>§>¤>˜>¡>>«>°>¡>P>«>©> >•>¨>™>u>©>¨>˜>™>¡>«>£>£>ƒ>§>½>™>«>{>§>¯>§>c>§>§>«>«>§>´>”>>«>£>™>°>§>}>©>¡>«>¡>£>K>i>£>¥>¥> > >¨>©>h>¥>«>ž>˜>™>>¯>¢>Ÿ>—>³>µ>©>§>­>Ž>«>>§>‘>œ>€>ˆ>™>œ>µ>ž>•>©>¥>—>¬>«>˜>§>l>œ>§> >£>>>—>£>¥>£>›> >°> >>…>³>q>‡>¦>Ÿ>©>P>¥>«>¢>‘>±>•>•>¥>o>³>Œ>i>¥>§>«>­>¡>Ÿ>´>Q> >o>‰>·>>‘>³>›>¡>§>£>©>¥>‡>«>“>ª>¡>¥>Ÿ>—> >q>Ÿ>«>m>±>™>§>¡>¤>¨>¡>˜> >•>>£>¯>X>¤>£>¸>£>¯>¥>£>š>“>¥>y>­>¥>¨>©>£>¸>¥>³>H>Ÿ>§>£>³>·>˜>¨>¬>©>©>§>°>€> >˜>M>¢>­>>¥>•>¢>§>Ÿ>›>£>­>m>¯>Ÿ>¨>¬>€>£>­>¡>°>Ÿ>—>­>§>›>¢>£>_>«> >£>Œ>S>¥>™>™>¡>©>¢>©>‘>µ>¥>ˆ>Œ>C>ˆ>¯>‡>©>m>>•>ª>Œ>µ>h>¡>> >¯>™>>¨>·>­>>½>¥>§>³>>Œ>l>˜>”>­>™>Ÿ>­>§>°>­>¨>¡>=>Q>›>¬>©>”>‰>š>°>ª>§>…>§>§>¦>Ÿ>ž>Ÿ>>¬>™>}>>¥>£>¨>«>h>©>£> >>¨>}> >§>¡>°>§>>•>¨>‘>©>¥>‹>š>>o>/>—>±>ˆ>¡>µ>¯>°>>­>«>£>>©>£>£>>£>p>¥> >­>[>>£> > >­>Ÿ>¹>¡>—>™>>¯>Ÿ>Ÿ>>ª>›>’>§>š>§>«>Œ>š>c>¥>y>­>ƒ>£>°>Œ>©>œ>•>©>£>’>™>°>”>Ÿ>¥>±>¯>£> >«>¥>©>£>°>>>k>™>£>¬>™>£>˜>³>P>´>4>{>³>£>>£>±> > >­>§>¬>˜>¤>Ÿ>±>>¬>™>©>£>”>¨>©>>©>¥>¯>¥>¬>˜>œ>Œ>¡> >˜>Ÿ>°>§>—>c>>—>«>¥>£>±>©>¦>š>§>>‘>­>±> >«>¡>¨>>£>£>Ÿ>¥>°>´>“>«>‰>£>œ>…>k>¡>›> >Œ>•>£>s>±>š>§>£>­>§>w>£>—>œ>¥>¥>¥>­>·>«>œ>¡>™>±>W>£>«>£>©>§>¡>™>œ>¨>›> >¢>¥>Ÿ>>©>›>ª>Ÿ>¯>¬>§>¥>£>u>¤>•>¡>˜>¥>§>°>ˆ>£>«>£>Ÿ>£>€>”>£>§>ª>±>›>£>¨>«>©>Ÿ>©>©>°>“>¡>¯>£>£>­>>¡>«>ª>€>•>>Ÿ>”> >™>™>}>e>h>>>©>e>«>«>˜>™>˜>>¥>§>>±>‰>™>­>¥>>`>Ÿ>—>¥>…> >¥>>Ÿ>…> >p>±>«>°>h>¬>©>»>±>¥>©>§>a>³> >¥>§> >>ª>˜>œ>³> >Ÿ>£>§>ª>>§>­>Ÿ> >«>±>°> >Ÿ>µ>§>¡>§>…>§>£>³>§>Š>Ÿ>¡>©>°>>«>±>­>š>¢>¡>ˆ>ƒ>¤>|>£>—>ˆ>¦>§>¡>>£>¤>­>§>­>³>§>§>W>o>£>§>˜>¢>¥>`>›>­>­>§>ª>‰>>­>­>›>i> >¤>£>>›>[>£>©>£>°>«>‘>¡>°>°>¨>§>£>¥>Ÿ> >©>¹>¡>>¦>±>£>>>™>­>>¥>¥>i>>©>¡>ƒ>µ>£>‹>Š>h>>§>§>«>Ÿ>µ>ƒ>‘>°>Ÿ>>|>¤>©>”>[>§>«>«>µ>>‹>±>¡>L>¯>˜>™>‹>ª>§>Ÿ>> >©>³>¬>©>«>¨>¨>c>•>§>³>“>£>£>”>—>”>{>­>§>«>°>›>˜>§>¥>§>§>•>Ÿ>¯>¦>>ª>•>§>¥>§>[>‡> >¥>>­>™>Œ>­>¤>­>¨>§>›>d>£>°>­>•>©>«>>§>>s>£>™>„>©>§>¡>¡>©>©>¡>«>>Ÿ>­>Y>¦> >…>‡>­>‘>›>Ÿ>>¨>¥>>¨>¬>­>£>h>Ž>©>>¨> >>›>›>£>«>›>¨> >£>µ>°>¦>›>¯>œ>¥>§>¥>¥>£>˜>›>§>§>>ª>±>£> >£>ª>¥> >m>¯>­>9>•>>§>ˆ>£>§>Ÿ>¡>Ÿ>©>£>§>§> >|>§>d>™>³>a>Ÿ> >¥>³>g>Œ>‹>>>­>s>˜>«>™>°>£>>”>”>”>]>‘>‘>£>©>¡>­>Ÿ>‹>>›>­>¢>l>§>§>£>Ÿ>§>˜> >¦>>“>—>£>ž>›>O>«>©>•>©>—>›>‘>> >ƒ>§>Œ>¤>¦>H>™>w>h>¨>£>¯> >i>”>£>¤>§>­>±>ª> > > >­>©>­>«>>°>©>“>­>Ÿ>°>Ÿ>¥>¥>Y>>­>>¥>­>‘>¥>­>>¡>¥>¡>¡>¡>ž>ª>“>«>˜>›>£>>Y>‘>¡>˜>§>­>›>•>«> >­>£>¯>¥>µ>µ>¤>>§>X>­>¦>°>˜>œ> >>©>¥>³>O>œ>™>¨>£>£>Ÿ>«>ƒ>›>§>œ>£>©>­>\>“>>œ>£>a>³>ž>§>’>e>¥>¬>¦>¥>¯>˜>¨>±>°>›>µ>©>ˆ>ž>°>¥>­>µ>Ÿ>›>m>™>>¨>>¡>¡>¡>¢>c>³>§> >˜>¨>¡>Ÿ>£>©>Ÿ>¡>§>]>¡>›>> >?>©>•>«>¢>™>™>™>œ>¡>©>A>•>>>­>«>>­>˜>›>«>¨>>ª> >‘>¡>‘>£>k>§>”>ˆ>­>•>>«>§> >³>«>¨>œ>§>³>”>‘>›>©>>£>³>©>£>«>©>­>E>±>£>±>œ>ƒ>£>¢>•>¬>›>£>­>¯>£>¤>§>­>ˆ>£>‹>¡>¨>>k>¨>>”>­> >ž>©>—>•>±>«>­>¢>­>«>¥>£>£>¥>ˆ>¥>°>¡>›>—>§>©>¬>>§>¡>€>™>£>•>ª>ž>«>¥> >£>¹>u>h>H>Œ>£>¡>¨>´>œ>©>Š>¥>£>š>Ÿ> >œ>¨>§>¥>>°>™>‹>…>Ÿ>±>£>¥>°>¨>«>›>>£>›>ž>£>|>˜>£>«>­>>£>¡>—>­>>§>¡>¥>«>¯>­>©>¼>¤>¥>>¥>‡>‡>ˆ>Ÿ>`>•>·>>¥>[>§>­>“>§>…>›>›>>¥>Œ>Ÿ>p>±>³>±>­>±>¡>­> >“>§>£>¨>µ>›>§>©>¯>Y>‡>ƒ>Ÿ>§> >­>‹>­>©>­>°>>¡>¢>œ>µ>I>Ÿ>™>$>¡>£>•>—>³>¥>£>t>£>³>¥>°>¥>©> >>§>…>©> >°>³>«>Ÿ>>œ>s>§>Ÿ>…>U>”>¡>·>›>š>¥>¨>¡>«>­>¥>g>†>¥>—>›>>A>ž>§>«>§>«>¬>¥>§>§>«>¤>«>©>¼>¯>>«>•>±>£>§>›>ª>>§>Ÿ>˜>›>³>‹>£>£>š>ª>£>«>T>Ÿ>>«>«>©>£>§>¬>>¤>§>¥>›>­>©>Œ>¥>¥>£>£>¡>¡>«>‘>°>£>«>¨>_> >>§>>ˆ>±>§>Œ>¥>§>¢>¨>¤>•>ª>“>¡>¡>£>£>>¹>€>Œ>œ>§>©> >¨>„>­>©>¡>‰>>½>­>[>¡>Œ>™>£>Y>˜>”>°>‘>¥>§>”>>­>­>£>‹>§>§>«>¢>Œ>>™>«>‘>©>¨>>ƒ>µ>­>£>ª>«>¨>}>§>«>£>›>«>¸>µ>¥>ž> >©>–>x>¢>¨> >>{>§>§>¡>¤>›>¥>Ÿ>©>­> >§>±>¡>«>¥>±>P>¡>³>¡>¦>“>>>¡>¯>¢>£>¨>¤>}>£>£>ª>¡>£>©>©>©>¥>‡>Ÿ>—>¢>•>¥>©>>Y>i>«>¸>©>˜>§>µ>¡>£>³>>™>¥>·>>>˜>‘>c>ˆ>[> >§>­>§>ƒ>©>€>‘>£>ª>›>§>Ÿ>W>¦>±>¯>¨>§>>¡>—>§>ˆ>>¡>™>£>­>§>«>›>¢>†>¨>«>c>§>¯>›>§>§>œ>©>£>¯>™>”>´>©>³>¤>±>…>›>¥>>u>•>¡>Ÿ>›>°>™>‡>k>›>¯>­>«>¥>¥>§>³>¯>³>©>£>d> >¨>>±>¡>¬>¯>©>«>­>t>…>«>k>¡>¡>«>¨>Ÿ>©>°>­>¥>£>­>¯>>“>£>¨>¥>E>>˜>i>£>¥>œ>‰>¯>­>¦>©>¥>«>¨>›>>ª>¥>£>¬>©>ª>‹>§>‡>¢>§>H>Ÿ>›>§>œ>˜>_>p>§>¯>£>†>©>•>{>µ>´>£>£>¢>¢>¬>·>·>¦>µ>­>«>> >‹>¥>™>¡>°>£>£>¨>]>ª>¥>¥>ž>¦>_>™>›>¯>Ÿ>œ>‹>­>™>Ÿ>…>x>©>£>£>¦>›>£>O>¨>>•>k>¡>Ÿ>¯>¬>œ>£>¥>­>¨>…>m>•>§>™>Ÿ>­>>£>¥>§>«>£>¥>œ>”>œ>c>¯>«>§>§>’>©>˜>¯>`>•>W>¡>¤>—>•>©>>¢>œ>œ>±>Ÿ>Ÿ>ª>§>_>«>“>‹>«>Ÿ>œ>ž>Œ>ª>«>§>{>Ÿ>>“>˜>”>­>§>¡>¥>©>©>§>«>§>©>¯>™>§>ª>•> >£>µ>„>¨>™>›>>›>¡>§>¥>£>›>°>›>Y>>­>«>—>§>«>¦>©>£>m>«> >ª>§>¬>§>>§>­>£>>¥>¥>µ>«>‰> >¡>«>«>>­>™>¬>§>§>©>£>§>§>¨>™>§>@>›>“>³>x>¥>«>¯>©>©>ƒ>H>£>£>™>­> >[>£>s>¡>³>Ÿ>¥>—>­>«>’>E>¸>œ>­>«>°>—>«>£>i>w>¬>Ÿ>X>™>³>¥>5>›>Ÿ>>§>›>£>¥>¨>°>£>™>>´>Ÿ>˜>Œ>ˆ>‘>Ž>¿>–>¥>«>¬>¥>ª>«>­>‹>¡>€>”>¯>¯>˜>¥>¬>m>µ>‘>>­>«>°>s>«>—>§>­>©>›>«>¥>—> >­>Œ>«>”>£>˜>Œ> >>¡>”>­>£>œ>”>±>p>>—>ž>µ>˜>£>{>«>š>¯>£>«>£>‹>•>£>—>£>ª>Ÿ>s>˜>¨>¦>—>}>Ÿ> >°>­>”>¦>£>­>¥>˜>«>¡>>¡>¯>¤>•>œ>‘>±>w>Ž>¥>k>>™>¡> >°>¥>§>ž>>¥>£>¥>£>¸>¥>¡>ˆ>¬>«>•>£>°>‡>¥>˜>™>©>¡>Ÿ>¯>«>g>§>>³>£>¤>©>§>´>£>¬>h> >Œ>™>¬>£>£>¥>˜>¥>>±>¢>›>ž>§>”>¯>¥>ˆ>¡>­>>«>­>ƒ>©>¥>¥>X>±>>¥>¥>…>œ>£>§>©>¥>•>“>µ>­>h>Ÿ>a>«>­>>§>©>£>™>”>E>>…>‘>¥>‰>¢>›>¡>¨>£>œ>›>§>‡>µ>Œ>‡>›>­>¤>™>±>°>£>¯>¨>{>¡>¯>¨>¬>‡>a>]>­>ž>…>£>³>¦>§>¥>­>¥>Œ>¢>›>ª>§>ž> >¥>«>«>­>>­>©>£>›>˜>¨>¥>]>©>¨>›>¯>p>§>¸>£>£>³>ª>­>¬>¥>¨>>›>¡>«>œ>©>”>§>ª>§>¤>­>“>¥>a>¥>¨>>›>µ>>­>£>¯>¨>’>§>“>°>>­>{>³>³>­>Ÿ>©>§>•>p>¡>‘>°> >§>«>§> >’>“>S>Ÿ>°>£>Ÿ>§>Ÿ>§>”>™>>›>¢>­>£>h>«>>˜>­>Œ>«>¨>“>†>³>«>›>«>˜>©>£>„> >T>£>y>¡>ª>¡>¨>¨>¥>§>k>©>¤>”>«>y>¨>¢>¨>°>˜>•>§>¯>µ>¡>©>­>›>œ>§>§>•>”>£>> >™>¬>>£>–>³>­>¡>¢> >³>¤>¢>£>­>£>©>«>£>>«>£>Œ>Ÿ>©>•>™>«>§>™>ª>«>£>¡>¤>k>˜>¯>¨>“>«>•>¥>¡>©>§>­>œ>£>>U>›>£>¨>«>«>±>¥>«>¬>£>Ÿ>›>¡>¨>Ÿ> >°>¢>­>¥>Ÿ>§>—>§>¸>¥>E>`> >¬>£>°>›>Ÿ> >«>§>ª>Ÿ>X>§>¥>m>•>§> >¬>˜> >¥>±>±>£>­>œ>£>«>¢>Ÿ>Y>±>£>œ>¡>£>”>s>8>>¥> >‰>‘>S>©>£>©>­>Ÿ>>¤>³>µ>­>£>ª>°>Ÿ>š>˜>«>¬>€>™>©>Ÿ>©>Œ>°>§>§>¥> >°>C>£>°>¥>­>“>©>­>—>¦>œ>£>§>š>>§>§>£>Ÿ>œ>¡>>©>­>¤>´>¡>™>©>”>”>¥>h>¥>µ>¦>¯>¯>¯>¡>¤>¡>]>c>§>£>§>›>¤>Ÿ>h>£>°>£>§>…>>Ÿ>Œ>«>•>¡>ž>›>›>—>³>_> >“>—>¥> >£>­>•>…>£>¦>k>>›>>°>¦>±>s>–>µ>¢>¬>¥>¥>£>©>”>˜>W>˜>›>ˆ> >­>¯>¢>Ÿ>> >Y> >•>–>§>Ÿ>­>«>­>>±>›>¢>Ÿ>¥>‰>³>£>›>˜>‘>»> >«>§>©>³>«>¥>­>Ÿ>«>š>£>Y>­>>š>³>£>¡>—>±>€>Ÿ>§>©>§>›>˜>•>§>§>¥>§>©>«>¡>°>«>£>…>£>>¡>Ÿ>•>w>¥>£>˜>¥>•> >>·>£>±>±>x>¥>©>§>¢>U>£>£>§>³>ª>[>£>†>¥>•>‰>£>”>©>™>«>›>§>¤>‹> >ª>›>«>¹>«>£>¨>›>g>­>­>µ>™>¢>¢>¡>¨>¬>‚>h>Œ>U>o>¨> >«>«>Ÿ>°>£>«>°>Ÿ>§>°>©>«>¡>­>¢>¯>­>>§>«>§>¨>•>£>«>§>>«>£>˜>§>u>£>>³>¥>ž>>¨>—>—>¦>…>«>q>[>>§>­>¤>°>ƒ>£>¦>œ>x>§>¥>¯>¦>§>€>¸>—> >ž>¦>Ÿ>>«>¥>´>>¥>Ÿ>©>™>O>˜>¨>¨>„>¯>£>­>«>„>¥>±>U>•>¡>£>¡>·>›>µ>–>™> >µ>£>°>«>¡>µ>¬>¥>±>Ÿ>Œ>¥>©>›>ª>‰>¡>Y>±>­>¥>>–>™>“>Ÿ>ž>¡>­> >©>¥>>¥>[>«>›>¥>¬>¡>c>¬>§>¦>ž>£>µ>ˆ>Ÿ>­>™>­>¡>…>­>µ>¥>£>>­>›>©>œ>­>˜>©>§>£>­>§>š>™>”>>§>£>ž>¥>Ÿ>‘>›>­>£> >°>¥>µ>¥>Ÿ>§> >­>¡>£>§>¯>>¯>—>©>«>“>>>œ>©>>¡>ª>>>š>“> >¨>£>©>—>¡>“>©>°>>­>™>>¡>š>¡>¯>›>±>©>µ> >¤>o>Ÿ>…>¥>©>©>¨>¬>¡>«>›>Ÿ>±>¨>¨>D>Ÿ>§>ƒ>£>£>›>ˆ>ª>©>X>>Œ=œ>¥>©>¬>¥>­>i>µ>«>©>§>¢>©>£>>­> >§>¨>‰>§>°>§>>Ÿ>”>©>«>¥>>>¥>>˜>x>K>›>>™>“> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/12.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/12.0 new file mode 100644 index 0000000000000000000000000000000000000000..6200258220c0e5c230e21467f03d7732fd94d5a8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/12.0 @@ -0,0 +1 @@ +Ÿ>œ>Ÿ>™>‰>§>¥>£>Ÿ>¡>‰>±>­>›>§>>›>¨>•>©>™>ª>¥>‰>•>—>§>€>¢>}>¦>¢>”>>Ÿ>>­>˜>—>ž>„>ª>‡>‘>¥>>›>“>>¢>>«>> >Ÿ>Ÿ>¡>>¬>…>©>>£>¨>Ÿ>¤>¡>¡>™>¨>›>¥>¦>™>‰>«>§>¥>¥>ª>ˆ>—>>£>£>©>ª>‘>§>¤>¢>>£>š>­>Ÿ>§> >«>¯>¥>³>>>¬>¦>ž>­>¥>¡>£>›>›>§>Ÿ>£>­>£>£>¡>‘>>¡> >¤>>¥>§>¨>Ÿ>§>°>>h>£>>›>§>§>¥>‡>>¯>‘>›>¨>‡>•>¤>§>‹>­>š>›>©>>¡>§>˜>Ÿ>„>™>“>>›>„>ˆ>©>„>©>£>¹>±>›>„>c>¤>§>ž>“>€>Ÿ>ª>¡>›>¨>Ÿ>•>¡>­>‹>¥>©>>ƒ>£>¤>Ÿ>¬>p>Ÿ>§>˜>¢>§>>¨>§>­>™>¥>Ÿ>…>½>•>¦>™> >¥>«>¤>™>§>›>¨>›>‹>©>–>§>•>¥>¦>—>©>¬>¤>£>>Ÿ>­>¡>«>¢>§> >›>>>­>µ>Œ>°>§>…>>­>«>›>­>>§>©>™>Ÿ>©>ƒ>¥>¨>›>›>£>§>ª>©>¢>›>£>­>§>¥>p>¨>­>£>Ÿ>£>³>£>©>>e>¬>§>“>“>”>«>>­>”>ˆ>¸>™>«>£>‘>£>Œ>ª>—>°>•>­>…>>™>›>“>¡>ƒ>¦>¥>>ž>>¤>>—>•>>¨>>>§>­>‰>±>ª>“>©>­>¤> >—>¨>©>“>>Ÿ>—>‘>£>>§>˜>«>™>œ> >¥>Ÿ>´>¥>›>™>Ÿ>„>—>£>§>•>“>d>¥>§>©>š>•>—>Ÿ>©>£>¤>>—>>ª>›>…>ª>§>¡>¥>©>>•>Ÿ>”>—>­>§>§>¬>£>§>˜>¤>ª>>{>>¦>§>”>£>˜>™>«>…>Ÿ>§>>§>—>©>§>¡>—>¤>œ>}>>£>>©>>¨>¦>£>§>¡>>¥>€>¢>¡>¥>¯>£>›>§>£>«>‰>¨>”>>±>Ÿ>¡>¨>´>£>§>§>­>¥>™>¥>}>¨>£>˜>¥>©>›>•>™>¡>¡>ª>ƒ>Œ>£>>­>¡>£>·>—>>˜>£>>§>›>š>Ÿ>«>¨>¥>“>™>©>©>¥>¡>§>t>›>ª>§>¯>Ÿ>¤>¨>§>¯>}>¡>¦>¡>¢>>“>>“>¡>‚>¤>™>>§>—>}>­>™>¦>Ÿ>>}>Ÿ>—>Ÿ>­>©>Ÿ>§>Ÿ>‡>>™>“>¨>ž>>¥>•>€>§>ƒ>¥>˜>—>Ÿ>>£>‘>—>¡>¥>˜>­>¨>£>©>¬>§>•>¢>>¡>“>µ>§>‘>¡>¤>«>—>—>¬>Ÿ>­>£>•>Ÿ>‡>‘>>©>¥>«>›>>¥>›>¥>£>¥>­>˜>>©>¨>ª>¥>©>†>£>¨>Ÿ>>¡>£>ˆ>ª>›>¢>ˆ>«>±>£>‰>›>¥>ž>•>”>£>·>©>‡>«>³>¢>§>—>°>—>•>¡>©>¯>¬>> >™> >£>•>›>‚>›>›>—>>¡>¬>¢>£>‘>Ÿ>>š>§>…>´>§>£>¨>}>¥>¡>©>§>…>>w>°>¥>Ÿ> >‰>“>•>>§>•>¨>§>›> >¯>³>Ÿ>¥>›>‹>©>£>£>¤>¤>ˆ>¡>©>§>œ>¡>¢>˜>©>­>|>}>¬>§>›>¡>§>>£>¯>§>±>¥>Ÿ>£>ª>„>¡>“>‰>›>œ>§>§>Ÿ>•>µ>‘>€>›>¡> >§>“>>£>Ì>¨>…>>‰>p>>¥>§>—>£>©>’>§>£>±>¡>ª>§>¥>Œ>›>¨>¥>>¥>¥>y>˜>Ÿ> >§>¡>£>š>«>©>­>Ÿ>—>£>¥>¥>¯>ª> >—>°>ª>œ>‘>¥>˜>­>¨>£>§>§>·>£>¨>“>£>‘>£>>§>>©>€>…>©>¢>§>“>¡>¯>Ÿ>¤>>§>Ÿ>Ÿ>“>›>¡>>“>¬>ª> >§>›>¡>Œ>©>Ÿ>¢>£>™>¢>>©>­>Ÿ>p>¥>ª>Ÿ>˜>§>™>ˆ>«>§>˜>›>¥>©>Ÿ>£>‰>¦>¸>˜>¨>‡>¤>«>¦>}>¥>§>¬>§>¨>³>—>‘>¬>¡>˜>­>§>„>©>Ÿ>©>£>£>|>ƒ> >¦>§>£>Ÿ>§>§>}>£>§>ž>˜>™>>¬>Ÿ>¡>˜>°>±>§>¥>©>‘>§>‘>§>”>˜>‰>Œ>>Ÿ>°>>—>§>¡>˜>­>­>˜>§>>ž>§>£>£>“>‘>š>¤>£>£>> >­> >>Š>­>ƒ>Š>§>>¦>‡>£>¦>¢>•>¯>—>—>Ÿ>€>«>>‹>¥>¥>§>µ>£>>³>>¢>ƒ>>³>›>>¯>>Ÿ>¤>£>ª>¨>‹>ª>“>¨>Ÿ>¥>¡>•>¢>>Ÿ>©>€>¯>™>§>¤>§>¨> >—>Ÿ>•>›>Ÿ>¯>u>¡>Ÿ>±> >°>§>Ÿ>›>•>§>…>­>Ÿ>§>¥>£>±>¥>¯>t> >§>£>±>´>š>¤>§>§>§>¥>°>‰>>™>>Ÿ>«>ˆ>¥>”>¡>£>£>›>£>§>ƒ>­>›>¨>ª>ˆ>¥>ª>¢>­>Ÿ>—>©>¨>>Ÿ>¤>u>¬>ž>£>>…>¥>›>›>Ÿ>©>£>§>“>°>£>>>>‹>«>Œ>§>‡>›>—>¤>>¸>€>¢>š> >ª>›>Ÿ>§>´>¯>>³>§>¥>±>‘>Œ>€>—>—>§>—>ž>¯>¥>«>©>§>¡>o>ƒ>™>©>§>•>>>¯>¥>ª>Œ>¤>¥>Ÿ>›>>£>“>­>œ>ˆ>™>¥>Ÿ>©>©>ˆ>¨>£>Ÿ>Ÿ>¨>‡>Ÿ>§>ž>¬>§>“>—>©>“>¥>¡>>—>>…>W>—>¯>‹>¡>µ>¬>³>œ>§>§>§>‘>¥>¡>£> >¡>ƒ>¡>Ÿ>ª>‚>>¢>Ÿ>¡>©>Ÿ>±>¢>•>> >­>>Ÿ>’>§>™>•>©>>§>©>>š>€>£>…>§>Š>¨>­>>©>Ÿ>˜>£>£>”>™>¯>˜> >¤>°>­>£>Ÿ>ª>¦>©>£>­>•>’>>›>¥>©>™>¢>˜>¯>x>±>c>…>±>£>’>£>­>£>Ÿ>©>¥>§>™>£>Ÿ>¯>ˆ>«>—>§>¡>•>£>§>“>¥>£>©>£>¬>›>Ÿ>>Ÿ>£>™>œ>°>¥>˜>{>›>•>¨>¥>¡>³>©>¨>›>¤>›>‘>­>­>Ÿ>©>Ÿ>¥>“>¡>Ÿ> >¥>°>±>–>§>>¡>Ÿ>>‚>Ÿ>›> >>—>Ÿ>€>­>Ÿ>¤>Ÿ>©>¡>‹>¡>™>œ>¥>¤>£>­>­>­>›> >˜>¯>„>¡>¥>£>¨>£>¢>š>™>¥>š>Ÿ>¢>§>Ÿ>>§>œ>¥>Ÿ>¬>§>©>§>¡>ƒ>¥>•>›>›>£>¥>±>Ž>£>ª>¥>£> >‡>—>£>¥>¥>­>>¢>§>©>§>Ÿ>¥>©>­>•>Ÿ>°>¡>£>ª>’>£>©>§>†>•>“>Ÿ>˜>¡>™>˜>‡>>ƒ>’>‘>¥>y>§>§>›>›>›>›>¢>§>“>«>Œ>™>«>¥>Ÿ>w>Ÿ>š>§>‰> >£>œ>Ÿ>‰>ž>‚>³>©>°>>¨>§>½>°>£>¥>§>{>­>>§>¥>>Ÿ>§>›>Ÿ>±>Ÿ>Ÿ> >¥>§>„>¥>¯>Ÿ>Ÿ>©>­>±>Ÿ>Ÿ>µ>§>Ÿ>©>Œ>¥>¡>±>£>>Ÿ>ž>­>¬>>§>¬>©>™>Ÿ>£>>Š>£>‡>£>™>>¨>§>Ÿ>›>¡>¥>°>£>ª>¯>¥>¥>>}>£>£>›>Ÿ>§>y>›>©>©>§>£>>‘>©>¬>›>€>Ÿ> >¢>Ÿ>—>y>¨>§>¡>­>«>—> >¯>­>¤>©>¡>§>>¡>£>µ>>’>¥>¬>£>Ÿ>Ÿ>—>ª>“>Ÿ>Ÿ>y>>§>Ÿ>‰>¯>¡>>‘>€>“>§>¤>ª>š>³>ˆ>•>­>¢>“>•>Ÿ>»>“>…>§>­>«>³>—>>¬> >s>¨>˜>>>¥>§>Ÿ>“>›>§>·>©>£>©>¦>¤>ƒ>š>§>°>•>£>£>•>™>“>…>­>¤>ª>«>¡>™>£>¤>¥>©>“>¡>¯>£>‘>§>—>¡>¡>¤>q>>Ÿ>¥>Ÿ>ª>—>>¯>¡>£>§>ª>™>}>©>­>©>™>§>£>>¤>>…>¥>›>Œ>£>¥>¤>Ÿ>¦>§> >ª>>›>©>{>¢>Ÿ>Œ>‹>§>’>Ÿ>Ÿ>›>§>£> >¥>¬>¯>£>‹>>­>“>§>>Ÿ>›>›>¢>©>›>¥>Ÿ>¡>±>«>§>˜>³>œ>£>§>¡>§> >š>¨>¦>¥>›>©>»>£>Ÿ>Ÿ>©>¤>>ƒ>«>¬>h>—>>¥>>£>§>¡>Ÿ> >§>¢>£>£> >‡>¤>ƒ>™>´>>Ÿ>>§>­>€>‘>‘>›>™>­>‡>˜>£>›>«>¡>’>—>—>˜>„>“>’>£>§>Ÿ>¨>>>‘>œ>«>Ÿ>>£>§>£>›>¥>›>ž>§>›>™>™>¤>Ÿ>›>ƒ>«>­>™>§>™>š>‘>›>>‡>¨>>¥>¢>s>›>…>>¦>£>¯>¢>>˜>>¢>§>©>­>©>¢> > >ª>«>­>¬>Ÿ>­>©>•>§>Ÿ>­>¢>¥>§>‹>¡>¨>>¥>«>–>¤>©>Ÿ>¡>¤>Ÿ>Ÿ>Ÿ>>¥>“>§>˜>›>¢> >†>‘> >—>¢>¯>›>™>©>¡>«>¡>°>¥>°>°>§>Ÿ>¨>ƒ>¬>£>­>˜>œ>>Ÿ>§>¥>±>‡>›>›>£>¡>Ÿ>Ÿ>¨>ˆ>>¥>Ÿ>¥>¨>¬>y>š>‘>>¢>–>¯>œ>©>“>w>¥>¨>£>£>­>—>©>°>³>›>³>¥>>˜>­>¢>ª>´>Ÿ>›>>›>Ÿ>¥>“>£>Ÿ>Ÿ>¡>ƒ>±>ª>Ÿ>˜>§>Ÿ>¡>¥>©>Ÿ>¤>£>}>>›>›>Ÿ>‚>©>•>§>¡>›>˜>–>Ÿ>¥>¤>„>™>Ÿ>>¯>¤>Ÿ>«>š>›>¥>£>Ÿ>­>>•>Ÿ>“>¢>†>§>—>>§>•>‡>ª>£>Ÿ>´>¬>¨>›>£>°>“>–>›>¨>“>¡>³>¤>¤>«>¨>«>a>­>¥>¯>>ˆ>£>¡>˜>«>›>£>­>«>¢>£>¨>¬>>¢>>§>¥>“>ƒ>©>›>“>¨>¡>›>§>—>•>­>©>ª>¢>¨>«>£>£>¢>¡>Œ> >­> >›>˜>©>¨>­>›>¥>Ÿ>‡>˜>¡>˜>§>>«>¤>£>¢>¸>„>‡>ƒ>‘>¡>£>©>°>›>§>>¤> >›>>Ÿ>Ÿ>¥>¥>¤> >«>›>>‰>Ÿ>µ>¡>§>¯>¨>­>™>¡>£>Ÿ>¹>£>‡>—>¤>ª>«>“>£>Ÿ>—>¡>‘>¤>¢>¥>­>­>­>¥>´>£>¤>‡>£>>Š>Œ>>y>•>¸>“>£>>§>ª>š>¨>‡>›>>™>£>>›>>­>´>°>¯>¸>Ÿ>­>¡>•>©>£>¨>´>>§>¥>¬>…>‹>>Ÿ>¨> >§>>­>©>©>«>>¡>¢>œ>µ>k>›>><>>¡>“>—>´>Ÿ>¥>ƒ>£>±>¡>«>£>§> >>¦>>§>Ÿ>±>°>§>>™>›>>¦>>‹>{>•>›>±>›>—>¨>¥>Ÿ>¨>¥>¥>>‰>§>—>š>>K>Ÿ>§>«>¥>°>©>£>¢>£>©>¡>§>§>·>­>™>§>•>­>£>£>›>¥>>£>Ÿ>™>Ÿ>¯>Ž>>¡>›>ª>¢>©>u>›>›>ª>§>£>¡>§>©>¡>£>£>£>›>­>¨>>¥>Ÿ>£>¥>¡>¡>¥>•>­>¡>¥>§>y>¢>>§>œ>>¬>£>>¥>¥>Ÿ>§>£>•>ª>‘>Ÿ>£>¢>¡>>´>„>Œ>›>£>¨>¢>£>‹>«>§>£>>>¼>ª>€>¤>>š>£>y>›>•>­>•>¥>£>™>Ÿ>©>¬>¥>>§>£>¨>¡>>Ÿ>Ÿ>¬>•>§>¨>>…>±>ª> >«>©>§>ˆ>¢>§>Ÿ>˜>§>±>±>£>›>Ÿ>§>—>ˆ>¡>ª>Ÿ>Ÿ>‡>Ÿ>¡>>¢>>£> >©>­>Ÿ>§>­>Ÿ>©>§>­>d>Ÿ>­> >¤>”>‹>›>¢>­>¥>£>§>¥>‡>¡>£>¬>¡>¢>§>¥>«>£>>¡>—>¢>™>£>¥>›>>|>§>±>¨>•>£>±>Ÿ> >°>>›>£>´>›>›>™>—>u>‹>}>Ÿ>¡>­>¥>‰>¨>…>•>§>§>›>£>Ÿ>ˆ>¡>«>­>§>¤>“>Ÿ>™>¥>‰>>¡>›>£>­>©>«>§>¡>ˆ>£>§>>§>­> >¡>¤>›>©>£>«>™>™>­>¤>¯>£>±>Œ>›>£>Ÿ>>—>Ÿ>›>>­>›>•>„>>§>¯>§>¤>§>¥>°>¬>³>§>¡>Š>£>ª>‘>«> >«>¯>¤>«>ª>ƒ>‰>§>>¢> >©>¥>>§>±>ª>¥>­>­>©>›>—>¢>§>¡>h>Ÿ>™>€>Ÿ> >›>>«>ª>§>ª>¤>¬>©>Ÿ>œ>§>¡>£>©>¦>¥>>¨>Œ>Ÿ>¦>g>>™>¥>™>˜>|>€>¨>¯>¤>‹>§>—>„>µ>°> >¦>¡>Ÿ>§>·>³>¥>±>ª>¬>˜>Ÿ>Œ>¤>›>¢>«>¤>Ÿ>§>>©>¥>£>ž>¥>{>›>>­>Ÿ>›>>¯>˜>>‰>ƒ>ª>¤>¤>¤>>¡>x>¥>>›>€>›>>°>©>œ>£>£>©>¥>Œ>ƒ>™>§>™>£>«>ˆ>¢>¥>¤>ª>¡>¤>™>•>›>>­>¨>©>§>”>Ÿ>—>ª>}>•>>¡>£>™>•>©>>¢>>œ>­>¡>Ÿ>£>¦>€>«>–>‹>§>ž>>Ÿ>“>­>¥>©>‰>Ÿ>>‘>˜>—>¬>¦>Ÿ>¢>§>¨>£>©>¥>¥>°>˜>£>§>—>Ÿ>¡>µ>‰>¥>›>›>›>™>¢>£>¥>§>¡>©>>{>>°>§>—>¥>«>¤>§>¤>ƒ>¬>Ÿ>ª>¥>¥>¥>”>¥>ª>£>•>¢>£>¯>£>>>Ÿ>§>§>Ÿ>­>›>«>­>£>ª>£>§>¤>¥>™>¥>m>œ>“>­>…>¤>§>­>©>©>ˆ>h>£>£>—>§>Ÿ>€>Ÿ>‚>Ÿ>±>Ÿ>¤>™>©>¬>“>ƒ>µ>>­>¨>ª>›>¦>£>>ƒ>©>Ÿ>{>›>¯>Ÿ>`>§>¢>“>©>›> >¦>§>©>¡>˜>>µ>>¢>>‹>•>‘>½>›>©>­>£> >©>«>«>‹>Ÿ>‹>•>¨>­>˜>¥>­>>°>“>Ÿ>°>¨>±>€>©>•>¤>«>¥>—>¨>¡>—>Ÿ>©>‘>±>•>¢>™>>¡>Ÿ>£>•>¯>£>Ÿ>“>¬>>›>˜>>³>•>¡>…>¨>™>©>£>©>>>™>¡>—>Ÿ>©> >…>™>©>§>—>„>›>¡>°>­>˜>£>Ÿ>ª>Ÿ>™>ª>¢>>£>«>©>š>ž>•>±>‡>‘>¡>>›>š> >>¯>¡>§>›>ž>£>£>£>¢>µ>£>Ÿ>Œ>©>«>™>Ÿ>¯>>¥>—>™>§>>¡>¬>©>€>ª>“>¯>¡>¤>©>¡>µ>Ÿ>ª>„>¡>‘>˜>©>>£>£>™>£>Ÿ>°>¢>›>›>¢>—>¨>ª>Œ>œ>©>>«>«>‰>¤>¡>¥>†>°>›>£>¡>‡> >¦>§>©>¡>›> >µ>µ>€>Ÿ>w>­>©>Ÿ>¥>¤>¡>œ>—>‚>>>‘>¢>Œ> >›>¡>§>Ÿ>>›>£>Œ>­>‘>‰>˜>©>£>>¬>­>¥>«>§>‡>£>°>§>©>>|>|>©>Ÿ>‰>£>¬>§>§>¥>©>£>>>›>¥>£>>¡>¤>©>©>©>>©>§>¡>Ÿ>š>¢>§>‹>§>¨>˜>µ>„>¤>¹>Ÿ>¡>­>§>«>¬>£>¥>“>›>Ÿ>©>›>¦>—>¥>©>£>£>©>—>¤>u>¢>§>‘>>³>ˆ>¬>¡>ª>¥>–>¥>“>«>Ÿ>©>‰>¯>³>§>¢>§>£>—>>¤>”>­>Ÿ>£>©>ª>›>“>“>y>¢>¬>Ÿ>>¥>>£>‘>—>™>•> >¤>¥>{>§>“>—>ª>‘>«>¤>“>‰>¯>§> >©>›>ª>¢>‰>Ÿ>>§>„>Ÿ>£>Ÿ>¥>©>¡>¥>{>¥>¢>•>¬>„>Ÿ>Ÿ>§>¯>›>˜>¥>«>µ>>§>«>™>™>¥>§>–>•>£>’>>™>ª>>£>•>ª>«>¡> >>­>¤>>£>©>¡>§>©>§>›>§>¡>‘>>§>˜>>©>§>›>§>§>Ÿ>£>£>€>™>­>§>“>ª>•>§>>©>¤>­>›>£>>…>Ÿ>Ÿ>¤>¥>«>­>£>ª>§>Ÿ>Ÿ>›>£>§>£>>­> >¨>¢>Ÿ>¤>™>¬>¹>£>p>{>>©>Ÿ>±>š>œ>Ÿ>§>£>«>Ÿ>…>¥>¦>ƒ>˜>¦>£>§>—>Ÿ>¥>¯>¬>£>­>> >­>›>>‡>­>£>>¢>¡>—>„>k>>£>Ÿ>>“>o>¥>Ÿ>¨>¬>Ÿ>“>¥>¯>³>«>¥>§>°>Ÿ>˜>›>©>¬>ˆ>›>¥>>«>>°>£>¥>¤> >±>>£>«>£>ª>•>§>©>—>£>›>£>¤>›>Ÿ>¥>¥>¥>œ>>¨>›>¤>¯>£>¯>¤>™>¥>•>“>¥>€>¥>°>£>ª>«>¯>Ÿ>£>>x>ˆ>©>¤>ª>ž>¡>>ƒ>£>¯>£>¥>˜>“>¡>‘>ª>—>£>—>š>—>˜>³>p>¡>”>—>¥>Ÿ>Ÿ>«>˜>Œ>£>£>Œ>’>›>‘>©>¥>°>>™>¬>¡>«>¥>¤>¢>§>•>™>}>˜>›>>¡>«>«> >›> >Ÿ>}>Ÿ>–>•>§> >¯>§>­>Ÿ>¯>Ÿ>£>Ÿ>¤>>±>£>›>—>–>´>Ÿ>¬>¥>©>¯>©>£>¯>>©>›>¢>ƒ>¥>›>š>±>£>¢>˜>§>ˆ>›>©>§>¥>›>™>—>¥>¥>¤>¥>§>«>Ÿ>©>§>Ÿ>‰>¡>>¢>ž>•>> >¢>•>Ÿ>“>Ÿ>›>³>£>§>°>…>§>§>§>Ÿ>s>¡> >£>±>§>y>¤>‰>¡>—>> >•>§>š>«>Ÿ>¥>£>>ž>§>>©>´>©>¡>¦>˜>{>­>§>³>>Ÿ>¡>£>¤>ª>ˆ>…>>ˆ>>ª>Ÿ>¨>«>Ÿ>«>¡>©>ª>>§>­>¨>§>¡>©>¢>­>«> >¦>§>©>£>—>¢>ª>¥>>¥>>›>¢>‚>¥>›>µ> >ž>>§>—>•>¤>‹>©>€>>>£>©>¢>«>ˆ>Ÿ>¥>>„>¡>£>­>§>£>‡>¸>—> >>¦>¡>™>­>£>­>>§> >¥>›>m>š>£>§>‹>­> >©>§>‹>£>°>>›>¡>¤>¢>´>˜>°>™>™>Ÿ>³>¥>­>§>¢>µ>¨>¥>°>Ÿ>>Ÿ>©>˜>§>Š>£>{>°>­>£>¢>”>˜>“>ž>™> >¬>Ÿ>ª>Ÿ>“>¡>€>§>Ÿ>§>­>ž>>­>¤>§>Ÿ>>°>>ž>ª>›>­> >‹>©>¯>¥> >ƒ>¯>™>­>™>©>›>§>§>£>ª>¥>›>š>—>>¥>£>>­>¡>•>™>­>¡>›>¬>¥>­> >>¦>>«>Ÿ>£>¥>«>‘>­>˜>¨>©>“>Ÿ>>ž>§>“>ž>§>œ>>—>•>¡>©>¥>¨>”>¡>•>§>­>ˆ>«>›>>Ÿ>›>¡>«>>³>¥>¬>Ÿ>§>>Ÿ>‹>§>§>¨>§>«>Ÿ>©>—>¡>µ>¦>«>‡>>¥>>§>¡>Ÿ>‹>ª>©>Š>>w=Ÿ>¢>©>§>¡>ª>€>¯>¨>¤>¥>>§>£>™>¨>Ÿ>¥>§>>§>­>¨>¢>>™>§>©>¢>>>£>>—>ƒ>{>˜>“>>“> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/13.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/13.0 new file mode 100644 index 0000000000000000000000000000000000000000..4a1fbf0664f31e7a036041c30b8c4fb63167374a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/13.0 @@ -0,0 +1 @@ +¥>£>§>ž>™>¯>ª>©>§>«>>±>°>¥>¯>£>£>­>¡>ª>¡>­>ª>—>›>¡>­>‡>¯>>¬>§>>ª>£> >¯>¡>>§>>±>•>—>ª>‹>£>›> >§>•>«>Œ>¥>¨>§>§>˜>°>”>³>¢>«>«>§>©>©>«>Ÿ>­>¡>¨>¯>>•>±>¬>°>­>±>”>Ÿ>>«>¨>©>°>¡>°>­>ª>¥>¨>¥>­>¥>©>¤>´>°>­>±>–>>¯>¬>§>±>°>«>¢>§>Ÿ>¬>£>«>«>§>«>¤>›>¨>­>§>¥>¥>¬>°>­>§>©>³>Ÿ>H>ª>”>£>­>­>ª>‹>©>µ>˜>¥>¯>Œ>›>°>±>—>¯>¡>Ÿ>°>¥>ª>­> >¨>Œ>£>œ>’>ª>>>­>Š>¯>©>½>³>§>>5>¬>°>§>Ÿ>>©>°>©>¥>¬>¥>¡>«>±>–>¬>±>¡>’>ª>­>§>±>ˆ>§>­>¡>©>¬>›>­>«>°> >©>©>“>¿>>©>£>ª>ª>´>©>¡>«>¡>­> >“>­> >©>Ÿ>ª>¯>™>³>°>­>©>™>§>°>§>±>¥>­>©>Ÿ>Ÿ>£>±>¼>•>³>ª>ˆ>§>°>³>¨>³>¥>«>¯>Ÿ>£>­>>«>­>Ÿ>¥>«>¯>¯>±>¥>¡>©>³>¯>­>X>­>­>©>©>«>µ>«>°>ü=A>°>­>œ>˜>Ÿ>´>>¯>>>½>¤>¯>ª>>­>˜>±>¡>±>›>µ>—>š>Ÿ>¤>>¤>‹>¯>¬>£>©>­>§>¨>ž>œ>¡>´>¥>§>ª>µ>”>µ>³>›>­>­>«>£>›>©>±>›>¥>¡>ž>™>§>£>­>›>°>¡>¤>¤>ª>£>µ>­>£>£>¨>ˆ>Ÿ>­>°>—>Ÿ>E>­>°>¯> >œ> >©>«>ª>«>‰> >›>­>Ÿ>>©>¨>¨>¨>­>£>Ÿ>¥>Ÿ>Ÿ>­>­>«>³>­>ª>>°>­>¢>Œ>—>­>­>œ>«>Ÿ>¡>¯>‹>¦>«>—>§>©>±>¬>©>>ª> >>¤>©>•>±>›>¯>­>©>«>§>—>«>ˆ>­>§>§>°>ª>£>¯>«>¬>‘>¯>Ÿ>§>°>¡>«>­>¸>«>©>°>´>§>¡>¯>‹>ª>©>>°>°>¨>Ÿ>¡>¬>ª>°>™>”>«>£>±>ª>©>¸>>š>¡>¨>©>­>£>£>§>°>¥>§> >¢>¥>¯>ª>¦>­>Œ>¡>­>«>´>§>¬>©>©>­>…>§>©>§>­>>œ>§>ž>¥>‘>­>¡>£>­>>Š>´>>«>¥>£>‹>§>Ÿ>©>³>©>¤>­>§>“>£>¡>¡>¬>£>™>¯>>’>ª>“>¨>Ÿ>¡>¨>§>©>£>›>¨>«>Ÿ>µ>°>­>°>³>­>›>¬>˜>«>Ÿ>¸>¯>™>¤>§>­>Ÿ>Ÿ>±>§>«>¬>™>§>>™>›>¯>«>´>Ÿ>¤>¥>§>§>ª>±>µ>£>˜>­>°>­>¬>­>Ž>§>­>¥>”>¥>«>“>­>§>ª>“>±>´>ª>•>£>©>£> >›>£>µ>­>–>´>³>«>¯>>´>Ÿ>›>§>­>³>±>¥>­>£>§>­>>£>‘>§>£>¢>>«>³>¨>¬>>§>¨>£>«>>·>«>©>¬>‚>¬>­>¯>¬>Œ>¡>‰>µ>­>§>©>“>›>Ÿ>¢>­>œ>ª>°>¢>£>´>µ>£>­>¤>}>°>¨>©>­>©>‘>¨>­>­>¥>«>«>£>¯>·>y>>­>«>¢>¥>°>¤>§>±>¬>·>§>¨>ª>³>‘>§>Ÿ>•>£>¢>¯>¯>§>š>·>>Ž>¤>¬>ª>©>¢>£>§>ã>³>>§>“>}>£>­>­>Ÿ>¦>­>š>«>ª>¸>¥>¯>ª>­>”>£>¯>ª>>ª>«>[>>¥>¥>°>©>©>¡>¯>«>¯>§>Ÿ>¨>ª>«>µ>«>§>Ÿ>µ>­>¥>>¨>Ÿ>­>­>­>«>¬>¹>©>³>›>§>™>­>>­>¥>¬>Š>Œ>±>¨>ª>›>¥>³>£>«>¥>ª>¡>©>›>£>§>—>š>µ>¯>ª>­>¥>ª>•>­>¥>¨>¬>Ÿ>«>¤>³>µ>¤>\>¬>©>¥>>­>Ÿ>Œ>­>ª>Ÿ>£>­>¯>­>ª>>¬>¼> >­>>¬>±>«>…>©>­>¯>­>ª>³>¡>˜>³>©>¤>¯>­>>±>ª>´>§>£>‹>|>¥>­>ª>°>§>±>ª>{>§>­>©>ž>£>§>¸>§>§> >±>µ>­>­>°>›>°>›>¬>>¥>>™>¥>¡>³>¥>ž>«>©>Ÿ>°>¯>£>­>œ>©>¬>§>¨>™>›>Ÿ>§>§>¬>£>¨>±>§>•>‘>µ>>“>­>£>¯>“>¥>¯>°>>±>œ>Ÿ>§>>µ>—>˜>«>ª>­>·>§>¨>µ>>©>>“>µ>¥>™>³>§>§>«>«>±>¯>—>³>™>¯>§>©>§>›>©>Š>¥>°>„>´>Ÿ>ª>©>©>­>©>Ÿ>§>œ>¡>«>´>_>©>§>·>§>¯>¬>¤>£> >¯>>µ>¨>¯>¬>¨>·>©>°>O>§>­>­>³>·>¡>©>­>­>­>¨>¯>”>¢>¡>Œ>©>µ>‘>ª>œ>§>§>¥>£>©>°>ƒ>°>§>°>ª>“>­>³>¦>°>£>¡>¬>°>£>¤>¬>Œ>ª>§>©>›>‘>­>¥>¡>§>ª>©>«>ž>µ>©>“>š>>•>´>‘>­>‹>¤>ž>±>–>¸>Š>«>£>§>¯>¥>§>¦>¹>µ> >³>ª>¨>´>>•>>Ÿ>>­>£>£>±>«>±>±>­>§>H>™>¡>­>¯>>›>¤>±>¨>­>”>ª>­>­>¥>§>¥>˜>³>¡>>¢>­>§>¯>©>p>­>ª>¯>§>­>“>¥>©>¥>¯>­>›>Ÿ>«>™>­>¨>”>£>£>‘>*>ž>µ>—>¥>¹>±>¸>¡>­>­>©>™>§>§>­>©>©>Š>«>§>±>>¢>©>§>§>°>£>¸>«> >£>¨>³>¥>£>>­>¥>›>°>¡>°>°>˜>¡>Œ>­>‘>­>—>¨>¸>›>°>¥>¡>¯>§>£>Ÿ>´> >¥>¨>°>°>ª>¨>¬>¨>­>§>µ>¡>Ÿ>Œ>¥>«>°>¡>­>Ÿ>±>>±>4>Ž>±>©>—>©>µ>©>©>°>«>§>£>¯>¥>³>‹>¯>™>¯>©>Ÿ>©>­>›>«>«>°>©>³>¢> >˜>¥>«>£>¡>±>«>¢>_>¥>¢>­>§>©>±>­>«>¤>©>¡>›>³>³>¥>±>¥>­>>¬>©>§>©>±>¸>Ÿ>­>•>¥>£>>>§>£>©>–> >ª>>´>£>°>«>­>§>‡>§>>£>ª>«>ª>¯>´>°>¤>¦>Ÿ>¹>–>¦>­>©>­>¬>¥>¥>¢>­>¡>¤>©>°>¨>š>¬>>ª>§>°>­>¯>±>£>>©>>§>£>¬>ª>·>•>«>­>­>¨>§>‘>>©>­>«>µ>¡>ª>«>­>­>£>­>­>³>›>¥>³>§>©>°>>¨>«>­>’>Ÿ>™>£>Ÿ>§>Ÿ>¡>‘>‡>>˜>™>ª>ˆ>³>¬>¡>¡>¢>£>§>ª>š>°>”>Ÿ>¯>©>¥>ˆ>¦>¡>ª>>¢>«>£>¥>“>¥>>·>ª>³>Œ>°>°>»>¸>­>­>«>ˆ>¯>¤>­>­>¥>§>­>£>£>µ>¥>§>¥>¬>°>>ª>±>§>¥>­>°>³>«>£>¸>§>§>©>‘>¬>©>»>©>™>¥>§>¯>°>¤>¯>·>³>¡>£>¥>•>>§>>ª> >™>«>¬>¨>¥>¤>§>­>©>­>´>¨>«>“>‹>§>¬> >ª>«>†>¡>°>°>«>©>“>™>­>µ>£>‰>¥>§>§>§>Ÿ>ˆ>­>¯>¨>±>­>Ÿ>¤>³>°>«>­>§>­>¥>£>«>¼>¤>—>ª>¯>ª>£>£>£>±>›>©>¬>‹>¢>¬>¦>>±>ª>˜>“>>ž>«>¯>­>¡>³>™>™>³>¡>›>©>¨>Ã> >“>­>°>°>±>>™>µ>¥>‡>­>¡>£>˜>­>­>¨>œ>¥>­>¸>¯>­>­>­>¬>>Ÿ>¬>±>>ª>©>ž>§>›>‘>°>­>­>°>¥>Ÿ>­>¨>©>¬>>¥>·>«>›>°>>ª>¥>©>…>•>§>ª>£>°>Ÿ>™>³>§>±>§>«>Ÿ>c>©>°>³> >­>ª>—>¨>™>‘>©>£>—>«>­>©>¨>¨>­>¥>¯>§>¥>±>ˆ>ª>¨>“>•>°>™>¢>¥>¢>©>¨>§>ª>µ>±>§>›>™>¯>Ÿ>­>¤>¢>£>¡>©>­>£>«>§>­>µ>¯>ª>¢>·>¤>­>­>¨>¯>«>Ÿ>©>¬>©>¡>«>Å>§>¤>¥>°>­>§>>±>±>E> >™>«>•>§>­>«>§>§>«>¥>¨>¬>¨>’>ª>>£>¹>•>£>¨>©>­>Œ>—>—>£>£>°>‹>¡>ª>£>°>¨>—>Ÿ>>Ÿ>—>>>­>­>¥>­>¥>˜>›>£>±>¦>>¬>­>­>¥>ª>¡>¥>°>¥>>¡>§>¥>£>“>°>±>>¯>Ÿ>>›>£>¡>”>¯>“>«>¨>‘>£>>„>¬>§>³>£>>Ÿ>§>©>¯>­>µ>«>§>¥>¥>°>±>´>­>¦>³>­>>«>¤>³>¦>©>­>¡>¤>±>§>¯>±>ž>ª>¯>¥>©>©>§>©>§>£>±>>­>>Ÿ>¦>£>˜>›>§>£>«>³>Ÿ>Ÿ>­>¥>±>«>µ>­>±>µ>¢>¡>¯>>¯>¨>³>›>£>¥>©>­>«>³>“>¡>¢>ª>ª>¢>£>¬>>§>­>¤>©>¯>±>}>Ÿ>™>£>§>¯>±>£>¬>>y>©>­>ª>¯>±>Ÿ>«>±>µ>¢>·>­>•>¡>¯>­>­>·>§>¡>‹>Ÿ>¥>©>›>«>¤>¦>§>ˆ>µ>­>¡>©>­>¥>¦>«>ª>©>§>ª>ˆ>¨>£>¡>§>>±>Ÿ>±>¥>£>¡>Ÿ>£>¬>¨>‘>¡>£>£>±>«>¥>°>¡>¡>©>©>¦>±>§>—>¤>•>§>‹>«>›>“>µ> >“>°>«>¥>µ>­>­>¤>«>³>›>š>¡>©> >§>¸>¯>ª>±>µ>°>M>³>«>±>§>ƒ>ª>©>¡>³>Ÿ>­>´>³>§>ª>°>³>™>©>›>ª>­>›>>­>§>Ÿ>°>§>¡>­>Ÿ>›>°>ª>­>©>±>­>§>¬>«>§>•>©>°>¬>¡>>­>«>¯>¡>«>§>>¢>¥>>¬>¦>°>¤>£>©>¸>Œ>>•>š>¨>©>¯>·>£>­>•>ª>§>¡>£>©>¤>­>ª>¨>£>³>¡>™>“>§>·>­>§>³>°>­>ž>¥>¬>¥>Ä>­>Œ>¡>¨>­>«>•>¨>©>¡>­>>¯>§>«>¯>µ>±>¬>½>©>©>>ª>™>‘>—>¥>„>¡>»>—>£>…>­>­>Ÿ>­>‘>¥>¥>©>ª>•>¦>y>ª>³>³>´>½>©>«>§>›>«>«>­>¹>¢>©>­>³>“>‘>•>§>¬>§>°>—>³>ª>°>«>•>¨>§>¥>Ë>‡>¡>¥>>¥>§>›>¢>·>©>©>‹>¬>¸>ª>µ>«>©>§>£>­>•>¬>¤>°>µ>­>¦>>£>>©>£>™>ˆ>¡>¦>³>Ÿ>>ª>­>¥>°>§>¬>‹>“>¬>£>Ÿ>¥><>§>­>°>­>µ>¯>©>©>«>°>§>«>­>¸>¯>Ÿ>¯>Ÿ>´>©>«>£>¬>§>¯>¥>¢>¡>±>•>¢>§>¢>¯>§>ª>ˆ>¥>¤>­>¯>¬>«>­>°>¥>©>¬>«>¡>°>«>™>£>§>©>­>©>¦>­>›>³>¥>¬>¯>‰>§>§>­>£>“>­>¬>™>ª>©>£>¬>©>ž>°>>¨>§>ª>¤>•>³>>•>¡>­>«>¥>«>•>°>­>ª>“>£>½>³>>§>—>£>¬>ˆ>Ÿ>Ÿ>­>œ>­>ª> >¢>°>µ>§>š>¯>«>°>§>›>§>Ÿ>¬>˜>¯>«>>”>°>±>§>¯>­>«>>¨>ª>§>¤>°>³>±>ª>¡>§>«>>>§>°>©>£>>§>¨>§>¨>¢>¨>§>­>±>£>­>±>§>¯>ª>±>L>¥>µ>£>­>ž>–>¥>¦>³>«>¬>¯>§>>§>¬>¯>§>¥>­>ª>¯>¨>•>§>¡>§>>§>­>¡>‡>‹>­>µ>°>œ>«>¸>£>§>³>¥>¢>­>¸>¡>¥>ž>¡>>‰>Ž>¦>©>­>©>•>¬>>™>¯>¯>£>ª>¥>>¨>³>°>¬>¥>—>¨>>­>˜>¥>ª>¥>¬>³>«>°>¸>¨>–>­>«>>­>´>§>§>­>¢>¯>ª>±>¡>—>±>«>­>¯>±>>¨>©>¥>Ž>Ÿ>©>¡>§>°>Ÿ>–>>Ÿ>¯>«>­>¨>©>§>µ>­>µ>¨>¥>“>§>¯>>µ>§>°>µ>­>°>±>‹>”>«>…>§>§>±>­>¥>­>µ>¯>§>­>¯>°>¤>¨>ª>­>«>G>¤>>„>¤>«>¡>˜>°>°>¯>­>«>°>­>¥>£>­>©>©>±>ª>°>˜>ª>—>¥>­>S>©>¢>«>£>¡>o>‰>­>¯>¬>—>§>¡>>¸>µ>©>¥>§>¬>±>Ð>¹>§>¸>¯>±>¢>£>•>©>¡>¦>µ>¨>©>°>>­>ª>©>¥>­>k>£>Ÿ>³>¥>£>—>±>£>©>”>Ž>«>ª>§>¨>¤>¥>‡>¬>™>œ>ˆ>§>£>¯>­>¥>¥>§>³>­>•>Œ>Ÿ>­>¡>§>°>‘>«>©>«>¬>«>©>Ÿ>Ÿ>£>‡>±>°>­>­>›>¥>>°>‘>›>ˆ>¥>­>>Ÿ>±>˜>§>¢>¨>´>¥>§>«>«>Œ>­>›>—>¬>Ÿ>§>¥>›>°>ª>«>œ>¥>—>—> > >­>¬>©>§>°>­>­>°>§>ª>±>Ÿ>«>­>>ª>¥>¸>“>­>£>¥>¥>¡>£>¨>ª>§>£>³>£>>›>°>­>>©>³>©>­>«>Ž>³>¥>±>¬>­>§>›>¬>­>«>ž>¬>§>±>«>—>¥>§>­>¨>£>¯>>°>°>©>±>§>¬>©>§>¡>«>A> >>¯>‹>«>¬>³>ª>¬>”>T>§>ª>¢>«>§>>ª>>§>µ>§>©>¡>°>­>˜>—>¹>¥>¯>­>°>>ª>¨>Œ>>­>¥>…>£>±>§>5>µ>¥>˜>©>¢>§>§>«>­>¨>Ÿ>˜>·>¨>§>>—>š>›>»>Ÿ>¯>°>«>­>¯>°>°>“>§>>™>±>³>¢>¬>±>>µ>Ÿ>¤>±>­>°>‹>³>Ÿ>©>­>¯>£>­>£>ž>§>­>—>¸>¡>§>¥>›>£>¤>§>›>³>­>§>>³>‰>£>£>¥>µ>Ÿ>«>Œ>­>¢>­>­>¬>£>”> >ª>¡>§>¯>¤>y>£>«>­>Ÿ>‹>¡>©>´>·>Ÿ>©>£>°>­>¡>±>¨>™>¤>°>­> >¦>™>´>—>œ>©>ˆ>£>¡>§>¤>µ>ª>­>¢>§>«>§>©>©>¸>¬>¥>—>°>¯> >¤>°>‘>¬>>Ÿ>¯>§>§>°>¬>>­>˜>µ>¨>ª>¬>£>±>ª>­>“>¨>™>£>­>¨>©>©>>§>§>·>©>¨>£>§>Ÿ>¯>¬>—>¢>´>¤>°>¯>>©>¥>¬>‘>³>¤>¬>«>>¥>©>¬>¯>§>Ÿ>«>¼>±>‘>§>>°>­>¤>ª>­>¨>¥>>‘>—>—>›>§>˜>¥>¡>¨>¬>¥>£>¢>ª>“>°>š>—>Ÿ>­>§>£>°>µ>ª>µ>¬>Ž>¨>³>­>«>—>>c>°>£>“>¥>±>ª>«>§>³>­>™>£>§>©>¨>¥>©>ª>«>¨>¯>™>±>«>¨>§>>§>¬>™>«>ª>£>»>a>§>»>«>§>°>ª>¯>°>¨>°>›>¢>§>­>£>ª>>¬>°>ª>§>¯> >§>w>¬>­>˜>¨>»>‘>±>§>°>­>>ª>”>µ>§>­>“>³>µ>­>¥>¬>ª>›>>©>™>¹>§>ª>­>­>§>>š>Ž>§>°>¨>£>«>§>­>Ÿ> >¢>>ª>©>«>†>¬>˜>>¯>—>´>­>Ÿ>•>³>­>¤>°>£>­>­>>§>“>«>Š>£>¯>¥>«>­>¬>«>…>­>­>>¯>>­>¥>¬>´>©>™>ª>°>³>§>­>³>Ÿ>¡>©>¯> >Ÿ>«>>§>>±>¥>§>›>±>°>§>§>¥>´>ª>§>©>«>©>«>³>«>¥>­>¦>˜>§>¬>Ÿ>Ÿ>³>¬>£>­>­>§>¨>§>‹> >±>ª>Ÿ>­>ž>­>£>­>­>µ>¡>©>˜>Ž>§>ª>ª>©>­>°>­>­>­>©>§>¢>©>¬>§>¥>±>­>µ>ª>¨>¬>Ÿ>¬>¸>§>€>Š>¢>­>©>´>¡>¥>§>ª>©>°>¥>‡>­>©>>Ÿ>­>¥>ª>Ÿ>§>¥>±>°>§>°>¤>©>°>¡>¥>™>°>ª>¥>¥>©>¢>><>¥>©>¥>—>›>„>­>¥>¬>±>£>—>©>³>»>±>¬>­>µ>¤>¡>Ÿ>«>´>>¥>°>¤>°>‘>³>¥>ª>­>§>µ>“>©>°>©>±>>­>­>Ÿ>ª>ž>ª>­>Ÿ>§>¨>©>§>¡>¢>¥>§>­>µ>§>·>­> >­>›>>°>…>©>·>«>­>°>°>©>£>¤>>—>­>©>¬>£>ª>§>>§>¯>ª>©>©>›>¡>›>­>›>«>¡>›>¡> >µ>‰>§>™>Ÿ>­>©>§>°>¡>—>§>«>>š>Ÿ>™>¯>©>±>>Ÿ>µ>§>µ>©>«>ª>¯>Ÿ>£>>>Ÿ>—>©>±>¯>¥>¥>©>¤>“>¤>Ÿ>>¯>¨>°>¬>´>£>³>¥>©>¥>©>›>µ>¬>¤>¡> >¸>©>­>­>­>µ>¬>©>±>£>µ>¡>­>˜>¯>¤>¢>±>¨>¥>¡>¯>“>£>¯>¯>ª>£>¡>¡>­>ª>©>§>°>­>§>¬>¯>§>•>¨>¥>©>¢>¡>>§>«>>¨>›>ª> >»>§>«>³>>«>¯>­>§>‰>ª>©>§>³>©>Š>ª>•>©>>•>§>›>ª>¡>°>§>©>¬>˜>£>­>—>­>µ>­>ª>«>Ÿ>Œ>¯>­>·>¢>§>§>ª>¨>¯>”>‹>Ÿ>™>Œ>ª>¥>°>°>¤>±>§>°>°>¥>­>³>­>­>¥>¯>¬>³>±>§>­>°>¨>ª> >©>­>ª>—>¯>¥>£>­>>­>£>¼>ª>§>¥>§>ž>Ÿ>­>>±>Œ>š>›>©>±>©>¯>‘>§>«>£>>§>§>±>­>ª>>¼>¡>§>Ÿ>©>¥>¥>¯>­>³>›>¬>¨>©>¡>X>£>­>­>>­>¥>­>­>–>©>¯>l>Ÿ>«>©>¥>»>Ÿ>°>¢>¢>¥>³>¨>°>¨>§>¸>¯>ª>·>§>™>ª>­>¡>©>”>¨>‰>±>­>ª>§>›> >>£>£>§>«>§>«>§>›>©>Š>°>>©>°>«>>³>ª>ª>¥>¬>±>–>§>­>Ÿ>³>¥>“>«>³>©>§>‹>°>¡>±>¥>­>£>©>­>§>ª>­>£>¥>>Ÿ>­>ª>¥>­>§> >£>±>¨>¡>°>­>°>«>¢>¬>£>±>§>«>«>±>œ>°>Ÿ>°>­>œ>£>˜>¥>ª>›>¨>¬>ª>§>£> >©>­>°>±>›>©>>¬>±>”>°>£>£>¡>¤>©>¯>Ÿ>¸>«>·>£>©>‰>¥>‘>«>©>­>­>­>§>¬>£>§>»>«>­>•>§>­>›>©>­>¥>–>¬>«>š>¥>Ÿ=§>§>­>¯>¨>°>€>´>°>«>§>¥>¬>«>£>ª>¤>­>­>—>­>³>ª>©>£>¡>¯>³>¬>˜>¥>§>¡>ž>>>£>™>¥>> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/14.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/14.0 new file mode 100644 index 0000000000000000000000000000000000000000..fa466f23770d82514757b51fcb525949791eba3d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/14.0 @@ -0,0 +1 @@ +±>­>±>¨>»>µ>µ>´>°>·>£>¸>¹>°>·>­>°>·>­>°>©>³>µ>£>ª>ª>³>˜>´>¯>°>°>©>°>°>­>¸>«>§>°>>¹>Ÿ>§>±>¡>­>§>­>±>Ÿ>»>¥>­>°>°>³>¢>¸>«>µ>¯>³>·>±>µ>µ>µ>¬>µ>¯>´>¸>¥>¡>µ>±>»>±>·>¡>ª>°>¸>µ>·>·>µ>·>µ>µ>­>­>¯>¹>°>´>°>»>¹>µ>¸>´>£>µ>µ>³>µ>µ>³>­>­>­>µ>­>µ>´>°>±>«>¦>¯>³>°>±>°>³>·>¸>³>³>½>¬>G>³>¡>«>µ>·>³>>¯>»>¤>¬>¸>—>©>·>¹>§>·>ª>«>·>µ>±>µ>©>°>>¯>©> >°>©>¡>µ>œ>¸>±>À>¹>±>›>?>´>µ>¯>«>•>°>·>°>­>¸>±>©>µ>¹>¡>µ>¼>¬>·>µ>±>±>µ>§>±>µ>±>³>³>¥>·>±>·>­>¯>°>¯>Á>£>±>­>µ>°>»>´>­>°>­>µ>«>Ÿ>³>©>³>§>µ>½>¤>½>¹>µ>µ>¥>°>¹>±>³>±>µ>´>­>ª>±>½>Ä>¤>¹>±>œ>±>¸>¸>°>»>«>·>½>­>°>µ>¡>µ>¸>ª>³>±>µ>¸>¸>­>«>°>·>µ>·>h>³>·>°>°>µ>½>´>¹>ÿ=L>»>µ>ª>¥>©>¼> >µ>­>°>Á>­>·>°>¨>µ>¥>·>­>»>©>¹>­>¦>«>¯>«>«>›>¸>µ>«>¯>µ>°>­>¬>­>¯>¸>³>´>±>¼>¡>¿>·>ª>³>±>±>¬>§>³>·>£>¯>¬>©>§>°>¬>µ>¥>¸>±>¬>­>°>­>¿>±>¬>­>°>>©>µ>³>¡>«>[>¸>µ>¹>©>§>¬>±>³>±>µ> >«>¨>¸>­>¡>µ>¯>°>´>»>«>¨>­>©>­>µ>µ>´>¹>µ>­>«>¸>»>«>ª>§>±>³>¥>µ>­>­>·>“>­>°>¥>³>µ>¸>µ>±>ª>±>ª>Ÿ>¯>°>Ÿ>·>¥>µ>·>°>³>±>£>µ>¡>·>µ>°>·>·>­>µ>°>µ>¥>¸>«>«>µ>¬>µ>±>À>°>µ>µ>½>°>«>±>œ>µ>±>§>¸>µ>­>«>­>³>µ>¸>¸>§>´>«>¹>µ>³>À>¨>¨>©>±>­>±>­>­>¯>·>±>³>©>­>«>¸>´>°>µ>©>ª>¹>´>¸>±>±>±>µ>³>>°>±>­>±>¨>©>­>©>¬>§>°>°>«>°>©>£>¹>§>±>¯>©>«>±>©>°>·>µ>«>´>°> >©>­>©>µ>­>¨>¸>«>¥>µ>«>³>«>­>°>°>´>­>¥>±>³>§>¼>¸>µ>¸>½>³>§>±>¡>·>«>À>¹>¨>­>°>¸>¬>ª>»>«>µ>µ>ª>­>³>§>©>µ>µ>»>©>¬>°>«>±>°>¹>½>¯>£>¸>·>¸>³>¸>>°>³>±>¡>­>´>¤>µ>±>´>¥>µ>À>³>£>«>°>°>ª>«>ª>¹>µ>¹>¼>¿>±>µ>¨>¿>§>§>µ>µ>½>¸>­>°>­>±>´>£>³>¥>³>«>©>§>µ>½>¸>±>§>´>°>¬>±> >½>­>±>´>‡>·>µ>µ>·>Ÿ>©>©>¿>µ>­>³>¡>§>¨>¬>µ>ª>µ>»>­>­>¹>¼>­>±>°>>·>±>«>´>´>¢>µ>¹>·>¯>³>°>«>¸>À>>¨>¸>µ>­>­>µ>´>´>¸>´>¼>´>³>´>¸>§>¬>¨>£>°>©>¸>·>«>¬>À>©>£>¬>¯>±>µ>©>­>±>ã>¹>¡>°>¢>˜>­>¸>±>§>¯>·>¨>³>¯>¼>°>¹>³>¸> >¬>³>³>>µ>µ>a>©>­>±>·>°>³>¬>·>³>·>¯>ª>°>´>µ>¼>¸>­>¨>¼>¹>¬>ª>µ>«>µ>µ>·>±>´>À>±>µ>«>¯>§>³>¥>±>¯>µ>Ÿ>£>»>³>°>§>±>¼>­>µ>°>´>«>±>£>°>°>¡>§>½>¸>³>¸>­>³>£>´>­>°>µ>©>´>­>¼>¼>­>t>µ>±>¯>©>µ>§>‘>¸>µ>«>­>´>·>µ>µ>Ÿ>µ>¿>ª>µ>£>µ>»>µ>›>³>µ>·>µ>¯>½>©>£>¹>°>­>¹>·>Ÿ>»>°>·>³>¬>§>€>°>³>µ>·>³>»>µ>Š>¯>µ>­>ª>«>°>À>­>³>«>´>¼>µ>´>¼>¥>·>§>µ>§>­>¢>¥>«>¯>¸>­>­>±>µ>­>¹>·>«>·>µ>°>´>±>´>§>§>«>´>µ>´>§>°>¸>¯>¥>£>½> >>µ>­>¸>µ>±>¸>»>©>½>§>ª>¯>£>½>¦>¬>µ>µ>·>½>°>³>¼>«>°>¢>Ÿ>½>­>£>½>¯>¬>³>´>·>µ>¦>¼>£>µ>­>³>°>¤>³>›>°>·>“>¸>ª>¯>­>´>µ>±>¨>°>­>¯>³>¹>Y>´>¯>½>±>¸>µ>­>«>­>µ>¤>¼>±>³>·>°>¼>³>¹>U>°>µ>µ>¹>Ã>¬>´>µ>½>µ>°>µ>¥>ª>­>©>°>¸>¡>±>§>³>°>­>­>°>¸>“>¹>¬>¹>±>¡>µ>¼>°>³>¯>«>´>µ>¬>³>´>Ÿ>±>³>¯>«>©>µ>­>­>¯>»>°>µ>«>½>³>¥>¥>¸>§>½>¢>¹>£>­>§>¸>ž>½>£>´>­>±>´>±>¯>¯>¼>Á>­>·>°>³>½>¥>Ÿ>Ÿ>©>ª>µ>«>­>¹>´>¸>¸>³>°>C>¯>©>·>±>§>Ÿ>­>¸>´>·> >µ>´>³>­>³>­>§>»>¯>¡>­>³>³>·>­>c>µ>´>µ>°>¹>¢>¯>±>´>´>µ>©>§>³>§>°>´>£>¯>­>¥>)>«>¼>¥>³>È>¹>½>­>µ>·>±>§>´>°>´>¯>³>›>³>¯>µ>¦>«>³>´>°>¸>­>»>³>©>¬>³>¼>¯>­>§>¸>¯>­>´>«>µ>¸>¦>¯>¡>µ>¤>³>«>°>½>¨>¼>¯>­>´>°>­>©>¼>ª>¯>µ>·>´>µ>¯>µ>±>µ>°>»>­>«>¡>°>µ>½>¬>µ>¯>·>±>¼>&>¡>¹>±>£>±>À>±>±>¼>±>­>¯>µ>¯>¸>>¸>£>¸>·>«>µ>µ>©>±>µ>µ>³>¹>­>«>¥>³>±>¯>¬>¹>³>­>d>¯>¬>´>°>±>¸>µ>³>­>·>­>¥>»>»>°>»>±>µ>©>µ>¯>±>·>¿>À>¨>¸>¥>±>«>§>¢>³>°>³>¥>©>´>Ÿ>½>¯>µ>µ>´>­>>¯>§>©>³>°>´>¸>½>µ>«>­>¨>½>­>°>µ>°>¹>±>¯>³>­>´>¬>¨>±>¹>³>£>³>­>±>°>½>µ>´>µ>¯>¡>´>©>°>­>³>µ>¹>§>³>·>µ>¬>±> >§>°>³>µ>½>ª>·>´>³>µ>±>´>·>¹>§>°>¸>±>±>¸>¥>µ>´>¹>¤>©>¥>­>¬>±>­>«>¡>˜>¡>¤>§>±>¡>½>µ>«>­>­>­>¯>³>ª>¹>§>­>´>µ>­>>³>©>¸>Ÿ>°>±>«>¯>¢>¯>ª>¼>±>¹>Ÿ>·>µ>Ä>¿>µ>µ>µ>>¸>¯>µ>µ>°>°>µ>­>­>¼>°>¯>´>±>¹> >·>»>¯>°>¹>»>¹>´>¯>Á>±>±>¯>¤>µ>±>À>±>§>°>°>·>µ>«>°>À>¹>¯>­>­>§>›>³>{>°>«>¥>±>±>¯>­>°>µ>»>±>´>½>µ>³>«>œ>°>±>©>³>´>—>«>»>µ>³>±>>¡>¸>À>­>>°>±>¯>°>§>£>°>»>¯>¹>µ>§>°>À>»>³>·>°>µ>°>ª>µ>Ã>«>Ÿ>°>´>±>­>«>«>¸>§>³>´>>¯>·>´>™>µ>´>§>Ÿ>¡>§>µ>³>µ>«>½>©>§>·>«>ª>À>µ>Ë>©>¬>¸>¸>µ>»>©>§>»>°>£>µ>«>­>£>·>³>­>©>«>¸>¿>»>³>µ>·>´>¬>«>·>¸>§>´>µ>¬>°>¥> >¸>µ>µ>¹>­>¬>µ>¯>µ>¸>©>°>»>µ>§>¸>©>¯>´>±>›>£>¯>°>°>¸>©>¥>¹>°>µ>¯>¸>ª>l>´>¸>¼>©>¸>¯>£>±>«>£>±>¬>§>µ>´>³>³>±>±>¬>¸>¯>¯>¹>§>µ>µ>£>¢>¸>¥>­>­>­>³>±>¯>µ>¹>¹>¯>±>§>µ>©>µ>¯>­>¨>©>µ>±>«>¯>´>µ>½>¸>±>¬>Á>¯>³>¹>°>·>´>©>³>¸>°>¬>³>Ë>µ>­>¬>´>±>°>›>·>»>K>©>£>¸>£>±>µ>¯>°>«>µ>¯>°>±>°>¡>µ>¥>­>Á>¨>­>±>°>µ> >¤>¥>±>°>¸>•>«>µ>­>·>°>©>­>¬>©>´>§>¦>³>µ>³>µ>°>£>«>ª>¸>­>‡>´>´>¸>­>°>­>­>¹>­>«>¯>µ>°>¬>³>¹>»>©>µ>¨>ª>§>¯>­>¥>µ>›>°>³>°>­>¡>—>³>°>·>«>¡>©>­>³>¼>¸>À>µ>¯>°>­>µ>µ>½>¸>°>»>µ>§>µ>°>½>¬>µ>¸>µ>­>µ>­>µ>½>¥>µ>µ>³>±>°>°>³>¯>°>·>¥>µ>©>©>¬>¯>µ>§>°>­>³>»>ª>ª>»>¯>¸>±>»>µ>¸>¹>­>°>¸>°>±>¯>¹>¬>°>­>±>·>·>»>±>¬>¯>µ>±>­>­>µ>>¯>µ>­>´>·>¸>“>ª>£>­>­>Ä>½>­>³>©>‹>´>±>³>µ>½>©>µ>¹>»>­>À>µ>¥>«>·>±>¹>À>¯>­>¡>§>­>°>¥>´>¯>±>¯>—>¿>µ>ª>·>´>¯>­>´>µ>´>µ>µ>›>³>©>­>­>·>»>¬>µ>¯>­>©>§>°>´>´>ª>¥>±>¦>¹>³>¯>»>«>°>±>µ>­>»>³>›>¬>Ÿ>¯>”>³>¥>¡>µ>«>£>¸>³>³>¹>³>·>±>¹>¼>ª>§>°>°>­>¯>¿>½>±>µ>¹>¼>L>¹>µ>¿>±>‹>°>¯>­>·>«>µ>´>¹>¯>±>¹>¸>¤>³>£>µ>¸>­>>·>¯>©>µ>°>¨>¸>©>§>µ>·>µ>±>»>¸>°>±>´>±>¡>°>¹>±>«>¬>µ>µ>·>¬>´>¯>>«>°>§>³>¯>´>­>­>µ>À>Ÿ>¥>³>§>µ>µ>µ>¹>³>±>§>³>°>¦>«>±>¯>µ>±>³>­>¹>­>¥>£>°>À>¸>°>¹>·>µ>«>°>³>¬>Ð>³>•>­>³>°>·>£>´>±>«>µ>©>¸>±>¯>·>½>¹>µ>À>±>³>¡>µ>£> >¢>­>>©>Ã>Ÿ>¨>›>µ>¸>­>·> >¯>°>©>¯>Ÿ>¬>„>³>¹>·>½>À>³>¸>°>§>°>µ>µ>Ä>«>³>¹>»>¯>£>¥>°>³>°>±>£>µ>·>¹>¸>>¯>°>­>Ã>¢>ª>­>>°>³>ª>¬>¼>¯>¯>›>µ>¿>¸>»>³>³>±>©>·>¥>±>­>¹>½>µ>¯>«>¯>Ÿ>·>°>«>§>«>©>»>«>©>µ>·>°>¹>³>±>™>ž>´>ª>ª>­>A>±>µ>»>µ>½>³>³>±>³>µ>³>µ>µ>À>»>©>¸>©>»>±>±>«>·>³>µ>­>«>­>»>¡>­>±>«>µ>±>µ>©>¬>¬>´>µ>µ>±>³>´>°>³>¯>´>«>µ>±>£>­>°>´>¹>±>¯>´>©>»>³>·>µ>¡>°>¯>µ>­>>¹>´>§>µ>´>¯>µ>±>©>¸>ª>­>¬>±>°>§>»>š>¥>«>³>µ>°>µ>¥>µ>¹>¯>¡>¯>¿>¹>«>°>£>­>±>¡>ª>¨>´>©>¸>µ>­>«>µ>¸>³>¥>±>³>»>±>¨>±>­>´>£>¸>³>…> >¼>¼>°>±>»>´>›>³>·>«>­>µ>¹>Á>³>­>¯>µ>§>Ÿ>­>·>°>¯>Ÿ>´>°>±>°>¯>¯>°>µ>¸>­>³>¹>¯>µ>°>¸>U>°>½>¯>·>«>¦>°>°>¼>·>µ>¸>µ>¡>±>µ>µ>±>±>±>°>¸>°>§>­>¬>¯>§>¯>³>¨>> >¸>»>¹>¥>³>»>±>°>¼>±>ª>µ>Á>°>«>«>«>>’>ª>­>¯>µ>¸>¡>µ>ž>£>µ>¹>­>µ>±>»>±>À>¼>µ>¯>£>³>¥>µ>¥>±>°>°>µ>¹>µ>¸>Ð>¯>£>±>·>£>µ>½>°>±>±>­>·>µ>¸>«>”>½>¸>·>³>À>¡>­>±>±> >«>°>©>¯>¸>­>™>¡>ª>·>³>µ>³>³>³>¸>¼>Á>´>¬>´>°>·>§>»>­>¸>»>±>»>»>˜>£>µ>™>³>³>¹>µ>±>³>¹>¹>µ>³>´>¸>«>µ>±>·>³>C>±>§>‘>­>µ>ª>¥>¹>·>¸>¸>´>¸>¸>±>°>¹>µ>µ>½>µ>±>¨>³>£>°>´>W>¯>«>±>­>©>u>˜>´>¹>µ>£>¯>­> >¼>»>±>ª>±>µ>»>Õ>Ã>±>½>¸>¸>­>­>¨>±>­>³>»>³>µ>·>©>µ>³>°>°>·>€>­>ª>µ>­>­>Ÿ>»>ª>¬>£>>µ>µ>°>´>³>¯>£>°>§>§>˜>³>°>½>¹>°>µ>±>¸>µ>¥>¡>©>·>±>´>»>Ÿ>µ>±>µ>·>µ>µ>­>«>­>œ>¸>¹>¸>µ>ª>¯>¥>¹>«>¢>¡>°>°>¨>«>·>¥>¯>°>¯>»>±>³>·>¸>«>·>¦>£>¹>«>¯>¬>¥>¸>µ>µ>§>°>¥>£>­>«>·>°>³>³>µ>·>´>¸>´>µ>»>­>µ>³>©>³>¯>¼>Ÿ>´>­>­>µ>¯>«>°>±>°>«>¼>­>¦>§>½>·>¨>¯>·>µ>µ>¸> >µ>°>¸>·>µ>±>§>µ>µ>±>©>µ>°>»>³>£>¬>¯>¸>°>¬>µ>¨>¹>¹>´>¹>°>´>³>­>«>µ>E>©>©>µ>¡>´>µ>¼>µ>³>¤>S>³>´>­>µ>­>ž>±>¡>±>½>³>´>°>¸>·>¡>µ>¿>°>¹>³>¸>§>³>µ>£>¢>µ>°>¦>­>¸>°>,>»>¯>§>µ>­>±>±>³>°>´>¬>ž>¿>¯>>§>£>§>§>½>¬>¸>³>´>µ>·>¸>¸>£>­>™>¥>¸>¿>«>´>´>¡>¹>§>¯>¹>µ>·>>¸>§>­>·>·>ª>µ>­>§>±>·>£>¹>©>´>¯>¥>¯>±>³>©>·>µ>¬>«>»>›>­>¯>¯>¼>¨>³>>´>°>±>µ>¹>­>£>©>·>­>¯>·>°>…>ª>±>·>©>š>¬>³>¼>½>©>·>´>¸>µ>ª>¼>µ>§>°>»>µ>©>±>¥>½>¨>©>·>›>­>©>¯>­>½>±>³>«>°>µ>³>±>±>½>´>°>£>¸>³>°>°>¹>¢>¸>«>­>·>±>³>·>µ>¢>´>§>À>°>±>³>±>¼>°>µ>§>°>¤>¯>°>±>µ>°>Ÿ>±>«>½>µ>¯>­>°>¨>µ>³>§>¯>À>­>µ>µ>>·>¯>µ>°>¸>­>³>´> >°>´>´>µ>µ>©>»>Å>¼>ª>¯>•>µ>³>°>µ>³>¯>¯>­>µ>¥>¨>©>µ>ª>­>°>°>¸>°>­>¯>µ>¢>µ>­>¥>¨>¼>³>­>µ>¼>±>·>·>š>°>»>¸>¯>¤>¨>]>·>¯> >¬>¼>¯>¸>­>¸>µ>¥>±>¯>³>±>±>µ>µ>µ>µ>µ>¨>¹>±>°>³>«>·>µ>³>µ>µ>­>À>L>°>Ã>´>°>»>°>·>·>´>µ>©>­>­>µ>­>´>ª>µ>¸>°>°>¸>­>³>‰>³>µ>¡>°>½>£>»>¯>·>´>ª>°>˜>½>°>µ> >½>»>¹>­>±>¯>¥>’>³>¥>Ã>³>°>·>µ>³>¨>£>§>³>¹>³>«>³>¯>µ>¨>­>¯>¨>±>³>³>›>µ>¥>§>·>¥>¹>·>«>¥>¼>µ>¯>¸>¯>¸>±>Ÿ>±>­>±>>±>´>­>´>µ>³>±>š>µ>µ>¬>·> >µ>­>±>½>¸>¨>µ>¸>¿>°>´>¹>«>­>´>±>­>¬>µ>¨>­>­>¼>°>¯>§>¸>¸>µ>¯>°>¿>µ>­>µ>·>±>°>µ>±>¯>·>°>¡>±>µ>«>ª>µ>µ>«>¸>·>¯>¯>­> >¯>¹>µ>©>³>«>µ>°>³>³>»>­>³> >­>°>±>±>³>µ>·>³>±>µ>±>°>­>±>±>³>°>µ>±>»>´>³>µ>ª>´>¿>°>Ÿ>¡>«>¸>°>·>¨>°>°>¯>´>·>­>>µ>·>¡>­>´>­>°>§>±>¯>¼>»>µ>·>­>³>¹>ª>°>­>¹>·>¯>­>³>©>¥>5>°>³>°> >§>>µ>­>µ>¹>¯>£>·>»>À>½>¯>¸>¹>­>«>ª>·>¸>™>³>»>¯>¹>œ>»>¯>´>µ>±>½>±>´>¸>µ>·>¥>µ>·>¨>±>¯>´>µ>©>¯>³>³>¯>©>­>­>³>³>»>°>¸>µ>©>µ>§>ª>¸>‘>µ>»>±>¸>·>¼>°>­>±>¡>§>·>±>´>­>±>¯>>µ>¹>´>¯>¸>¦>°>£>µ>¥>µ>¬>§>¬>«>¹>Ÿ>­>§>ª>µ>³>±>¹>©>§>±>±>Ÿ>©>ª>¥>¸>±>¹>¡>¬>»>°>¸>³>µ>µ>µ>ª>«>—>§>ª>£>±>¼>¹>¯>¯>±>­>¯>¯>©>©>µ>³>¸>¸>·>­>¹>¯>´>°>µ>¥>¹>´>­>±>¬>¼>³>·>´>µ>¼>´>±>¸>°>¸>¬>³>°>·>­>­>¸>±>­>©>¸>¡>«>¹>·>µ>­>«>¬>µ>±>³>³>¸>µ>°>´>¸>°>¥>µ>«>³>«>«>›>°>´>«>±>«>´>«>¿>·>±>À>œ>¸>¹>¸>´>Ÿ>¯>³>´>À>µ>ª>±>£>±>©>£>³>£>±>­>´>¬>µ>±>¤>¯>µ>™>´>»>µ>µ>·>¨> >»>µ>»>©>­>­>°>³>¹>¡> >©>µ>¥>µ>±>·>¸>°>¹>°>µ>·>¯>µ>¹>¹>µ>¯>·>°>¸>½>±>µ>´>µ>±>­>°>·>µ>¡>·>ª>­>±>Ÿ>³>«>Ç>±>³>±>°>§>«>¹>>¸>¡>µ>¥>°>µ>±>¹> >°>³>­>£>±>±>¹>´>´>£>Å>­>´>¨>±>³>­>·>µ>¹>©>µ>±>±>°>m>­>´>µ>œ>´>«>´>µ>¡>¯>À>c>§>´>³>­>Á>¥>¹>©>ª>«>½>°>¸>³>¬>Ã>»>´>À>³>¥>´>µ>¯>´>¤>¯>£>¹>·>µ>³>£>«>§>­>­>­>¸>´>´>°>©>µ>Ÿ>¸>ª>´>·>´>§>¼>±>´>­>±>¹>¡>¯>¸>«>¿>°>¡>¹>»>±>°>˜>»>«>»>­>·>­>³>µ>³>·>·>°>°>§>­>±>´>¯>±>¯>§>­>»>¯>­>»>µ>¼>±>±>³>¯>¸>°>´>±>½>§>»>­>·>µ>§>¯>©>­>³>¨>³>¸>µ>­>­>¬>±>³>¸>¸>¢>­>§>µ>¸>¥>»>¬>­>¯>¯>­>·>ª>½>³>Ä>±>³>Ÿ>±>¡>µ>µ>µ>¸>µ>­>¸>­>±>Ç>³>·>µ>°>µ>¬>­>´>°>¥>¸>¸>¸>­>…=³>±>´>·>±>¹>‹>»>¸>´>¯>±>µ>°>«>´>«>³>¹>£>µ>¸>µ>µ>«>¬>µ>»>·>£>±>­>©>­>ž>³>¬>§>µ>­> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/15.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/15.0 new file mode 100644 index 0000000000000000000000000000000000000000..660a0b95255655d188ef49ee06aa387fde2a087d Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/15.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/16.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/16.0 new file mode 100644 index 0000000000000000000000000000000000000000..3b0ee00e18178640763c50f29fe108a82485e4a4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/16.0 @@ -0,0 +1 @@ +½>½>Å>»> >Ë>Ã>Ç>Ã>Í>µ>È>É>Å>Ì>À>Á>É>Á>Å>¼>Å>È>¹>¹>¹>Ï>‘>Ç>Ÿ>Å>¿>¹>È>À>À>Å>À>·>Å>­>Ë>µ>»>Ä>«>À>¸>À>È>±>È>¯>Ç>Ä>Å>Ä>µ>É>£>É>À>Á>Ë>Ã>Å>È>Ã>À>É>Á>Å>È>·>´>Å>Á>É>À>Ì>³>½>£>Ç>Ç>Í>Í>>È>Ç>Ä>¿>Å>Ã>É>Ã>Ç>Å>É>Ì>Ë>È>©>ˆ>Ë>É>Å>È>Ë>Å>Ä>Ã>½>È>Á>Ë>Ë>¿>Å>½>¸>Å>Ç>Ä>Á>À>Ã>É>Ç>É>Å>Ï>Á>!>Ç>·>Á>È>Å>Ç>«>À>Í>³>Á>É>™>¿>Ì>Å>³>È>½>½>Ë>Å>É>Å>¹>Ã>©>Á>·>±>Ã>¬>­>Ì>¥>È>Å>Í>Ë>Å>¥>0>Ç>Ë>Ä>¼>š>Ã>É>É>Á>È>À>½>Å>Ï>±>Ë>Ï>½>›>Å>Ã>Å>Å>›>¿>É>À>Å>Å>±>É>Ç>Í>¿>Á>Ã>›>Ð>³>Ä>½>Ã>Á>Í>È>À>Å>À>Ç>Ã>­>É>¿>Å>¹>É>Ï>¸>Ë>É>É>Ã>·>Å>É>Ä>É>Ã>È>Ë>½>½>Ç>É>Ð>·>É>Å>¥>Å>Å>Í>Ä>Ì>Ã>È>Ì>½>¿>É>£>É>È>¼>Ç>Ç>É>Í>Í>Á>½>Ç>Å>Ë>È>@>Å>Å>Å>Ç>È>Í>Ä>È>Ý=*>Ç>Å>½>³>»>Ì>£>Ë>½>™>Õ>½>Ë>Ã>¸>È>µ>É>¼>Ì>¹>Ô>•>»>»>Ã>½>Å>>Å>Ë>Á>Å>»>Á>Ä>¿>¿>Á>Ë>É>Ç>Å>Ì>ª>Ô>Ï>¹>Ã>É>È>Á>¹>É>Ë>­>À>À>À>¸>Á>Á>Ë>µ>È>Í>Á>Á>Å>Ã>Ô>Ä>À>À>Ä>”>¼>Ì>È>°>¿>G>Í>Å>É>½>¸>½>Ä>É>Å>Ë>¦>Á>¸>Ç>½>§>Í>Á>È>Ç>Í>»>½>Á>»>¼>Ç>È>À>Ì>È>Ç>»>É>Ì>½>Ÿ>µ>Ã>Ë>³>È>Á>Ä>Í> >Á>Å>¹>È>»>Ë>É>Ç>¹>Ã>¿>§>Å>Å>³>Ì>¹>É>È>Ä>È>Ã>µ>Ã>>Ç>Ä>Á>É>Ë>¹>È>È>É>³>È>½>À>Ã>¿>Ç>Ã>Ð>Å>Å>È>Í>¿>Ã>Ã>¥>Å>È>·>É>É>À>À>Á>Å>Å>Ì>¥>­>É>Á>Ì>È>È>Ï>¸>¸>À>Ç>Å>Å>Á>¿>Å>Ç>Ä>À>½>À>¼>È>Å>Ã>Ç>™>½>Ë>È>É>È>É>Ç>Ã>Å>>Å>Å>½>Ç>©>½>Á>¸>Ä>£>Ç>Å>½>Ã>¹>¤>Í>¹>À>Á>»>¡>Ç>¸>Å>Í>Å>À>Å>Á>§>¿>¿>¿>Ç>Ã>¹>É>»>§>É>—>É>¿>¿>Å>Á>Å>½>¹>Á>É>¹>Ð>Ë>È>È>É>Ã>»>À>±>Ë>»>Ô>É>¸>Á>Ä>Ì>À>½>Ï>¼>Ë>Ç>À>Á>£>·>¸>É>È>Ï>¼>À>Å>¹>Ã>Ç>Ç>Ð>½>¯>È>Ë>Ë>Ä>È>¨>Å>Å>½>±>Á>Å>­>É>Ã>Å>“>Ç>Ô>È>¹>¹>Ã>½>»>½>³>Ä>È>¢>É>Ô>È>È>±>Ð>À>µ>Í>Í>Ø>Ë>Á>¿>À>Å>È>µ>Á>¡>Ä>Á>»>­>È>Ð>É>Å>½>Ã>À>½>Ä>­>Ñ>Ç>É>Ï>k>Ë>Å>É>Ì>¥>¿>•>Í>Å>Á>É>°>µ>½>½>È>»>Ä>Ì>À>Ã>Ð>Ï>Ã>Å>Å>U>È>È>¿>Ì>Ë>¨>Å>É>Ç>Ã>À>Ã>À>Ç>Ë>u>©>Ì>Ç>À>À>Ë>È>Ã>È>Å>Ð>É>Å>É>Ç>˜>Á>¼>·>À>¼>È>Ë>¿>¹>Ï>»>§>À>À>Ã>Å>¼>¿>Ã>ø>Í>±>À>°>Š>Á>Ç>Á>¼>¿>Å>½>Ë>Á>Ð>È>Ë>Ë>È>¬>¹>È>É>©>É>Ë>3>»>Á>Ã>Ç>Å>Å>»>Ë>Å>Í>À>·>Ä>Í>É>Í>È>Å>½>Ð>È>»>»>È>»>Ë>Å>Ë>Ä>È>Ó>Á>É>»>Ã>µ>Ã>´>É>Á>Ì>£>™>Ï>Ã>Å>¹>Ã>Í>À>É>Ã>Á>»>Ç>½>Ã>Á>µ>¹>Ì>É>É>È>Á>Á>³>Ë>½>Å>Å>½>Ä>»>Ï>Ì>Å>E>È>Ç>Á>¸>É>¿>>Ç>È>À>¿>Ç>Ì>È>É>°>È>Ï>À>Ç>­>Ì>É>É>›>È>Å>È>Ç>Ã>Ð>¹>³>Í>Å>Á>Ï>Ë>¬>Í>Å>É>È>¹>>m>¿>Ç>Å>Å>Ã>Ë>È>‡>Ã>È>¿>¼>¿>Å>Ï>Á>Å>À>Ì>Í>Ç>Ã>É>µ>Ì>µ>Å>¹>À>±>µ>Å>À>Ì>Ç>À>Å>È>¿>É>È>½>È>©>Ã>Ç>Ã>È>µ>¯>½>Å>Ä>À>¹>Ã>Ì>Á>µ>µ>Í>©>ª>Ç>Ã>Í>š>Ç>Å>É>¿>Í>½>»>Á>¥>Í>·>’>Ë>É>È>Ó>Á>É>Ë>›>Å>­>­>Í>Á>¸>Í>Á>À>Ç>È>É>Í>µ>Ï>¼>È>À>Å>À>±>È>§>Ç>Ë>˜>Ï>»>Á>È>Ä>Ë>Ç>¹>Ä>¿>¿>Å>Ì>=>Ã>Ç>Í>Å>Ì>É>À>À>½>Ç>¯>Í>Ä>É>É>Å>Õ>È>Í>5>Å>Á>È>È>Ó>»>Ç>É>Ì>Å>Ã>Ç>³>¿>À>>Ã>Ì>­>Ç>¹>Å>Á>Ä>Á>Ã>È>ƒ>Í>À>È>È>¥>Ç>Ì>À>Ì>¿>¹>Ã>É>¿>Ã>Ç>§>Å>Ã>Ç>½>“>È>À>»>Ä>Ë>Ã>Ë>½>Ð>Å>µ>¹>™>¸>Ï>³>Ë>–>Å>»>Ç>­>Ï>£>Á>Ä>½>Å>Ã>Á>Å>Ï>Ï>Ã>Í>É>Å>É>¸>«>©>½>¸>É>½>Å>Ð>Å>Ç>Ë>É>Ä>">>½>Ì>Ä>¹>™>À>È>Å>Ç>¬>Ç>Ð>Å>½>Ã>À>¹>Ð>Ç>±>Ä>È>Ä>Í>À>K>Å>È>È>Á>Ì>­>À>Ã>Å>Å>Ç>¿>½>Å>µ>Ç>Ç>·>À>À>­> >»>Ï>µ>Ä>Ð>Ë>Ñ>»>Ï>Ç>Á>¸>Á>Å>Ã>À>É>©>È>¿>É>£>»>È>Å>Ã>Í>Á>È>Ç>¿>¿>Å>Ñ>Ã>À>½>Ç>Ã>Á>Å>À>È>Ì>³>¿>¨>Å>¹>Ë>¹>À>Ë>»>Í>Á>Á>Ç>Å>Å>½>Ë>À>Ä>Ç>É>Í>Å>Á>É>Ã>Í>Ä>Í>É>¼>­>À>É>Ï>½>Á>»>Ë>¢>Ô>>¯>Ë>Ã>¹>Ä>Í>È>Ç>Ë>È>½>Ã>È>Ä>Ë>¯>É>¹>É>Ç>À>È>È>½>À>Ç>È>È>Í>À>Á>±>Á>Å>Á>Ã>É>Å>Ä>I>Ã>À>Ë>À>Ç>Ç>È>Å>¿>È>À>³>É>Ì>Å>Ð>Ã>È>¸>Å>À>È>É>Ð>Í>½>Å>±>Á>Á>¸>´>Ç>Ä>Á>¸>½>Å>©>Ç>Å>Å>É>Å>Ä>ƒ>À>¿>½>È>Ç>Ç>Ç>Ó>É>½>½>¸>Í>›>Ä>Ë>Ã>Ë>Á>Å>Ç>À>Å>¼>¼>Ã>È>Ã>·>Ã>Ã>Å>È>Ë>É>Å>“>Á>­>Á>¸>Ä>¿>Ä>È>É>¸>Å>Ç>Å>À>½>±>»>Å>Í>È>É>½>Ã>Å>È>É>½>È>Ï>Ï>µ>Á>Ë>Ã>Ç>Ì>¸>Á>È>É>°>¸>¸>Á>¿>Á>Á>½>¯>£>¡>¼>¹>È>£>Í>Ç>½>Á>½>Á>Ç>Ã>»>È>µ>À>Å>Ë>½>>Ä>¹>Ä>¥>½>È>½>À>­>Ã>¯>Í>È>Ñ>>Ì>Å>Ó>Ð>È>È>È>£>Ì>½>É>È>¿>Ã>Ë>Ã>Å>Ð>Å>Ä>Á>È>Ë>«>Ä>È>Á>Ã>Ì>É>Ë>Ã>½>Ô>Ã>Ç>Á>³>Ç>Á>Í>Å>°>Ä>À>Å>Í>¿>Å>Ï>Í>Á>¿>À>¸>§>Ã>g>Å>À>»>Ç>Ã>Ä>Ã>Ã>Ç>Ç>Å>È>Í>È>Å>>§>É>É>½>Å>Å>™>»>Ë>Ç>È>Á>§>±>È>Ë>Ã> >Å>É>Á>Ã>½>¥>Ä>Í>À>Ó>È>½>Ã>Ð>È>Å>É>Á>Ç>Ä>¹>È>Ô>¿>­>½>Ç>Å>Á>Á>½>Ë>¸>Ç>È>§>Á>Ç>È>­>È>Á>¹>°>¨>½>Ë>È>Ç>½>Ô>¹>·>Ç>½>½>­>È>Ã>»>¥>É>Í>Ä>Ë>À>·>Í>Á>—>È>À>¿>±>É>Ç>À>¹>¿>È>Ð>Í>Ç>É>Ë>Ë>•>¿>Ç>É>·>Ì>Ë>À>Á>¸>­>Ä>Í>Ä>Ç>Á>½>È>Å>Ç>É>¹>Å>Ð>Å>¼>Å>½>À>È>Ã>£>µ>½>Ç>Á>Ë>»>¹>È>Ä>Ì>À>À>½>C>Á>Í>Ð>»>Ë>Å>¹>Å>»>«>Ç>À>±>Å>É>Á>Ã>Å>Å>Á>É>Ä>Ä>Ï>¢>È>¿>±>·>È>³>Á>À>À>Ç>Å>Á>É>Ç>Ç>È>¥>´>Í>¹>É>½>À>½>»>Ç>É>Á>À>Ã>Ï>Ø>Ç>Ã>À>Ð>À>É>Ì>Ã>È>È>»>¨>Ç>Å>¼>Ä>Ü>Ä>¿>Ã>Å>Ë>Ã>­>Å>É>->½>°>Ë>·>È>Ç>¿>É>À>Å>Ã>Ä>Å>Á>³>Å>¡>Ã>Õ>Ÿ>¿>Á>Å>Ì>¡>µ>»>Á>Ä>Ì>>»>É>À>Ì>Å>¸>¿>À>¹>˜>¹>³>Å>Ç>Å>È>È>³>½>»>Ì>¿>l>Ä>Ë>È>¿>Ç>Å>Ã>È>Á>Ä>Á>É>Å>½> >Í>É>¹>Í>»>»>¼>À>Å>°>É>­>Ã>Å> >Ã>­>>Ã>Å>Ì>½>§>»>Ç>Ç>Ï>É>Ð>À>Ã>Å>½>É>Ë>Í>Ç>Á>Í>È>¸>Ä>Å>È>½>Å>Ç>Ÿ>½>Å>À>É>Í>¼>Ã>Ë>Å>Ä>Ç>Å>Ç>Ä>Ã>Ì>¹>Ç>½>À>¿>À>£>·>Ã>Á>Å>Ì>»>»>È>Ã>Ë>¿>Í>È>Ë>Ï>¼>À>Ë>—>Á>À>Ï>¼>Ã>Å>Å>Å>É>Ï>Ÿ>Á>½>Å>À>¿>À>È>©>Ã>Ç>À>Ã>É>Ë>>½>¸>Ã>Á>§>Ð>Ã>Ç>À>>Å>È>Å>Ã>Ï>½>Ç>Ë>Ë>½>Ï>Ç>»>½>Í>Å>Ç>×>Å>Á>¢>½>½>Å>¹>Å>Å>Ã>½>‚>Ý>Ë>½>×>É>Å>Á>È>Ç>Ã>È>Å>•>Ä>½>Á>Ä>—>Ë>À>Ì>À>½>¿>»>¸>Ç>Ç>›>»>Ã>¹>Ë>Ã>Ä>Ç>Ã>Á>Å>È>Á>Ï>Á>±>À>°>Ã>>É>·>·>È>À>±>È>É>Ã>Ð>Ç>Ç>Ã>Í>Ð>½>µ>À>È>½>È>Í>Ô>¿>É>Í>Ð>G>È>Å>Ð>Á>‡>Ä>Ã>¹>Í>À>Ã>Í>Ì>Ä>Á>É>É>¸>Å>¸>Å>Í>½>“>È>Å>¹>Ë>Ä>·>É>Á>¹>Ì>Å>Ë>Å>Ì>È>¿>Å>Ã>Ë>±>À>Í>Ã>¸>¸>É>Ç>Ï>¿>Å>À>«>À>Å>¹>Ë>Á>É>Ã>À>Ç>Ó>—>Ÿ>Ÿ>»>È>Ã>Ë>Ï>È>Å>°>É>Á>³>½>È>¿>Ì>Ä>Å>Å>Ë>À>»>¯>Ç>Ô>Å>Á>Ì>È>È>¸>Ä>Ã>À>Ë>É>¢>À>Ã>Å>Ä>³>É>Ç>Á>È>À>Í>Ã>É>Ç>Ì>É>È>Ð>Å>Ç>°>È>µ>³>µ>Ã>ž>»>Ô>¯>µ>›>Å>É>¼>È>±>½>Å>‘>Å>°>½>m>Ã>Ç>Ç>Ï>Í>Å>Ç>Å>·>Ë>È>Ç>Ñ>¹>È>È>Ï>£>µ>°>Á>Á>Ä>Å>µ>É>É>Ï>È>°>¿>Ã>¼>Ð>’>Á>Å>ð=Á>Ä>½>À>É>Ã>Ã>°>É>Ð>É>É>Á>Ä>Ç>À>È>³>È>Á>É>É>È>Å>½>À>Š>Á>Ã>¹> >½>Ã>Ï>¿>½>Ã>Ç>Å>Ë>Å>Á>‰>´>É>½>Á>»>,>À>É>Ì>Å>Ë>É>Ã>Å>Å>Ã>Ç>Å>É>Ð>Ë>¼>É>Á>Ï>Å>Ç>µ>Å>Ã>Ç>¿>Á>Ã>Ì>­>½>Ä>½>Í>Ä>È>Ÿ>À>Á>È>É>Á>Å>Ç>Å>Ä>Ç>Å>Å>À>Ë>Å>¬>¿>É>Å>È>Ã>Ã>É>½>É>È>Ç>Å> >Ä>Á>Ç>À>©>É>Å>½>È>Å>À>Å>Ç>½>Ë>½>Ä>Á>Ã>Å>³>Ì>¦>·>½>Ç>È>Ã>Ç>µ>É>Í>Å>±>À>Ð>Í>š>À>µ>Á>Ç>›>¿>½>Å>¸>Ç>É>Á>À>Å>É>Ç>·>É>Ä>É>Å>À>À>»>Ã>³>É>Å>g>¬>Í>Í>Å>Å>Ë>Å>¨>Ã>É>½>Ã>Ä>Ï>Ë>Ã>Ã>Á>Ë>·>•>Ã>Ì>Ç>Á>­>Á>Ä>Å>Å>Á>Å>À>È>Ï>¿>È>Ó>¿>È>¿>Å>G>Á>Ì>Á>Ë>Á>·>Ã>À>Ì>Ä>Ä>Í>Å>¯>Á>Í>Ë>Á>Å>È>Å>É>È>¹>À>À>Ç>¸>Å>È>¿>‰>§>È>Ð>Ì>¹>È>Ì>Á>Å>Ï>Ã>¿>Ç>Ì>Ã>À>¹>Á>—>•>§>Å>Å>Å>Í>­>Ã>£>¸>Å>É>Ã>É>Ã>¡>Á>Ï>Ì>É>Á>µ>Ã>¸>Í>³>Ç>Ã>À>Ç>É>Ë>Ë>ç>¿>°>Ã>Ä>Ÿ>É>Ë>Ã>Å>Ç>À>Ä>É>Ë>»>>Ì>Å>Í>Ç>×>¨>Ã>Á>Ã>­>¸>Ç>¿>Å>Ë>¼>ƒ>§>½>Ì>Å>Å>È>É>À>Í>Í>Ô>Ä>½>›>Á>É>µ>Ë>Á>Ð>Ì>Å>Ð>Ë>ª>µ>Ì>˜>Å>È>Ë>Ì>Ã>Ç>É>É>Ã>È>Ë>Ç>¼>Ç>Ç>Ç>É>$>Ç>µ>—>Ã>È>½>µ>Ë>È>Ì>É>Ç>Ë>Ì>½>Á>Ë>Ã>Ç>Ð>Å>Ç>¹>È>¹>À>É>=>Ç>½>É>Á>¿>€>¡>Ç>Ë>È>¯>Á>½>§>Ì>Ï>Ã>Ã>È>Ç>Í>ù>Ô>Á>Ì>É>É>»>½>¹>½>Å>Å>Ë>Ç>Å>É>£>É>È>Å>Å>È>d>À>À>Ì>Å>¼>·>È>À>À>±>§>Ç>È>Á>Ä>Å>Ã>¡>À>»>½>›>Á>Ã>È>Ë>À>Ç>Å>É>È>³>«>À>Ì>Á>Å>Ç>±>É>Ä>È>Í>Å>Ä>À>»>Á>>Ë>È>É>Å>¿>À>¹>Í>¥>µ>>Ã>Å>¼>½>È>µ>Ã>Ä>Å>Í>Ä>Á>Ë>É>¥>Ç>¸>³>È>Ã>À>Á>¸>Í>Å>È>±>Á>¸>³>Á>¸>É>Ä>Å>Ã>Ä>É>Á>È>À>È>Ì>Á>È>Ë>¼>Ç>¿>Í>±>È>À>¼>Ã>Ã>½>Ë>È>À>Á>È>Ã>›>¸>Ì>Ì>¹>Ë>Ç>Ç>É>Ï>«>Ì>Ã>Ë>Ç>Ì>Ç>¹>Ä>È>Ä>¼>È>À>Ì>Á>¹>Á>Á>È>Ã>Á>Ç>»>Í>Í>Ç>Ë>Ã>Å>È>Ã>À>Å>'>½>¸>È>©>É>Ì>É>Å>Ã>³>)>È>Å>À>È>À>›>Ã>¥>Á>Ï>Å>Å>Á>Ë>Ç>³>Ÿ>Ï>Á>Í>É>Ë>½>Å>Í>¥>©>È>Á>’>À>È>Á>>¤>Á>µ>È>Á>Ç>É>Å>Ç>Å>½>­>Í>Å>‹>µ>µ>­>½>Ï>¿>È>È>Ç>È>Í>Ì>Å>µ>½>‡>·>Í>Õ>½>Å>Ç>¤>Ë>¹>Å>Ì>Å>Ë>«>Ç>µ>¿>Ä>È>½>È>À>¼>Ä>È>·>È>¸>Ã>Ã>·>¿>Ä>Ã>¹>Ë>Ë>Á>¸>Ï>§>¿>Ã>Ã>É>»>À>§>Å>Ã>Å>Å>Ì>½>°>»>È>¿>Á>Í>À>S>¿>Å>Í>½>¨>Ã>Ã>Ì>Ð>½>É>Å>Ë>È>¸>Ï>È>¸>Á>Ë>Ì>»>Å>·>Ð>«>»>Ç>«>¹>À>Ä>½>Ð>Ã>Å>Å>Á>É>Ã>Å>É>Í>Å>Å>´>Å>Ç>½>Á>Ì>­>É>»>À>È>Å>Á>Ã>Ï>«>Å>·>Ï>Ã>Ã>Ç>Ã>È>À>É> >Ä>·>¿>Ç>À>Ç>À>´>Å>Á>Ì>É>¿>Á>À>¿>Ì>Å>¸>Å>Ï>À>Ë>É>­>É>Ã>È>•>É>À>Ã>Å>­>Ä>Ã>Ç>Ë>È>»>Ÿ>Õ>Ë>¦>Á>Ÿ>Í>Ë>À>Ç>Å>Ã>¿>¼>˜>·>±>·>Å>µ>Á>Ã>½>Å>À>À>Á>É>­>É>¿>°>À>È>Å>Á>É>Ì>À>È>È>¦>Á>Ë>Í>Ä>³>©>G>Å>Ã>¤>Ã>Ë>Ã>È>Å>É>Å>½>Å>Ç>Å>Á>Ã>È>Å>Ã>É>É>µ>É>Ã>Å>Ã>¹>É>È>Ÿ>Ç>Ã>Á>×>0>Å>Ó>Å>Å>É>Á>É>Ç>Ä>Ã>¹>½>½>Ë>¼>È>½>È>Í>Á>È>Ë>À>È>Ÿ>È>Å>¹>Á>Ï>³>Ì>¿>È>Å>¿>È>§>Ì>½>Ì>­>Ð>Ï>Ï>½>É>À>·>¤>½>±>Ð>Ä>É>É>È>À>¹>³>¡>Á>Ì>Ç>Ã>Å>Á>É>¿>¼>Á>½>Á>Å>Å>§>Ç>·>½>Ç>³>È>È>»>³>Ç>É>Ã>É>Ã>È>È>­>È>š>Ç>­>¿>Ç>Ä>È>È>Á>Ì>˜>È>Ã>À>Ç>­>È>À>È>Ë>Ó>¸>Ï>Ä>Ì>Ã>É>Ì>¼>Ã>Ç>Ä>Á>½>Ë>¹>Ã>¿>Ë>À>À>»>Í>É>Å>Å>Å>Ó>Ç>Ã>Ë>È>Å>È>Í>Ç>À>É>Á>µ>Å>È>¿>·>Ì>Å>½>É>Ì>À>Å>À>£>À>Ð>É>¿>Å>»>É>Ç>Ë>Å>Í>Ã>É>µ>š>À>Á>À>È>Ç>È>É>Á>Å>Å>Å>À>Á>È>É>Á>Å>Ä>Ë>È>È>É>»>É>Í>Ã>•>§>À>É>Á>È>½>À>½>Å>¿>Í>Á>ƒ>Ç>Ç>¨>¿>É>Å>À>¿>Ä>Ä>Ó>Ï>Å>Ç>Ã>À>Ï>½>À>›>Ë>É>Å>À>Å>À>³>>Ã>Ç>Å>³>¸>š>É>Ã>È>Ð>Å>µ>È>Ë>Ï>Ï>Ã>Ä>Í>È>¿>»>É>Ï>£>Á>È>¿>É>©>Í>Ã>È>Å>Ç>Ï>¡>Ë>È>È>Ë>µ>Å>È>»>Ä>½>È>È>½>Ã>Ã>Ã>Á>Ã>¿>Å>Ã>Å>Ì>È>Ë>Å>»>Ì>¸>¼>Ì>p>Ã>Ï>Ä>Ì>Í>Ð>À>À>Ç>—> >É>Ç>È>Á>Ç>Á>¡>É>Í>È>Å>œ>¸>Ã>¼>Í>½>Å>¹>·>Ã>»>Í>¥>À>µ>À>Ç>Í>Ä>È>¹>³>Ã>Ë>Ž>¿>½>·>È>Å>Ð>ª>Ã>É>À>Ï>Ë>Å>Å>Í>Á>Å>…>¹>¿>¹>Ç>Í>É>Ã>Ã>Ç>½>>Á>»>»>Ë>Å>É>Ç>Í>Á>È>Á>Ç>Ã>Å>·>Í>Å>À>Á>¿>Ô>Ä>È>Ë>É>Ñ>Ë>Å>Ï>À>É>½>Ç>¥>É>Á>¼>Ë>Á>Ã>¸>Í>³>Á>É>È>Í>Á>À>¿>È>Ä>Å>Ç>Í>È>È>Å>È>Á>µ>È>À>Å>À>¿>¦>¹>Å>¿>Å>»>É>¿>Ð>Å>É>×>¨>É>Í>Å>Ç>Ÿ>Å>È>Å>Ï>Å>¢>Å>±>Ç>¹>¸>Å>µ>Å>À>È>Á>Å>Ã>¸>À>È>¯>Å>Å>Ç>Å>Ë>¿>©>Ë>Ë>Ë>½>¿>À>Å>Ã>Í>µ>>»>£>­>Ë>¿>Ç>Í>Á>Ï>Ã>É>Ë>Ç>Ë>Í>Ñ>Ã>Å>Ç>Ã>É>Í>Å>É>Í>Ì>Ç>Á>Á>Ç>Ç>¸>Ï>Å>Á>Å>¬>É>¼>×>Å>Ã>¿>Ä>·>»>Í>«>È>¡>£>·>È>É>Å>É>µ>Ã>Ç>Ã>±>Á>Ä>Ë>È>Å>­>Ô>À>È>½>»>Å>¨>Ë>È>Ð>¸>Ã>Ç>Å>Ã>P>Å>É>È>¯>Ë>Á>Ç>Å>±>Ã>Í>D>¸>Ä>Å>Ä>Ð>¸>É>»>¸>Á>Ï>Ç>Ë>Å>Á>Ô>É>Å>Ï>Ã>·>Å>Å>Ä>Å>°>À>Š>Ì>Ç>Å>Á>¹>À>±>¿>Á>Á>Ë>Ç>Ã>Ã>»>Ä>¤>É>»>Ç>Ë>É>§>Í>Ã>Å>Ã>Å>É>°>Å>Ì>½>É>Å>­>É>Í>À>À>«>Í>»>Ï>À>Ã>¼>Ç>È>Ã>É>Å>¿>Ç>À>À>Å>É>À>Ç>Ä>½>½>È>È>Å>Ì>È>Ð>È>Á>È>½>Å>Ã>Ç>È>Ï>½>Í>¿>É>Ç>¹>Ã>¹>Á>Ã>·>Ä>É>¿>À>Ã>¿>Ã>Å>Ë>Å>·>À>¹>Ç>Ï>°>Ë>¼>Á>À>Ã>Ç>É>¿>Í>Å>Ó>Å>À>©>Å>±>Ã>Å>Ç>Ë>Ë>¿>Ç>Á>Ë>Ô>Ç>Ç>š>Å>Ç>¬>À>É>À>´>Ë>Ç>>Ã>—=Å>Ä>Å>Ç>Ã>Ë>>Í>Ë>À>Å>Ç>É>À>¿>È>Å>Å>Ì>´>Å>Ì>Í>Ç>»>Á>Ë>É>È>³>Á>Á>À>Á>Ÿ>£>»>»>Ç>Á> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/17.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/17.0 new file mode 100644 index 0000000000000000000000000000000000000000..a674edcd346dc970b93b0b7658d0ed8b4093ef18 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/17.0 @@ -0,0 +1 @@ +Å>Å>Ë>Ã>£>Í>Í>Ì>È>Ñ>·>Ó>Ó>È>Ì>Ã>É>Ð>Ä>É>Å>É>Í>»>»>Ã>Ñ>—>Í>§>Ð>Å>À>Ð>Ã>Á>Ï>Ä>¿>É>µ>Ð>¸>½>Ì>°>Å>Ã>Ç>Í>¸>Ñ>µ>Ë>È>È>Ï>¸>Ï>©>Ï>È>Ç>Ñ>Ë>Í>Ë>È>Å>Ï>Ç>Ë>Ð>»>·>Í>Ç>Í>Ë>Ð>·>Ä>¦>Ë>Ë>Ó>Ñ>£>Í>Ì>É>È>Í>Ç>Ð>Ë>Ï>Ë>Ï>Ó>Í>Ð>«>>Ð>Ï>Ï>Ð>Ï>Ì>É>Ì>Ç>É>È>Ð>Ð>É>Ë>È>¿>Ë>Ï>Í>È>È>Í>Í>Ï>Ï>Í>Ñ>Å>)>Ë>¸>Å>Ï>Ë>Í>µ>È>Ñ>¹>Ã>Í>›>Å>Ð>Ë>»>Ð>Ã>Á>Ì>Ë>Ð>Ð>À>Ë>¬>É>¿>»>È>±>µ>Ï>«>Ï>Ë>Ð>Ñ>É>­>4>Ð>Õ>Ë>Á>˜>È>Ï>Ï>È>Ï>È>Ã>É>Ô>´>Ð>Õ>Å>¡>É>Í>Ï>Ï>¡>Å>Í>Ç>Í>Ç>½>Ñ>Ë>Ñ>Á>Ë>É>£>Ô>»>Ë>Ã>Ç>Ì>Ô>Ï>Å>É>È>Ï>È>µ>Í>É>É>¿>Ï>Ô>Á>Ð>Ï>Ï>Í>¹>Ç>Ð>É>Ï>Ì>Ð>Ï>Ç>Å>Ç>Ï>Ø>½>Ð>É>«>È>Ì>Ó>Ï>Õ>Å>É>Ï>Å>Ç>Í>§>Ï>Í>Ã>Í>Ï>Ï>Ð>Ï>Ã>Å>Í>Ï>Í>Í>5>Ñ>Ì>É>Í>Ë>Õ>È>Ð>¬=*>È>Ë>¿>¼>Á>Ñ>­>Ï>Ã>Ÿ>×>Ç>Í>Å>À>Ï>¼>Ñ>Ã>Ô>½>×>›>Á>Á>Ç>Á>È>¡>Ì>Ñ>É>É>Ä>Ë>Ç>Ç>Å>Å>Ï>Ì>Ë>Ë>Ð>³>Ô>Ð>Á>É>Ð>Ï>Å>½>Ï>Ï>´>È>Å>Á>»>È>È>Ô>¿>É>Ø>Ë>Ë>Ë>È>Û>É>Å>Å>É>—>Å>É>Í>»>Ã>A>Ô>É>Ï>Ã>»>Á>É>Í>É>Ë>«>Ç>À>Ë>Ä>¬>Ð>Å>Ë>Ï>Ð>Ã>Å>È>Ã>Á>Ë>Ï>Ë>Ð>Ï>Ì>Á>Ï>Õ>À>¢>½>Ì>Ì>´>Ï>È>Ç>Ð>§>Ë>Ë>Ä>Ï>Á>Ë>Ë>Í>»>Í>É>°>Ë>È>½>Ô>¿>Ï>Ï>Í>Ï>Ë>¸>Í>–>Í>Í>Ç>Í>Í>À>Í>Ï>Ï>¸>Ð>Å>Å>È>Ä>Ï>É>×>È>É>Ï>×>È>Å>Ï>¨>Í>Ì>À>Ï>Ë>Ã>Ç>Å>Ë>È>Ï>¬>³>Ï>È>Ð>Í>Í>Õ>½>»>È>Ë>Í>Ì>Ç>É>Ì>Ï>Ë>Ç>Å>É>Ä>Í>Ì>Ï>Ï> >Ç>Í>Ë>Ô>É>Í>Ë>Ë>Ë>«>É>Í>À>Ð>°>Å>Ë>Á>Ç>¨>Ð>Ì>Ã>Ë>¿>­>×>Á>È>Ç>À>ª>Ï>Ã>É>Ð>Ì>É>Ë>È>¯>Ã>Á>Ã>É>È>¿>Ð>À>°>Ï>š>Ó>Å>Ä>È>È>Í>Å>½>È>Í>À>×>Ó>Í>Í>Ð>Ë>Å>Ç>±>Ë>¼>Ü>Õ>½>È>È>Ï>Å>À>Ñ>½>Ì>Ë>Ã>È>§>½>À>Ñ>Í>Ñ>Ç>È>Ë>Á>Ç>É>Ë>Ð>Á>µ>Ð>Ñ>Ô>Ë>Ï>­>Ë>Ì>Á>¹>È>Í>´>Í>Í>Í>“>Ì>×>Ï>¼>Á>È>Å>Á>Ã>¿>Ç>Í>«>Ó>Ñ>É>Í>¸>Ð>Å>¿>Ñ>Ð>Õ>Ó>Ç>È>È>È>Ñ>»>Å>¥>É>É>¿>·>Í>Õ>Ë>È>Å>É>É>Ã>Ì>´>Õ>Ì>Ë>Ñ>e>Ñ>Í>Ð>Õ>©>Ç>—>Ô>Ñ>Ë>Ï>µ>½>Á>À>É>¿>É>Í>Å>Ç>Ñ>Ñ>Ã>É>Í>U>Ð>Í>Ä>Ï>Ï>¯>Å>Ð>Ë>Å>Ç>Ë>Å>Ï>Ð>>¯>Õ>Ì>Ç>Ç>Õ>Í>Ï>Í>Ï>Ô>Í>É>Í>Í>Ÿ>Ç>Ä>»>Ç>À>Ó>Ð>Ç>À>Ï>½>°>É>É>É>Ð>È>Å>Í>õ>Ñ>»>É>¹>>Å>Í>Ë>Å>Ã>É>À>Ñ>Ë>Í>É>Ë>Ï>Ë>°>À>Í>Ë>¯>Ë>Ð>$>À>Å>Ç>Í>É>Ï>Ã>Ñ>Ë>Ð>È>À>Í>Ð>Ï>Ó>Í>Ï>Å>Ù>Ï>Å>»>Ï>Ã>Ï>Ì>Í>É>Ï>Ù>É>Ï>À>Í>À>È>·>Ï>Ë>Ï>­>¡>Ð>Ë>É>Ã>È>Õ>Å>Í>È>Ï>Å>Í>Ç>Å>É>½>À>Ð>Ï>Ï>Í>Ç>Ç>¼>Ï>Á>É>Ë>Ã>É>Ã>Õ>Ð>Ï>O>Ë>Ï>Ë>Á>Ð>Ã>ƒ>Ë>Ë>Ã>Ç>Ë>Ï>Ë>Í>¹>Ï>Ø>Å>Ë>°>Ë>Ñ>Í>¢>Í>É>Ì>Ë>Ë>Õ>Á>µ>Ð>Í>È>Ó>Ð>·>Ñ>Ì>Ô>Í>À>™>e>Å>Ë>Í>Í>Ë>Ñ>Ï>‹>Ë>Ï>È>Ã>Á>É>Ó>Å>Í>Å>Ð>Ó>É>Í>Ñ>¼>Ñ>¹>Å>Ã>È>¹>¿>Å>É>Ð>Ë>Á>É>Ð>È>Í>Ï>Å>Ñ>­>Å>Ï>É>Ï>¹>¸>Ã>Ç>Ë>½>À>É>Ñ>Å>¼>¿>Õ>³>³>Ë>Ç>Ï>Ÿ>Í>É>Í>¿>Ô>Ä>Ä>Å>©>Ð>¼>™>Ô>Í>Ð>Õ>Ë>Í>Ð>¡>Å>¸>±>Ó>É>Á>Ñ>Ç>Ë>Ð>Í>Ï>Í>¼>Ó>Ã>Ï>Å>Ï>È>»>Í>°>Í>Ë>Ÿ>Ð>½>É>Ë>Ë>Í>Í>À>Ë>Á>Ç>Ï>Ñ>9>É>Ë>Ñ>Ç>Ë>Í>Å>Ç>À>Ë>µ>Õ>Ë>Ï>Ï>Ï>×>Ë>Ð>;>Í>Ç>Ì>Ó>Õ>½>Í>Ð>×>Ì>È>Ï>¹>È>È>¢>Ì>Õ>´>Ï>¿>Ë>Í>È>È>È>Ó>x>Ð>É>Ë>Ë>¥>Ï>Ñ>Ç>Í>Ç>Ä>Í>Ñ>Ã>Ï>Ë>°>Ë>Å>Ì>À>•>Ï>È>Ã>Ï>Ï>É>Ï>Á>Ø>Í>¹>Å>£>½>Ñ>¸>Í>˜>È>¿>Í>°>Ô>«>É>É>Å>Ì>Ç>È>Ë>Ù>Ñ>É>Ñ>Ë>Í>Ð>½>µ>³>Å>Á>Í>Ã>Å>×>É>Ë>Ð>Í>È>!>¦>Á>Ð>Ï>À>™>È>Í>Ì>Ì>±>Ë>Ð>Í>È>È>Ç>Ã>Ñ>Í>¹>Ë>Í>Ì>Ï>Á>[>Ñ>Ï>Ô>Ç>Í>´>È>Ì>Ì>Ë>Ï>Á>Á>È>¼>É>Í>½>Å>Ç>¸>>Ã>Ó>»>Ë>Ð>Õ>Í>À>Ð>Ï>Ç>À>É>É>È>Ç>É>¯>Ë>È>É>©>À>É>Ë>É>Ï>É>Õ>Í>Ç>À>È>Õ>Ã>Ç>Ä>Ë>Ë>Ä>Õ>Ã>Ï>Í>»>È>«>Ë>Á>Ð>½>Í>Ï>Ã>Ñ>È>Ã>Í>Ë>Å>Á>Ñ>Å>Ì>Ì>Ï>Ô>É>È>Ï>Ë>Ð>É>Ð>Ñ>Ã>±>É>Ï>Ó>Å>É>Ã>Ï>¥>×>>µ>Ó>Ç>Ã>Ä>×>Í>Ë>Ð>È>Á>È>Ï>È>Í>µ>Ó>½>Í>Í>Á>Ï>Ó>Á>Ç>Ñ>Ì>Ë>×>È>Ç>µ>Ë>Ë>Å>Ç>Ï>É>È>K>Å>É>Ð>É>Ë>Ï>Ï>Ì>Ã>È>Å>¹>Ó>Ï>É>×>Ë>Í>¼>Ë>È>Ì>É>Ñ>Ñ>À>Í>½>É>Ç>½>¸>Ë>É>Ã>À>Á>Í>­>Í>Ç>Í>Ë>Í>Å>€>È>Ç>Å>Í>Ð>Ë>Ð>Ø>Ï>Á>Á>¿>Ô>Ÿ>È>Ð>Ë>Ó>É>Ë>É>Ç>É>Ã>Å>È>Ï>Ì>Á>Í>Ë>Ë>Ë>Ð>Ð>Í>€>É>³>Ë>Á>È>È>È>Ï>Ï>Á>Í>Ï>Ë>È>Ç>´>Á>Ë>Ð>Í>Ð>Á>Í>Ï>Í>Ô>À>Ë>Ñ>Ñ>½>Í>Ñ>È>Ì>Ì>½>É>Ë>Ð>µ>½>Á>Å>Å>Ç>Ä>¿>±>§>¨>Å>À>Ï>§>Ð>Ï>Å>Å>Å>Ã>Ë>Ï>À>Í>¹>Å>È>Í>À>£>È>½>Ë>¬>Ä>Í>Ç>È>·>Ç>³>Õ>Ë>Õ>£>Ð>Ì>Õ>Ñ>Ð>Ï>Í>«>Ð>Ç>Í>Í>Å>É>Ð>È>Ç>Õ>Ç>È>Ç>Í>Ñ>±>Í>Í>È>É>Í>Ð>Ð>Í>Å>Ü>Ç>É>Ç>µ>Ð>É>Ñ>É>¹>Ë>È>Ë>Ó>Å>Í>Õ>Õ>È>Å>Ç>À>¬>É>k>Ë>É>À>Ï>É>Ë>Ë>É>Ë>Í>É>Ó>Ð>Ð>É>£>±>Ï>Ï>Å>É>É> >Ã>Ð>Ð>Í>Å>°>½>Í>Õ>Å>¥>É>Ï>Å>Ç>Ã>«>Ë>Ñ>Å>×>Ï>Ã>É>×>È>È>Ï>È>Ì>Å>Á>Í>×>Å>¸>Ç>Í>Ë>Å>È>À>Ï>½>Ë>Í>­>È>Ï>Ì>³>Ë>É>À>µ>¬>Å>Ð>Ë>Ó>½>Ô>½>½>Í>Å>À>´>Í>Á>Å>©>Ñ>Ó>Ë>Ô>Ã>½>×>É>˜>Í>Ë>Ã>»>É>Í>É>½>Ç>Ó>×>Ð>É>Ï>Ð>Í>>È>Ë>Ï>¼>Ð>Ì>Ã>Ë>Ã>·>Í>Ô>Ë>Ï>È>Ä>Ï>Ç>Í>Ð>Á>Ë>Ñ>É>½>Ï>Á>Å>×>Ë>§>»>Å>Í>È>Ð>¿>¼>Ð>Ð>Ï>È>É>Á>T>É>Ï>Ð>À>Ð>È>»>Ë>È>¯>Í>Á>¸>É>Ï>È>É>Ë>Ï>Ä>Ï>È>É>Ñ>¨>Ï>Å>·>½>Ï>¹>Å>Å>Å>É>É>É>Ï>Ì>Ð>Ë>¯>¹>Ï>»>Ï>Ä>Ã>À>Å>Í>Í>È>È>Ë>Í>Ý>Í>Í>Ç>Ô>Ç>Ï>Ñ>Ë>Ï>Ï>Å>Ÿ>Ñ>Í>Ã>É>à>Ç>Ç>É>É>Ë>Ì>µ>Ì>Ð>4>Á>¸>Ð>¼>Í>Í>Ä>Ï>È>Ë>È>É>Ë>É>»>Ë>¥>Ë>×>¡>É>Ë>Å>Ð>«>À>½>Å>Å>Ð>“>Ã>Ó>Å>Ñ>É>½>Ã>Ã>¿>¡>¿>»>Í>Ë>È>Ï>Ï>¼>Å>Ã>Ñ>Ã>i>É>Ð>Í>Å>Í>È>É>Ð>Å>Ä>Ç>Ñ>Ç>Ç>¨>Ñ>Ô>À>Ï>¿>¿>Å>Ä>Í>µ>Í>¸>È>Ï>§>È>­>£>É>Í>Ô>Ç>¯>Á>Ì>Ð>Ó>Ô>Ó>Ç>É>É>Å>Ï>Í>Ó>Ï>Ë>Ï>Í>½>Ë>È>Ï>Ã>Ì>Ë>§>Å>Í>Å>Í>Ô>Á>Ì>Ñ>Ì>É>Í>É>Ì>É>Å>Ï>½>Í>Ë>È>Å>Å>¨>¼>Å>È>Ë>Í>Á>½>Ð>É>Ï>Ç>Ó>Ë>Ñ>Ñ>À>Å>Ï>ž>Ì>É>Ñ>Á>É>Ç>É>Í>Í>Ñ>¥>Ã>Á>È>Ç>Ç>Å>Ï>±>Ë>Í>Ë>Ç>Ï>Í>>Ç>½>Å>È>«>Ð>Ã>Ï>Å>–>È>É>Ï>Ì>×>Å>Í>Ñ>Ð>Å>Õ>Ë>Á>Ã>Õ>Í>Ë>Õ>Ç>Å>©>Å>Å>Ç>Ã>Í>È>È>È>‰>Û>Ó>Å>ã>Ñ>È>Ç>Ì>Ì>É>Í>Ë>›>Ë>Ã>Ç>Ç>Ÿ>Ð>Ã>Ñ>Å>Ã>Ç>Á>¹>Ì>Í>¥>Ã>È>À>Ñ>É>Ç>Í>Ã>É>É>Í>Ë>Ó>Ç>¹>Å>µ>Í>“>Ï>»>½>Ï>Å>¸>Í>Í>É>Ó>Ï>Ï>É>Ï>Ô>Á>»>Å>É>¿>Ï>Õ>Ô>Ç>Ï>Ó>Ï>M>Ð>Ë>Ó>É>>Ë>È>À>Ô>Ã>Í>×>Ð>Í>È>Õ>Ð>½>Ì>¿>Ï>Ð>Ã>“>Í>Í>¿>Ô>Ç>¿>Ï>É>Á>Ó>É>Ñ>É>Ð>Ñ>Å>Í>É>Ï>¸>È>Ï>Í>Á>À>Í>Ð>Ô>È>Ï>Å>±>È>È>À>Í>Ï>Ë>É>Å>Í>Ô>š>¢>£>Á>Ì>Í>Ð>Ó>Ë>Ë>·>Ð>Å>Á>Å>Í>Ä>Í>Ë>É>Ë>Ñ>Ç>Ã>·>Í>á>Í>Ç>Ô>Í>Í>Á>Ë>Í>Ç>Õ>Í>£>Ã>Ë>Í>Ë>½>Ì>Í>Å>Ñ>Å>Ð>Ë>Í>Ë>Ó>Ï>Ï>Ó>Ë>Ï>µ>Ï>»>·>½>Å>§>Á>Û>¹>»>Ÿ>Í>Ë>Ä>Í>·>Å>Í>Š>Í>µ>Ã>g>È>É>Ï>Ó>Õ>Ì>Í>É>¿>Ë>Í>Ë>×>Å>Í>Ð>Õ>­>»>´>Ç>É>É>Ð>µ>Ï>Í>Ó>Ì>µ>Ä>È>À>Ð>—>Ç>É>ð=Ä>É>À>Ã>Í>È>È>¸>Ë>Ø>Ï>Ï>È>Ë>Ð>Å>Ñ>»>È>Å>Ð>Í>Í>É>Ã>Ã>‰>É>Å>½>©>Ã>Ç>Ô>Ç>Ã>Ë>Ë>Ë>Õ>Ì>É>‘>¸>Ï>Á>Å>Ã>>È>Ï>Ñ>Í>Ñ>É>É>Å>Í>É>Ë>Ì>Ì>Ý>Ï>Ã>Ï>Å>Ñ>Ë>Í>À>Ì>È>Ï>Ã>É>Ë>Í>°>Å>Í>Ã>Ô>Í>Ï>£>Ë>Å>Ì>Ó>Ç>Ë>È>Í>È>Ì>Ð>Í>Å>Ñ>Ë>µ>Ä>Ð>Ï>Ì>Ç>É>Í>Å>Ì>Ï>Í>Ë>£>Ã>Å>Í>Å>­>Ñ>É>À>Ï>Ï>É>Ï>Ï>¿>Ð>Á>Í>Ç>É>Í>¹>Ó>¯>½>À>Ì>Í>É>Í>¹>Ô>Õ>È>³>É>Ñ>Ð>ž>È>»>Å>Ë>Ÿ>Ç>Ç>Ë>½>É>Í>Ã>É>Ï>Ï>Ë>½>Ñ>Ë>Ñ>Ë>Á>Å>Á>Í>µ>Í>Í>o>´>Ô>Ð>Ë>Í>Ñ>Ï>³>Ë>É>Å>É>È>Ð>Ï>Ç>È>Å>Ï>¼>›>È>Í>Ë>É>·>Í>È>Ë>Ì>Ç>Ë>È>É>Í>Ã>É>Ñ>Ã>É>Ì>Ï>A>È>Ï>È>Ñ>Á>½>É>Ë>Ð>É>Í>Ï>Í>µ>Ç>Ð>Ï>Ì>Ï>Í>È>Ï>Ì>½>È>È>É>»>Å>Ì>Ã>>«>Ð>Õ>Ó>Ã>Í>Ñ>Ë>Ç>Ð>È>Ë>É>Ø>Ë>Ç>À>Ç>¡>—>­>Í>É>Ì>Ï>µ>Í>§>Á>Ë>Ï>Å>Ð>É>£>É>Õ>Ï>Ï>Å>»>Ë>¼>Ë>¼>Ë>É>Ä>Ð>Ì>Ð>Ï>ç>Ã>¹>Í>É>£>Í>Õ>É>Í>Í>È>È>Ï>Ð>À> >Ð>Ì>Õ>Ì>×>³>È>Ì>É>³>Ã>É>Ã>É>Ë>Á>€>­>Á>Ï>Ï>É>Ë>Ï>È>Í>Ó>Ù>È>Å>Ÿ>É>Í>½>Ó>Å>Ñ>Ô>É>Ô>Ï>°>»>Ð>ž>É>Í>Ñ>Ð>Ã>Ï>Ð>Ó>Ë>Ë>Í>Ï>À>É>É>Í>Ð>->Ë>¹>™>É>Í>Å>¼>Ñ>Í>Ð>Ï>Ì>Ð>Ó>Ä>È>Ð>Í>Í>Ù>Í>Ï>Á>Ï>Ã>Ë>Ì>;>É>Ã>Í>È>Å>‚>£>Í>Ó>Ï>¹>È>Ç>«>Ó>×>Ë>È>Í>Ë>Õ>ð>Ø>É>Ï>Í>Ó>Á>Ã>¿>Å>Ë>Ì>Ð>É>É>É>¦>Ï>Í>É>È>Í>g>Á>È>Ó>É>Á>»>Ì>Ã>Å>¿>«>Ï>Ó>Å>É>Ë>Ç> >Ë>À>Ç>¡>È>É>Ñ>Ï>Å>Ë>Ë>Ñ>Ï>´>°>È>Ð>Ç>Ì>Ï>¸>Í>Ì>Ë>Ñ>Í>É>È>À>Ç>£>Ñ>Ï>Í>Í>Ã>È>Á>Ï>­>¸>™>È>É>Á>Ã>Í>¸>É>È>Ë>Ô>Ç>É>Ð>Õ>§>Ë>¿>¹>Í>É>Ã>Å>½>×>Ë>Ë>¸>Å>½>»>Å>Á>Ï>Í>È>É>Í>Ï>É>Ñ>È>Ï>Ô>Å>Ï>Ï>¿>Í>Å>Ï>¸>Ñ>Å>Á>Ç>È>À>Ð>Ì>É>É>Ð>È>¡>À>Ó>Í>Å>Ë>Ï>Ë>Ì>Ó>¯>Ð>Ç>Ñ>Ì>Ð>Í>¿>Í>Í>È>½>Ì>Ç>Ó>Ë>½>À>Å>Ë>Ç>Ç>Ð>¼>Ñ>Ð>Í>Ó>È>Ì>Ð>É>Á>É>#>Å>À>Ð>¯>Ë>Ô>Ó>Í>É>·>->Í>Ì>Å>Ï>Ç>¡>Ë>©>Ë>Õ>É>Ì>È>Ï>Í>¼>©>Õ>Å>Õ>Ð>Í>À>Ë>Ï>­>­>Í>Ç>—>Á>Ï>È>!>£>Ë>¿>Ë>È>Ë>Í>Ì>Ì>Ë>Ä>³>Õ>È>ˆ>½>À>·>Ã>Ó>Á>Ï>Ï>Ë>É>Ñ>Ð>Ë>¼>Å>ˆ>Á>×>Ø>Á>Ë>Ì>¬>Ô>Á>Ë>Ó>Ë>Ó>°>Ë>½>Ã>É>Ð>Å>Ï>Ç>Á>È>Ð>½>Ï>À>Ë>Å>»>Å>È>Í>Á>Ó>Ð>Ä>Ã>Õ>©>Ä>É>É>Ñ>À>È>°>Ì>Ç>Ë>Í>Ï>Å>µ>Ä>Í>Ä>É>Í>Ë>I>Ä>É>Ð>Ä>¬>È>Ë>Ð>Ô>Ã>Ï>Ç>Í>Ï>¿>Ñ>Í>½>È>Ï>Ð>¿>Í>À>Ô>´>À>Ë>´>Á>Ç>È>Ä>×>Ë>Í>Ë>Ã>Ï>Ì>Í>Ï>Ñ>É>Ë>¸>Ë>Ë>Ã>Ç>Ó>±>Ð>Á>Ç>Í>É>Ç>Ë>Ð>³>É>¿>Ð>È>É>Í>Ì>Í>Å>Ð>©>È>½>Ç>Ì>É>Ë>Ç>¹>Ï>È>Ñ>É>È>È>Å>Ç>Ñ>É>Ã>É>Ñ>Ç>Ñ>Í>´>Í>È>Ð>>Ï>Ç>É>É>°>Ë>É>Ð>Í>Ð>Ã>£>Ù>Ñ>©>Ì>§>Ï>Í>Ã>Ï>Ë>É>È>Ç>£>½>µ>¿>Ë>Á>Ë>È>Ç>Ë>Å>Ã>È>Í>³>Ð>Å>»>Å>Ë>Í>È>Ï>Ó>Ç>Ì>Ï>¯>È>Ð>Ó>Ï>¹>­>W>Ñ>Ë>¨>Å>Õ>Ç>Ï>Ã>Ð>É>Ã>É>Í>Ë>Ç>É>É>Ë>Ë>Í>Ï>¹>Í>È>Ë>Ë>»>Í>Ì>£>Í>Ì>Å>Õ>->Í>Õ>É>Ç>Ñ>É>Í>Í>É>Ç>»>Ç>É>Ï>Ã>Ô>Å>Ï>Ï>É>Ï>Ñ>Å>Ì>©>Ï>Ë>½>Ç>×>µ>Ï>Ã>Ó>Ë>È>Í>°>Ó>Å>Ï>¹>Ñ>Ð>Ó>Å>Ì>Ã>Á>±>Ç>¸>×>É>Ð>Í>Ë>Ä>Ä>¸>§>È>Ó>Ï>Ì>Ï>È>Ë>Å>Å>É>À>Å>Í>Í>­>Ë>¿>Ç>Ï>´>Ï>Ì>½>¸>Í>Ï>È>Í>Ç>Ï>Ì>±>É>>Í>µ>É>Í>Ç>Ì>Ë>Ë>Ó>›>Ï>È>Å>Ï>µ>Ì>Ä>Ë>Ð>Ø>¿>Í>Ë>Ð>Ì>Ì>Ð>À>È>Ð>Í>É>À>Ï>¿>É>Á>Ð>Å>É>Á>Ø>Ó>Ð>È>Ë>×>Í>Å>Í>Ï>Ç>Ë>Ð>Ë>É>Ñ>Ë>½>Ë>Í>Ã>»>Ð>Ï>Ä>Í>Ð>Ä>É>É>ª>Ç>Ó>Ë>Á>Ï>Å>Ñ>È>Ð>Ï>Ñ>Í>Ì>¹>Ÿ>Ë>È>Å>Ï>Ï>Ï>Í>Ç>Ì>É>Í>Ë>É>Ï>Í>Í>Ë>È>Ð>Ï>Ì>Ë>Ã>Ó>×>Ë>>¥>Ã>Ñ>Ç>Ï>Ã>Å>È>È>Ë>Ï>É>Œ>Ï>È>°>Å>Ñ>Ï>Ç>Ã>Ë>È>×>Ô>Ì>Ì>È>Å>Ï>Å>Å>£>Ð>Ï>É>Ç>É>Ä>¹>#>É>Í>Ç>½>À>Ÿ>Ó>Ç>Ë>Ù>Ë>Á>Ï>Ï>Ø>Õ>È>Í>Ð>Í>Å>¿>Ë>Ð>¨>È>Ë>È>Ï>¯>Ð>È>Ï>Ì>Ì>Ó>§>Ð>Í>Ð>Ë>»>Ì>Í>Ã>Ë>Ã>Ï>Ð>Ã>Å>Ë>Ç>È>É>Å>Ç>É>Í>Ð>Ë>Ð>Ë>Ä>Í>Á>Á>Ñ>l>É>Ï>Í>Ô>Ó>Ô>Å>É>Ç>ž>«>Ð>É>Ì>Å>Ë>È>¢>Í>Ð>Ð>Ð>¦>»>Ë>½>Ï>Ã>Ë>Ã>À>È>Å>Ô>«>È>½>Ã>È>Ð>Ë>Ì>Ã>¸>Ë>Ì>‘>Ã>Á>»>Ë>È>Ó>³>Ã>Ï>É>Ï>Ï>Ç>Í>Ñ>Å>É>‡>Ã>Ç>½>Ë>Ó>Ð>È>Ë>É>Á>Ÿ>È>¿>Á>Ï>Ç>Ó>Ð>Ô>Ç>Ð>É>Ì>É>Ì>»>Ï>Ë>Å>É>Ã>Û>Ë>Ï>Ð>Ï>×>Ï>Í>Ó>Ë>Ó>Å>Ë>­>Ì>Å>Ã>Ð>É>Ç>»>Ó>·>É>Ï>Ï>Í>Ç>Ã>Ç>Ì>É>Ï>Í>Ô>Ë>Ë>Ï>Ï>É>»>Í>Ç>Í>¿>Ã>©>½>Ï>Ã>É>Ã>Ë>Å>Ø>Ð>Ð>Ø>­>Í>×>Í>Ë>§>Ç>Ì>Ë>Ñ>Í>§>É>¸>Ï>½>À>È>¼>É>È>Ï>È>Í>Ë>À>È>Ï>¼>Ë>Ï>È>Ì>Ï>Ä>­>Ñ>Ï>Ð>Á>Ç>É>É>Ë>Ð>¼>’>Ä>«>´>Ï>Å>Ï>Ñ>É>Ð>Ì>Ð>Ó>Í>Í>Ó>Ñ>Ì>Í>Í>É>Ñ>Ó>É>Ï>Ð>Ì>Ì>Ä>Ë>Ñ>Ë>½>Ó>Ç>Ç>È>¯>Í>Ã>×>É>Ç>Å>Í>¿>Ã>Ð>±>Ï>§>©>½>É>Ï>É>Ñ>¹>Ì>Í>Ç>¼>Ì>É>Ô>É>Ë>¸>×>Ã>Í>Å>Ã>È>©>Í>È>Ó>½>Ì>È>É>É>W>Ë>È>Ì>µ>Ï>Ç>Ñ>Ë>¹>Í>Ñ>5>Ã>Ì>Ë>Ë>Õ>À>Ð>Ä>¿>É>Ó>É>Ð>Í>É>Õ>Ï>Í>Õ>È>¿>Í>É>Ç>Í>µ>È>>Ñ>Í>Ë>Ç>À>Ç>¿>È>É>Å>Ñ>Ì>Ï>Í>Á>Ë>¬>Ñ>À>É>Ñ>Ë>¯>Ó>Ë>Í>Å>Ë>Ñ>¹>Ë>Ï>Å>Õ>È>¸>Ï>Ð>É>È>±>Ñ>Ã>Ñ>Å>Å>Á>Í>Í>Ë>Ó>Í>Ã>È>Ä>Å>Í>Ñ>Ç>Ï>Ë>À>Ã>Ñ>Í>È>Ï>Í>Ó>Ë>Å>Ð>Å>Í>Í>Ï>É>Ô>Á>Ï>Ã>Ð>Ó>À>È>Ã>Å>É>À>Ì>Í>Ç>Å>É>Á>Ë>Ï>Ï>É>»>Å>Á>Ï>Ñ>»>Ñ>Ä>Ç>Å>É>È>Ô>É>Õ>Ë>Ý>È>È>°>É>·>É>É>Ë>Ñ>Í>Ç>Ë>É>Ô>Ø>Ï>Ï>§>É>Ï>´>Ç>Ñ>Ç>½>Ð>Ï>£>É>‡=Ë>Ç>Í>Í>Ç>Ó>>Ó>Ì>É>Ç>È>Ð>Ä>Ã>Í>È>Ë>Ð>µ>Í>Ð>Ñ>Ï>Å>È>Í>Ñ>Ñ>¹>É>É>Å>È>£>¥>Å>À>Ð>È> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/18.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/18.0 new file mode 100644 index 0000000000000000000000000000000000000000..4fe38e7039ce3617b6fdf2f22d801c765f859532 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/18.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/19.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/19.0 new file mode 100644 index 0000000000000000000000000000000000000000..ee034b4bd387ceec99162111170f0d3d66e1da40 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/19.0 @@ -0,0 +1 @@ +Ó>Ó>Ù>Õ>>ß>Ù>ß>Õ>à>Å>á>á>×>Ý>×>Õ>Ý>Ñ>Õ>Ñ>Ù>ß>Ë>Å>Ë>Ý>œ>Ù>¢>Ý>×>Ë>Û>Í>Ñ>ß>Ó>Ï>Ù>Á>Ý>È>Ï>Ü>½>Õ>Ð>Ñ>×>È>Ü>Ã>Ù>Õ>×>Ý>Ë>Û>«>ß>×>×>Û>Ó>Ü>Ù>×>Ô>à>×>Ø>á>É>Å>ß>Ù>Û>Õ>ß>È>Õ>¥>Û>Õ>Û>ß>—>Ø>Ù>Õ>Ù>Û>Õ>Ý>Ø>Ý>Ø>Ý>à>à>Ý>ª>…>Û>Ý>Ý>à>Ü>Ù>Ù>Ù>×>Ù>×>Û>Û>Ø>Ù>Õ>É>Ù>Ý>×>×>Ø>Ù>Ü>Û>Ý>Ý>à>Ð>ç=Ø>Ë>Ó>Ü>Ù>Û>Ã>Õ>ß>Å>Ñ>Ù>¡>Ó>Ù>Û>É>á>Ó>Ï>Û>Ù>Ù>Ý>Ï>Ó>¸>×>È>Ë>Ñ>½>Á>ß>·>Ù>×>Ø>ß>Ù>¹>3>Ý>Ý>Ý>Ñ>§>×>Û>Û>Ð>Ù>Ø>Õ>Û>à>Á>ß>á>Ó>š>Ý>×>Ý>Û>¥>Ð>Û>Ó>Ý>Ø>É>ß>Ù>Ý>Ó>×>×>˜>á>Ç>×>Ó>×>Ù>ß>ß>Ô>Û>Ï>ß>×>À>Û>Ø>×>Ë>Ù>ß>Ñ>ß>Û>Û>Ù>Ë>Ó>Ù>Ù>à>Õ>ß>Û>Ô>Ñ>Õ>ß>å>Ë>Û>Ø>¹>Ô>×>à>×>à>Õ>Ø>Û>Ó>Ô>×>ª>Û>Ù>Í>Û>Ù>Ý>ß>ß>Õ>Ñ>Õ>Ø>Ý>Ù>>Ù>Û>Ù>Õ>ß>á>Ù>Û>ª=÷=×>Ù>Ë>Ë>Õ>ß>³>ß>Ñ>˜>è>Ó>Ý>Ó>Í>Ù>Ç>Ý>Õ>Ü>É>ã>>Ð>Ì>×>Ñ>×>§>×>Ý>Ù>Ù>»>Ù>×>Õ>Ó>×>×>Ü>Ý>Õ>à>¿>à>Ý>Í>×>ß>Ý>Ð>Ï>ß>Ý>»>Ø>Ñ>Ï>Ì>×>Ô>Ù>Ì>ß>×>Ý>Ü>Ü>Ø>é>Ý>Õ>Ð>Ù>ž>×>Ù>Ø>Ç>Õ>%>Ý>Ý>Ý>Ñ>É>Ó>Ø>à>×>Ù>¹>Õ>Ë>Ù>Ð>¸>Û>Õ>Ý>Û>ã>Ð>Ï>×>Ó>Ð>×>Ù>Ó>ß>Ù>Ü>Ï>ß>Ý>Ï>§>Ë>×>Ø>½>Ý>Ñ>Õ>à>³>Ù>Ý>Ð>Û>»>Ü>Ù>Ø>Ç>Ø>Ù>À>Ù>Ù>Í>Ý>Í>Û>Ù>Ü>Ý>Ø>È>Ý>—>×>Ó>Ó>Û>Û>Ó>Û>Ü>Ý>É>Ù>Ô>Ñ>Õ>Ù>Ø>Ù>á>×>Ù>Ý>á>Ø>Ð>Ù>°>Û>×>Í>Ý>Û>Ñ>Õ>×>×>Ø>Ù>§>Ã>ß>Õ>Ý>Ù>Ø>à>Ë>Ç>Ù>Ù>Û>Ù>Õ>Ø>Ý>Ù>Û>Õ>Ñ>Ó>Ñ>ß>Ù>Ù>Ù>¨>Ó>Û>Ø>Ù>Û>Û>Ø>Õ>×>»>Ý>Ý>Ó>Ù>´>Ó>×>Í>Ó>«>Ý>Ø>Ð>Û>Ï>µ>à>Ï>Ó>Ó>À>©>Ù>Í>Ù>à>×>Ó>Û>Ó>µ>Ó>Í>Ð>Ø>×>Ë>Ü>Ñ>³>Ý>™>Û>Ñ>Ó>Ù>Ó>Ù>Å>Ï>×>Û>Ð>è>à>Û>Ù>ß>Û>Õ>Ñ>½>ß>Ì>å>à>Ì>Ø>×>Ø>×>Ð>à>Ï>Û>Ù>Ñ>Ø>«>Í>Ë>Ý>ß>ß>Ð>Õ>×>È>×>Ø>Ù>Ý>Ì>À>á>ß>Û>Ù>Ø>¹>Ù>Û>Ñ>Ç>Ù>Ý>À>Ý>Ý>ß>>Ù>à>Û>Ç>Í>Ù>Ó>Ï>Õ>É>×>Û> >ß>á>Ù>Ù>Ç>Ý>Ñ>Ï>Ø>Ý>è>Ý>Õ>Õ>×>×>Ý>Í>Ñ>­>Ô>Ù>Ï>¹>Û>å>ß>Ó>Õ>×>Ù>Ð>Ø>¿>ß>Ù>×>á>O>Ý>Ý>Ù>à>´>Õ>›>Ý>Ù>Ù>Ù>Ã>Ä>Í>Ï>Ù>Ï>Û>Ý>Ñ>Õ>à>à>Õ>×>×>>Ü>Ù>Õ>Ý>Ù>½>Õ>Û>Ý>Ô>Ñ>Ø>Ñ>Ù>Ý>s>±>ß>Ù>×>×>å>Ø>Ù>ß>Ü>ã>Û>×>Ø>á>œ>Õ>Ð>Ì>Ó>Ñ>Û>à>Ô>É>ß>Ë>»>Ñ>×>×>Ý>Ð>Ó>×>à>Ý>Ç>×>Å>‹>Ó>Ý>Û>Ó>Ô>Ý>Í>Û>Ñ>à>Ý>Û>ß>ß>·>Ë>×>Û>À>Ø>Ý>>Ó>×>×>à>×>Ù>Ñ>ß>Ù>ß>Ø>Ë>Ù>Ý>Ý>á>×>Ù>Ñ>á>Ý>Ó>É>Ý>Ð>ä>Ø>Ù>Û>à>á>Ù>Û>Ë>Ù>Ë>Õ>Ä>Ý>×>ß>´>Ÿ>á>Ø>×>Ñ>×>ß>×>Ý>Ù>Ù>×>Ý>Ó>Ñ>×>Í>Ð>Ý>Ù>Ý>Ù>Ó>Ù>É>Û>Ó>Ø>Ø>Ñ>Ó>Ñ>à>Ý>Ù>%>Ù>ß>Õ>Ï>ã>Õ>g>Ø>Û>Ñ>Ñ>Û>à>Ø>Ü>È>Û>ä>Ð>Ù>Å>Ù>Û>ß>«>Ý>Ó>ß>Ù>Ù>ß>Ï>Ã>×>Ø>Ï>Ü>Ý>À>ß>×>ß>×>Ð>—>0>Ñ>Ý>ß>Ù>Ø>ß>Û>>Ø>Ý>Õ>Ô>Ð>Û>à>×>×>Ñ>ß>Ý>×>Ý>ß>Ì>Û>Å>Ó>Ï>Ù>Í>É>Õ>×>à>Ù>Ó>Û>Ý>Ð>Û>Ù>Ó>ß>¤>Ó>Ó>Õ>Ý>É>Å>Ó>×>Ù>Ñ>Ð>Û>á>Ù>È>Ë>á>»>Á>Ø>Ø>à>•>×>Û>Ù>Ñ>ß>Ð>Ï>Ð>³>ß>É>>Ý>Ü>Ý>á>Û>Ù>á>£>Ù>È>¿>á>Õ>Í>Ý>Ñ>Õ>ß>Ù>Ý>Ý>È>à>Ñ>Ý>Õ>Û>Ð>Ç>Ù>À>à>Ý>¨>à>Ð>Ø>ß>Õ>Ù>Ü>Ï>Ù>Ï>Ñ>Ø>á>>×>Ø>Ý>Õ>Ý>Ù>Õ>Ó>Í>Ù>Á>ß>Ù>Ý>Ý>Ù>ã>Ù>Ý>>×>Ñ>Ø>à>ã>É>Ø>Ü>à>Ý>×>×>È>Ø>×> >Ù>á>Å>á>Ï>Ø>×>Ø>×>×>à>\>ß>Ó>Û>à>¨>Ø>ß>Õ>Ý>×>Ð>Õ>à>Õ>Ù>Ø>¸>×>Ñ>Ù>Õ>“>Û>×>Ï>Ø>Ù>Ù>Ù>Ó>ã>Ø>É>Í> >É>Û>Ç>Ø>—>Õ>Ë>×>¸>á>±>Ø>Ó>×>Ù>×>Û>Õ>á>ã>×>Ü>ß>Ý>à>È>Á>½>Ï>Ë>Ý>Ó>Õ>ä>Ý>Ý>ã>Û>×>Õ=£>Ñ>Ý>Ý>Ñ>›>Õ>Ù>Ù>Ø>¹>Û>à>×>×>×>Õ>Ð>ß>Û>Ç>×>Ù>Û>Ø>Í>>Û>Ý>Ø>Ø>Ý>½>Ó>Û>Õ>ß>Ø>Ñ>Ñ>×>Ï>Ý>Ù>Ë>Ô>Ô>Ä>ü=Ñ>à>É>×>Ý>á>Ý>Ð>Ý>ß>×>Ë>Û>Ù>×>Õ>Ø>»>Û>×>Ý>ª>Ð>Õ>Ù>×>ß>Õ>à>Ü>Ô>Ñ>Ù>à>×>Ó>Ñ>Û>×>Ð>Ý>Õ>Ø>Ý>É>Õ>³>Û>Í>Ù>Ë>×>Ý>Ô>Ý>Ó>Õ>Ü>Ù>×>Ñ>ã>Õ>Ù>Ù>Ý>à>Ù>Û>á>×>à>Ý>ß>Ó>Ô>Á>Õ>à>à>Ä>Õ>Ð>ß>£>ç>µ=Á>ß>Û>Ñ>Õ>Ü>Ø>Ù>Ý>Ø>Õ>×>Ù>Õ>Ü>Ã>Ù>Ð>Ü>×>Ñ>Ù>Ü>Ð>Ø>Ý>Û>Ù>à>Ô>Ó>Ä>Õ>Ô>Õ>×>Û>×>×>?>Ñ>×>à>Ü>ß>Ù>à>Ù>Ï>×>Õ>Ç>à>Ý>Õ>á>×>Û>Ë>Ý>Õ>Ù>Ý>Ý>ã>Ì>Ù>É>Ø>×>Á>Ë>×>Ù>Ñ>Ë>Ñ>Ù>»>à>Ó>ß>Ý>Û>Ñ>m>Ø>Ó>Ô>Ý>Ü>Û>ã>á>Ù>Ð>Ð>Í>à>™>Õ>Ý>×>ß>×>Ù>Ø>Ô>×>Ù>Ð>Ù>Ý>Ø>Ð>×>Ù>Û>Ù>ß>Ý>Ý>g>×>À>Ù>Ð>Ô>Õ>Ù>Û>Ý>Ë>×>ß>Ø>Ù>Õ>Ã>Í>Ø>Ù>Ü>Ý>Ð>Û>Ø>Ü>ß>Ð>Ù>ß>á>É>Ý>Û>Ø>Û>Û>É>Û>Ø>Ø>Á>Ì>Ñ>Ñ>Ñ>Õ>Ó>Ï>»>°>£>×>Í>×>­>á>Ø>Õ>×>×>Õ>Ñ>Ù>Ñ>Ý>Å>Õ>×>Ý>Ñ>«>×>Ð>Ù>¹>Ó>Ý>Ó>Ó>Ã>Ó>À>ã>Ø>à>«>ß>ß>á>Û>Ý>Ý>Û>¸>Ý>Õ>Ù>Ý>Õ>×>Ü>Ô>Ù>á>Ø>Ù>Ó>Û>à>¼>×>Ý>×>×>Ø>Ü>Û>Ó>Ó>ç>Ù>Ù>Õ>Ã>ß>Õ>á>Ø>Ã>Ù>Õ>Ù>ß>Ñ>Ù>ç>Ý>Õ>Ñ>Ô>Ë>¸>Ù>E>Ù>×>Í>Ø>Ø>×>×>×>Ó>ß>Ù>à>ä>Ý>Ø>§>¿>Ý>Û>×>Ù>Õ>ª>Ó>à>Ü>Û>Ô>»>Ë>Ý>ä>Õ>©>Ù>Ý>Õ>Õ>Ô>¸>Ù>á>Ó>å>Ý>Ó>Ý>å>×>Ô>ß>×>Ù>Ø>Ï>Ü>å>×>Ã>Ó>Û>Ø>Õ>Ô>Ï>à>È>Ù>Ü>»>Ó>Û>Ù>Á>×>Ó>Ë>Ç>°>Ó>Ù>Ø>Ý>Ñ>á>Å>Ë>Ü>Ó>Ð>¨>Ù>±>Ô>¯>Û>à>Ù>à>Ñ>Ç>ß>Ù>˜>Ü>Ü>Ñ>Å>Ù>Ý>Ü>Å>Ø>Ü>à>Ù>Ù>Ý>Ý>ß>›>Õ>Ù>Ù>Í>Û>Ü>Ð>Ù>Ð>Á>Ø>Û>Û>ã>×>Ð>ß>Õ>×>Û>Ñ>×>á>Ø>Í>Û>Ñ>Ð>ß>Õ>±>È>Ð>Ù>Ù>Ù>Ï>Ð>Ý>Ó>ß>×>Õ>Ñ>)>Ý>ß>Û>Ð>×>×>Ì>Õ>Õ>»>Ù>Ñ>Ç>×>Ø>×>Ô>×>×>Ñ>Ý>×>×>á>¯>ß>Ñ>À>Ð>Ù>Ç>×>Ù>Õ>Ù>Ù>Õ>ß>Ø>Ý>Ý>©>È>Ý>Ë>Ü>Ï>Ô>Í>Ñ>×>Û>Õ>×>Ù>Û>ç>Ù>Ù>Ó>ß>×>Ü>ß>×>Ù>×>Õ>Š>Ý>Õ>Ñ>Ù>É>×>Ø>×>Û>Ù>Û>Ã>Ù>Ý>ë=Ñ>À>Ù>Í>Ù>Õ>Õ>ß>×>Ü>Ó>×>Ø>×>È>×>ª>Õ>å>>×>Ù>Õ>Û>°>Ð>Í>Ô>×>ß>‘>Ñ>ß>Ø>Ý>Ù>Í>Ó>Ó>Ë>›>Ñ>É>Ø>Ý>Ø>Ø>ß>È>Ñ>Ô>Ü>×>W>Ù>Û>Ù>Ï>Ø>Õ>Õ>á>Ô>Ó>Ð>Ý>Ó>×>©>ß>Ù>Ñ>ß>Í>Ï>Ð>Ð>Û>È>ß>É>×>×>¥>Ó>¸>¯>Ø>Û>å>Ó>·>Ð>Ü>Ø>à>á>à>Ñ>Ó>Ý>Ð>Ü>Û>ß>×>Ø>Ý>Ý>Í>Ý>×>Ý>Ï>Ù>Ó>¤>Õ>Ù>Ó>Ù>à>Ð>Ø>ß>Ô>Õ>Ù>×>×>Ü>Õ>Ý>Å>Ý>Ë>Ø>Õ>Ï>§>È>Õ>Õ>×>Ý>Í>É>Û>Ó>Ù>Ô>ß>Ù>á>à>Ï>Ó>Ý>˜>Ù>Ó>à>Ñ>Õ>Ù>Ø>Ý>Ý>á>¦>Õ>Ñ>Û>Ñ>Ó>Ñ>à>´>Ó>×>Õ>Ù>Ü>ß>—>Õ>Ï>×>Ø>¥>ß>Ð>Õ>Ñ> >Õ>Ý>Ù>Ü>å>Ñ>Ý>á>ß>Ó>ß>Û>Ñ>Ï>ß>Ø>Û>á>×>Ð>³>Ó>Õ>Ù>Ñ>×>Û>×>Ó>>ç>à>Ð>å>Ù>Ó>Ó>Ù>Ý>×>Ý>Ø>£>Ù>Õ>×>Ù>>Ý>Ñ>ß>Í>Ô>Õ>Ï>È>Ü>Ø>›>Ï>Ó>Í>ß>Ø>Ø>Ü>×>Ù>Ù>Õ>Õ>Ã>Ø>É>Ñ>Ã>Ø>ˆ>ß>Í>Ï>Õ>Ð>Ç>Ù>Ù>Ý>é>Ý>ß>Ù>ß>à>Ð>È>Õ>×>Í>×>ß>Ý>×>Û>á>ß>5>Ù>Ø>à>Ø>>Ø>Ø>Ç>ß>Ó>Õ>ã>Û>ß>×>ã>Ý>É>Ø>È>Ø>Ý>Ð>>Û>Ù>Ë>à>Ù>Í>Ù>Õ>Ð>ã>×>Ý>Ù>ß>Ý>Ô>Ø>×>ß>Ã>Ó>ß>Ü>Í>Ë>Ý>Ù>ß>×>Ù>Ó>½>Ñ>×>Í>Ý>ß>Õ>×>Ó>Ù>á>—>£>>Ñ>×>Ø>á>á>Ù>Ø>Á>à>Ô>È>Õ>Ù>Õ>Ù>Ü>Ù>ß>á>Ñ>Ð>Á>Ù>á>Û>Ó>ß>Ù>Û>Ð>Ù>Õ>Õ>Á>ß>¯>Ó>Ü>Ù>Ý>Ë>Ù>Ù>Ñ>Ý>Ñ>å>×>Ù>×>Ý>Ý>Ù>á>Û>Ý>Á>Ù>Í>Ã>Ï>Ó>¯>Ï>ã>È>É>¥>Ø>Ù>Ñ>ß>É>Ó>×>w>Û>Ä>Ñ>A>Ý>×>Ý>Ý>Ý>Ù>Ù>Õ>Ë>Ý>Ü>Ù>ß>Ñ>×>Ý>à>©>È>Á>×>×>Ô>Û>Ç>Û>Ù>ä>Ù>À>Ó>Ù>Ð>Ó>•>Ø>×>«=Ó>Õ>Ï>Ñ>Ù>Õ>×>Å>Ý>á>Ù>ß>×>×>ß>Õ>Ý>Å>Ù>Õ>á>ß>Ý>Õ>Ï>Ð>>×>Ô>É>±>Ð>Õ>ß>Ó>Ô>Ù>Û>Ù>Ý>×>Ø>ˆ>Ë>Û>Ë>×>Ð>>Õ>à>Û>Ù>à>Ý>Ù>Ø>×>×>Û>Õ>Ý>ç>á>Ñ>Ù>Ó>à>Ù>Û>Í>ß>Õ>Ý>Ó>Ø>×>Ý>¹>Õ>Ý>Ð>Ù>Ü>Ý>¬>Ô>Ó>Ý>Ý>×>Ý>Ù>Ø>×>Ù>à>Ù>Ñ>à>×>»>Õ>Û>Ø>Û>Ô>Ù>Ù>Õ>Û>Ù>Ý>Ù>¨>Õ>Ù>×>Õ>»>à>×>Ñ>Ý>Ý>Ù>Ù>Ù>Ð>Ý>Ð>×>Õ>Ó>Ù>Ç>Ý>½>Ë>Ñ>Ü>Û>Õ>Û>É>ß>Ý>Ó>Ã>×>ß>Û>›>Õ>È>×>Ù>§>Ñ>Ó>Ù>Ç>Ù>Õ>×>Ð>ß>à>Û>Í>ß>Û>á>×>Ï>Ñ>Í>Ý>Ä>ß>Ù>@>À>å>Ý>Ù>Ù>ß>Ù>½>Ù>×>Ð>Õ>×>ß>à>Ó>×>Ó>Ý>Ë>–>Õ>Ý>Ù>Ù>»>×>Õ>×>Ù>Ó>Ù>Ñ>Ø>Ý>Ñ>Ù>á>Ó>Ù>Ø>Ý>)>Õ>Ù>Ø>Ý>Ï>È>Ô>×>Ý>Ø>Ù>×>Û>Á>Ù>à>ß>Õ>Û>Ý>Õ>ß>Ù>Ï>Û>Õ>Ø>Í>Ó>Ù>Ñ>‰>¼>Ý>à>ß>Ð>×>ß>Õ>Ø>ã>×>Ø>Ù>á>Ù>Ó>Ð>Ó>­>£>°>Û>Ù>Ù>Û>À>Ù>¨>Ð>Û>ß>Õ>ß>Ó>£>×>á>ß>ß>×>É>×>Ï>Ù>É>Ù>Ø>×>Ù>Ù>Ý>à>Û>×>È>×>Õ>£>Ý>ß>Õ>×>Û>Õ>Ø>Ý>Ý>Ë>ˆ>à>Õ>ß>Ù>á>¿>Û>Ñ>Õ>½>Í>Ø>Ó>×>Û>Ó>U>³>Ï>Ý>Ý>Ø>ß>Ý>Ñ>Ý>à>ß>Õ>Õ>˜>×>Ý>Ë>à>Ô>Ý>à>×>Ý>à>¿>É>Ý> >Ù>Ý>à>Ý>Ð>Ø>ß>à>Ù>Ù>ß>Ù>Ð>Ñ>Ù>Ù>Ü>Ü=Ø>Å>§>Ù>Ý>Ñ>É>ß>Ý>Ý>Ý>Ý>ß>Û>Ï>Ù>Ý>Ù>Ý>å>Ù>Û>Í>Ù>Ó>×>Û>>Õ>Ð>ß>Õ>Õ>‹>­>Ù>ß>Ù>Å>×>Ó>¹>ß>å>Ø>Ù>Ø>×>à>×>á>×>á>á>à>Ï>Õ>È>Õ>Ø>Ù>Û>×>Û>Ý>¦>á>Û>×>×>ß>C>Ð>Ù>ß>Ô>Ð>Ë>Ü>Ó>Ó>É>µ>Û>à>Ó>Û>Û>Ñ>§>Û>Ñ>Ñ>§>×>Ý>Ý>à>Ð>Ø>Û>ß>Ü>¿>¸>Õ>ß>Õ>Û>Ý>È>Ù>Ù>Ù>ß>Ø>Û>Õ>Ð>×>­>ß>Ø>Û>Ø>Ñ>Ø>Ó>Ý>°>É>•>Õ>Õ>Ñ>Ð>á>Ï>Õ>×>×>ß>Õ>Ø>ß>Ù>­>Ø>Ï>Á>Ý>Ù>Õ>Ó>Ð>Ý>×>Û>»>×>Í>Ë>Ó>Í>ß>Ý>Ø>Ù>Û>ß>Ù>Ý>Ó>Ù>ß>Ð>Ý>Ý>Ð>Ø>Ó>Û>Ç>Ý>Õ>Ë>Õ>Ô>Ð>Ü>×>Ó>×>Û>Õ>¡>Ë>Ù>ß>Ñ>Ø>Ý>Û>Ü>Ý>¹>Û>×>Ý>ß>Ý>Ý>Ì>Ù>Û>Ø>Í>Ý>Ó>ß>Õ>Ë>Ð>×>Ý>Ø>Õ>Û>Ë>ß>ß>Ý>ß>Ó>Ø>Ý>×>Ð>Ü>Õ=Õ>Ï>Û>»>Ù>Ý>Û>Û>Ý>Å>÷=Û>Ü>Ó>Ù>×>>Ü>¯>Ù>à>×>Ù>Õ>Û>Û>Ç>¡>ß>Ñ>ç>Ý>ß>Ó>Ø>Ý>³>¸>Ý>Ó>>Ó>Ý>×>Ð=’>Õ>Ë>ß>×>Ù>×>Ù>Ü>Û>Ô>À>ã>Ø>ƒ>Í>Ë>Ã>Ô>å>Ó>Ù>Ý>Ø>×>à>ß>×>È>×>i>Ï>ä>Ý>Ñ>×>Ù>¹>à>Í>Ø>á>Ù>Ý>À>Õ>Ë>Ñ>×>à>Õ>ß>×>Í>×>Ý>Ï>Ù>Í>Û>Õ>Å>Ô>Û>Ù>Ñ>Ý>×>Ó>Ð>ã>³>Ð>Ó>Õ>ä>Ï>×>¼>Ù>Ù>ß>×>à>Ñ>Ä>Ô>Ù>Ù>Õ>Ý>×>">Ó>Ø>á>Ô>¸>Ø>Ø>à>ß>Ñ>Ý>Õ>à>Ý>Ñ>à>ß>Ë>Ó>Ù>Ý>Í>Ù>Í>ß>·>Ð>ß>Ã>Ï>×>×>Ñ>å>Õ>Ü>Ù>×>ß>Û>Ù>Ø>ã>Ù>Õ>È>Ù>×>Í>Õ>Ý>»>Ý>Ì>Õ>Ù>Ø>Ø>Û>ß>¿>×>Í>á>×>Ø>á>×>×>Ñ>ß>¯>Ø>Í>Ñ>Ü>Ø>Õ>Õ>È>Ø>×>Û>Ü>Ó>Ù>Ñ>Ù>Ù>Ø>Ð>×>à>Ó>ß>Ý>Ä>Ý>Õ>Ù>˜>Ý>Ó>Õ>×>¸>Û>Û>Ø>à>Ý>Ð>>ç>ß>¬>×>°>Ý>Ü>Ñ>Ø>Õ>Ó>Ó>Ñ>˜>Ë>½>É>Ø>Ð>Ù>Ó>Õ>Ý>Ó>Ñ>Ó>Û>¿>Ù>Ñ>Ç>Ð>Û>Ø>Ó>Û>à>Õ>Ù>Ù>»>Ù>Ù>ß>×>À>µ> >ß>Ø>­>Ø>Û>Ô>Ü>×>Ý>Õ>Ñ>Ó>Ü>Ù>×>Ù>Õ>Ø>×>Û>Ý>Å>Ý>×>Ù>×>È>à>Ù>Ÿ>Ü>Ù>Ó>á>>×>å>×>Õ>á>Û>Ü>Ù>×>Ý>Í>Õ>×>à>Ñ>Ù>Ð>Ý>Ý>×>Û>Ý>Ó>Ù>»>Û>Ù>Ë>Õ>ã>Å>Ý>Õ>Ý>Ô>Õ>Ý>À>×>×>Û>Å>ç>ß>á>Ó>Ý>Õ>Ï>¿>Ñ>Ã>ã>Ù>à>ß>×>Õ>Ñ>Å>¬>Õ>á>Ù>Ù>Ý>Ù>Ø>×>Ñ>×>Í>×>Û>à>»>Ø>Í>×>Ù>Å>Ý>Ü>Ï>À>ß>Û>Õ>Ù>Ø>à>Ù>À>Ù>Ÿ>Ü>À>Ø>Ý>Û>Û>ß>Ù>Û>¥>à>Õ>×>Ý>Á>Ý>Ó>Ø>ß>Ó>Ï>Ù>à>á>Ù>Û>ß>Ñ>×>Û>Ù>×>Ñ>Ý>Ï>Õ>Ð>Ý>Ñ>Õ>Ñ>á>Ý>ß>×>×>á>Ý>×>Ù>ß>Ù>Ø>Ý>×>Ø>à>Ü>Í>Ù>Û>Ô>Í>Ý>Ù>×>Û>Ý>Ó>Ý>×>³>Ô>à>Ù>Ñ>Ý>Ñ>Ý>Ü>à>Û>ß>Ù>Ù>Ë>Ÿ>×>Ù>Ô>Ý>Ù>ß>Ø>×>Ý>×>×>×>Û>Û>Û>Ø>×>Õ>Ý>Ù>Ù>Ý>Ó>Û>ã>×>˜>µ>×>Ý>Û>Ý>Õ>Ñ>Õ>Ø>Ù>Ý>×>‡>Ý>Û>¹>Ô>Ý>Ü>Õ>Ñ>Ø>×>å>Ý>Ø>Ý>Û>Õ>Ý>Í>Ó> >ß>Ø>Ø>×>Ù>Ï>È>Ü=×>Ù>×>Ñ>Ì>­>à>Õ>Ù>á>×>Í>Ý>Ý>å>ß>×>Û>ß>Ý>Õ>Ð>Ù>à>±>×>Ý>×>Û>·>ß>Û>Ù>Ù>Ø>ß>¡>Ü>Ý>Ù>à>Ë>Ø>Û>Í>Ó>Ñ>ß>Ý>Ñ>Õ>Ý>×>Ù>Õ>Õ>×>Ø>Û>Ù>×>à>×>Ð>Ý>Ï>Ï>à>K>Õ>Ý>Ø>Û>ã>à>Ñ>×>×>>¤>Ý>×>Û>×>Û>×>£>Ù>Ý>ß>Ù>›>É>Ø>Í>Ü>Ï>Ø>Í>Í>×>Ñ>Ý>´>Õ>Ë>Ó>×>ß>Ø>Ý>Ï>À>Ø>Ý>‡>Ñ>Ï>É>Ù>Ø>Ý>»>Õ>Ý>Ô>Ý>Ü>×>Õ>à>Ñ>Ó>ƒ>Ï>Ó>Í>Õ>à>Û>Ø>Ó>Ù>Í> >Ù>Í>Ð>ß>Ù>à>ã>ã>×>ß>×>×>Ø>Ø>Ë>Û>Õ>Ó>Õ>Ñ>å>Û>Ø>Ù>Ü>ä>Ý>Û>á>Ý>Ý>Ù>Û>¨>Û>Õ>Ñ>ß>Õ>Õ>Ç>Û>Ç>Õ>ß>ß>Ý>Õ>Õ>Ø>Ø>Ù>Ù>Ý>Ý>Ù>Ü>ß>Ý>×>Ï>Ü>Õ>Ý>Ì>Ó>±>Í>Û>Ô>Ø>Í>×>Ð>à>Ù>ã>ë>µ>ß>Ý>Ù>×>«>Ù>Ü>Ø>á>Ù>©>×>Ì>Û>Ë>Ð>×>È>Ù>×>Ý>Õ>ß>Õ>Í>Ó>Ý>Í>Ù>à>Ù>Ý>Û>Ñ>¸>Ý>á>ß>Ñ>Õ>Ô>×>Ù>Ý>Í>‰>Ó>¦>À>ß>Ó>Û>Ù>Ù>Ø>Ù>ß>à>×>Ù>á>á>Ù>Ý>Ù>×>Û>à>Ø>Û>ß>Ü>Ù>Õ>Ø>Ý>Ø>Ç>Ý>Ð>Ñ>×>Á>Ý>Ó>é>×>Ù>Ó>×>Å>Ñ>à>Á>Û>­>¥>Ñ>Ø>Ü>Ó>ß>È>×>Ù>Ó>É>Ù>×>Ù>Õ>×>È>Ý>Õ>Ø>Ð>Ð>Ù>™>Ý>Ù>à>É>Ù>Ù>×>×>3>Ù>Û>Û>É>Ü>×>à>Û>Ë>×>à> >Ñ>Ý>Ø>×>á>Ì>Ý>Ð>É>Õ>à>Ù>Ý>Û>Ô>á>Ý>Û>à>Õ>É>Ù>×>×>Ü>Á>Ó>‡>ã>Ý>Ø>Õ>Õ>×>É>Ó>Ñ>Ô>ä>Û>Û>Õ>Í>Û>¸>ß>Í>Ø>ã>Ø>¼>à>×>Ù>Ù>Ü>ß>Å>Ó>ß>Ó>Ü>×>Ã>Ý>Ý>×>Ó>À>Ù>Ó>á>Ñ>×>Ó>ß>Ý>Ø>á>×>Í>×>Ð>Ø>×>Ù>Ó>Ù>Ù>Ô>Ð>Ù>Ø>×>à>Ý>ã>Û>Ø>à>×>×>Ù>Ý>Ù>ß>Ñ>á>Ñ>Ù>ß>Ñ>Ø>Ï>Õ>×>Ì>Ù>á>Ó>Ð>Õ>Ñ>×>Ù>Ý>Ø>É>Û>Ñ>Ý>á>É>å>Ï>×>Ó>×>Ø>ß>Õ>å>Õ>ç>×>×>½>×>È>Ù>Ø>Ü>á>Ù>×>×>Ù>ã>á>ß>Ü>Ÿ>Õ>Û>­>×>ß>Õ>É>Û>Ù>Ÿ>Õ>«=Ù>Ø>Ù>Ü>Õ>Ý>g>á>×>Ø>Ø>Ù>Û>Ô>Í>Û>×>Ù>Ý>Í>×>ß>ß>Ù>Ð>Õ>Ý>Ý>Ý>Ã>Ù>Ù>Ó>Ï>«>£>Ô>Í>Ø>Õ> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9aa211e876db87964b6a5d02f85fd13b2487b76a Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/2.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/20.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/20.0 new file mode 100644 index 0000000000000000000000000000000000000000..65681d42f8f01654c99e82edbc6e4598db77044e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/20.0 @@ -0,0 +1 @@ +Ù>Ø>á>Ù> >ã>å>ä>Ù>ä>Ë>è>ã>à>á>ß>Ý>ã>Ù>Ù>Ø>à>ä>Ï>Í>Õ>ã>£>à>£>ã>Û>×>ã>Ó>Ø>ß>Ü>Õ>ß>È>ç>Ñ>Ñ>ß>Å>Ù>Ñ>Ù>Ý>Ð>ã>É>ß>Ý>Ý>á>Í>ä>±>á>Ù>×>à>Ý>Ý>á>Ø>Ù>ã>Ù>á>á>Ï>Í>ã>Û>á>Ü>ç>Ï>Ù>«>Ý>à>á>ã>—>Û>à>á>Û>ß>Û>ç>á>á>ß>á>é>á>ß>³>‡>ã>à>à>ç>ã>á>á>Ý>Û>ç>Ù>ã>á>Ù>ß>ß>Ó>ß>ß>Ý>Ý>Ý>ß>à>ã>å>Ù>è>Ø>ñ=ß>Ð>Ü>ã>ß>à>Ë>Ù>å>Ë>Û>ä>«>Ù>á>ß>Ó>å>×>×>ã>à>ß>á>×>Ø>Á>Ý>Ì>Ó>Û>Å>Ç>ã>¹>ß>ß>ã>ç>Ý>Ã>3>ã>ã>á>Ù>¬>ß>ã>á>ß>ã>Ù>ß>à>å>Ì>á>ì>Ø>™>Ý>Ý>à>ß>¨>Ø>ã>Ù>à>Ý>Ñ>à>à>ã>Ø>ã>à>£>ç>Í>á>Ù>Ü>ß>ç>å>Ù>Ý>Ø>å>Ù>Ë>á>Û>Ý>×>á>å>×>ç>ã>à>Ý>Ñ>Ù>ß>Ý>ã>Ø>à>á>Û>×>Ý>ç>ë>Õ>á>Ù>À>Ý>Ý>ä>Ý>é>Ø>Ý>å>Û>Ý>ß>±>ã>à>Ø>á>á>á>ã>á>Ù>Õ>ß>ß>ç>ã>#>à>à>ß>Ý>ß>ç>ß>å>§=ÿ=Û>ã>Õ>Õ>Ù>å>µ>ä>Ù>—>è>Ý>á>Û>Õ>ã>Ì>á>×>å>Ó>ç>•>Ù>×>Û>Õ>ß>°>á>å>ß>á>Ã>à>Ø>ß>Ù>Ý>à>ä>á>Ý>ç>Å>ë>å>Ó>Ý>å>á>Õ>Ñ>ã>å>Ã>ä>Û>Ó>Ð>Ý>Ý>ã>Ô>á>ß>à>á>ã>à>ï>å>Ù>Ù>Ý>¢>Ý>à>Ý>Ð>Ý>1>ã>á>á>Û>Ï>Ù>ß>ß>ß>Ý>»>×>Ó>Ý>Ó>»>å>Ý>á>á>á>×>×>Ù>Ü>Ù>á>Ý>Ý>å>á>à>Õ>ã>ç>Ù>­>Ñ>Ý>ß>Ç>á>Ù>Û>å>»>á>á>Ø>å>Å>ä>à>ß>Ï>à>ß>É>à>Ý>Õ>ç>Ù>ç>å>á>å>Ý>Ñ>á>—>á>á>Ù>ß>á>Ø>á>á>à>Ï>á>Ü>×>Õ>Ý>á>ß>å>Û>à>ß>á>ß>×>à>¹>á>à>Õ>ß>ã>Û>Ù>Ý>Ù>ß>á>¯>È>á>Ù>ã>ß>Ý>é>Ó>Ð>á>Û>à>ß>Û>ß>Ý>å>à>Û>Ù>Ü>à>å>ã>á>Ý>¨>Ø>à>Ý>á>ß>á>ß>Ý>ä>Ã>ä>ã>Ù>ç>»>Ù>Ý>Ñ>Ù>«>ã>à>×>ß>×>Á>è>Õ>Ý>ß>Å>¬>ß>Ó>Ý>à>ß>Ù>á>Ù>À>Ý>Ù>Ù>Û>Ý>Ô>à>Ø>»>ç>Ÿ>å>Ù>Ù>Û>×>á>Ë>Ø>ß>ç>Ó>ã>ã>ã>å>ã>ß>à>Ý>È>á>Ð>è>ç>Ñ>à>ß>á>Ý>Õ>ã>Õ>á>à>Û>ß>±>Õ>Ñ>á>ã>å>Ø>ß>Ý>Ë>ß>à>ã>à>Ñ>Ë>ã>ã>á>Ý>ß>À>à>ß>×>Í>Ý>ã>Ç>ã>à>à>“>à>é>á>Ï>Ô>ß>Û>Õ>Ù>Ï>Û>à>¨>ã>å>á>ä>Ï>ã>×>Ó>à>è>ï>ã>Ù>Ý>Ý>Ý>ã>Ó>Ù>±>Ü>á>Õ>Á>ã>ç>ã>á>Ù>Ý>á>×>Ù>Å>å>ß>ß>è>L>á>å>á>å>½>Ý>™>å>à>ß>à>Ë>É>Ó>Ù>á>×>à>ã>Ù>à>ã>ç>Ù>ß>ß>&>ç>à>Ý>ã>à>Ä>Ý>ß>ß>Ù>×>Ý>×>ã>ç>y>·>ç>á>Ù>Ù>å>à>ã>à>à>å>å>ß>á>é>¡>Ý>Ü>Õ>Ù>×>à>å>ß>Ó>å>Ð>À>Ü>Ý>ß>à>×>Ü>á>ç>ä>Ñ>ß>Í>>Ù>ä>ã>Ü>Û>à>Û>ã>Õ>ç>á>á>è>á>¸>Ñ>à>á>Ä>á>á>#>Ý>Û>ß>á>Ý>à>×>á>ä>ç>á>Ô>á>á>á>ä>à>á>Ø>ë>å>×>Ñ>á>×>ã>ß>å>Û>à>ì>Û>ã>Ñ>ß>Ó>Ý>Í>ã>Ü>á>¸>¥>å>à>à>×>Ý>ã>Ý>á>Ý>Ý>Ý>á>Û>Û>ß>Ó>×>á>à>ã>ã>Ý>Û>Ï>Ý>Ø>ã>á>×>Û>Ø>ç>å>à>'>ß>à>Ý>Ù>ã>Û>l>ã>ä>Ø>Ù>à>å>á>ã>Ñ>ã>é>Ù>ß>Ë>á>å>ä>µ>á>á>ä>à>Ý>ç>Ó>É>à>Ù>Û>ä>á>È>å>Û>ã>á>Õ>›>9>Ù>à>á>ß>á>ã>å>“>ß>á>Ø>Ù>×>à>å>Ø>ß>Ù>è>á>Ø>à>á>Í>á>Í>Ù>Ó>à>Ð>Ñ>Ý>ß>ç>Û>Ô>à>ã>Ü>à>á>Ó>á>§>Û>Û>ß>à>Ï>Ë>Ù>Ý>à>Ó>Ó>á>à>Û>Ñ>Ó>å>Á>È>å>à>ç>›>Ý>ß>á>×>ç>×>Õ>Ø>¹>ã>Ó>Œ>ß>á>å>é>ß>ß>ç>«>à>Ô>Å>å>Ý>Ñ>ä>Ù>Ù>ã>à>á>á>Ñ>ç>Û>Ý>Ü>á>Ù>Ì>à>Ä>å>á>°>è>Ø>Û>ã>ä>ã>ã>Ô>Ý>Õ>Ø>ß>ã>>Ý>á>å>×>ß>ç>Ù>Û>Ñ>à>È>å>Ù>à>ã>ã>ç>á>á>>ß>Ø>å>ç>ç>Ô>á>å>ç>ã>Ý>Û>Ð>Ù>Ø>¥>ã>ç>Í>å>Ñ>à>ß>Ý>ß>ß>ç>l>á>×>ß>ä>­>á>ç>Û>ç>Ý>Õ>Ý>å>Ù>Ý>á>Á>Ý>Ø>à>Ø>•>á>Û>×>Ý>ß>ß>à>Ý>ç>Ý>Ï>Ø>¥>Ñ>è>Í>á>›>Ü>Ó>á>Å>å>¸>ß>Ù>ß>à>Ù>Û>Û>ë>è>à>å>ç>á>ã>Í>Å>Å>Ù>Ó>å>×>Ù>ç>Ý>ã>ã>à>ß>ó=¥>Ù>á>ä>Õ> >Ù>á>á>ã>½>à>å>ß>ß>ä>×>Õ>å>á>Ð>à>Û>á>å>Ñ>>á>à>Ý>ß>á>À>Û>á>à>á>ß>Ù>×>ß>×>á>à>×>Õ>Ù>Í>>×>å>Ð>ß>ë>è>à>Õ>ã>á>ß>Ñ>ß>ß>ß>Ý>Ý>Ç>á>à>á>¯>Û>ß>á>ß>ß>Ü>ä>á>Õ>×>á>å>Ù>Ý>×>á>Ý>Ø>á>Ý>ã>á>Ó>Ü>¼>à>×>à>Ñ>Û>ä>Ó>å>Ù>×>á>ß>Û>Ø>å>Ù>ß>ß>ã>ç>á>ã>ç>à>ã>ä>ã>Û>Ø>Ë>à>ç>å>É>Ý>×>å>¥>è>Ó=Å>å>á>Ø>Ù>å>Ý>Ý>á>ß>Û>à>ã>Û>á>Ï>ä>×>ä>ß>Õ>ã>á>Ñ>Ý>ã>à>ä>è>Û>Ü>Ë>Ý>Ù>ß>×>ç>Û>Û>L>×>Ý>ã>á>ã>á>á>ã>Ù>Ý>Ü>Ð>å>ã>Ù>ã>á>Ý>Ñ>à>Ý>ß>à>ç>ç>Õ>Ý>Ó>à>Û>É>Ð>Ý>à>Ù>Ð>Ø>á>Ã>ä>Û>á>à>Ý>Ù>u>à>Û>Û>á>ã>Ý>è>è>á>Ù>Õ>Ñ>ç>ž>Ý>à>Ý>ç>Ù>à>ß>Ù>Ý>ß>×>ß>ä>ß>Õ>á>à>á>Ý>ç>ã>á>c>Ø>Ë>á>Ð>à>Ù>à>à>å>Ó>Ù>Û>Ý>ß>Ø>É>Ð>Û>ß>ã>á>×>ß>ß>á>à>Ó>à>é>é>Ñ>ã>ß>á>ä>ã>Ñ>Û>á>Ý>É>Õ>Ø>Ù>Ù>Ù>Ù>Ó>Ã>µ>¥>Ý>Õ>à>¸>å>à>Ø>Ù>×>Ý>Ù>à>Õ>ç>Ï>Ý>ß>å>Ù>«>Ý>Ñ>ß>¿>Û>á>Ù>Ù>É>Ý>È>å>ß>ã>°>á>ß>é>ç>ç>ã>ã>Ã>ä>Ù>á>ç>Ù>ã>å>Ý>Ü>é>ß>à>Ý>å>ã>Ã>ß>á>Û>Ý>á>å>å>Û>Ø>ç>ß>á>Ü>Ë>ã>à>ç>ß>Ë>ß>Ý>Ý>ç>Ù>ã>ç>å>Û>Ù>Û>Õ>À>á>H>à>Ý>Ó>Ü>ß>ß>ß>ß>Ý>á>Ù>ã>ç>à>Ý>¨>Ã>ß>ß>Ý>ß>×>³>Õ>á>å>á>Ý>Á>Ñ>à>ç>Ù>¯>Ý>ã>Û>à>Ù>½>Ý>ç>Ý>ç>á>ß>ß>è>ß>Ø>ä>Ü>å>ß>Õ>à>ë>ß>Ï>Õ>ß>á>Ù>Ü>Õ>ç>Ñ>á>Ü>Á>Û>ß>á>È>à>Ù>Ó>Í>·>Ù>ä>à>à>×>ç>È>Ð>å>Õ>Ù>­>å>±>Ø>´>á>ç>Ý>ç>Û>Í>à>ß> >ã>à>×>Ë>Ý>á>ß>Í>Ü>ã>é>å>à>Ü>ä>ä>Ÿ>ß>á>ß>Ó>á>à>×>ß>×>È>ß>ã>ß>å>Û>Õ>á>Ù>ß>à>Ô>Ý>å>à>Õ>ß>×>Õ>á>à>¹>Ë>Ø>ß>Ý>à>×>×>á>Ü>å>Ý>Ý>Ø>0>à>å>á>Ø>à>Ý>Ï>Ý>Ù>À>Ý>Ù>É>ä>ß>Ý>Ý>ß>Ý>Ù>à>Û>Ý>å>°>ã>Ù>Ç>Õ>à>Í>Ý>ß>Ý>Ý>à>Ù>ã>à>á>ß>¯>Í>à>Ñ>ß>×>Û>Õ>Ù>à>ß>Û>Û>á>ã>é>ä>Ý>Û>ç>à>á>à>à>å>Û>Û>>ã>Ý>Û>à>Ë>Ý>Ù>à>á>ã>ã>Ð>á>à>>Ø>Ë>á>Õ>Ý>Ý>Ø>ç>Ý>à>Ý>ß>ß>à>Í>Û>´>Û>é>£>à>Ü>á>å>¹>Ó>Ó>ß>Ý>ç>•>Ù>á>Ý>ç>ã>Õ>Û>×>Õ>Ÿ>Ø>Ð>ß>á>Ý>á>á>Ð>Õ>Ø>ã>Ù>Y>á>á>á>Õ>ß>Ù>Ø>å>Ù>×>Û>å>Ù>Ý>ª>ã>á>Õ>å>Õ>Ù>Õ>×>á>Ï>à>Ð>á>Ù>©>Ù>À>¹>Û>à>è>Ù>»>Ù>ß>ß>ç>à>ä>Ý>ß>ã>Ø>ä>à>ç>à>à>å>ß>×>ä>Ý>á>Õ>á>Ý>¥>Ù>Ý>Û>à>è>Ù>á>ä>à>à>à>Ý>Ü>á>à>ç>É>Ý>Ô>á>Û>×>©>Ï>Ý>ß>ß>á>Ó>Ñ>ä>à>å>ß>á>Û>å>ä>×>Ù>å>˜>à>Ü>ç>Ø>ß>Ù>ß>ã>á>å>­>Û>×>Û>Ù>Ù>Ù>ã>À>Ü>Ý>Ù>ß>á>ã>™>Ø>Õ>Ý>Ù>>å>Õ>ß>Ù>§>Ý>Ý>á>ß>é>Ý>ä>á>à>Ù>ã>ß>Ø>Ó>ç>ß>ä>é>Ý>Ü>¸>Ù>Ù>ß>Ø>á>à>ß>Ø>}>í>å>Ù>í>å>Ý>Ù>á>Ý>Ý>à>Ý>«>à>Ø>Ý>à>¡>å>×>á>Õ>Ù>Ù>Û>Ë>Ü>à> >Ø>Ø>Ø>å>Ý>ß>á>Ù>Û>Ý>ß>ß>Ã>Û>Ï>×>Ë>ß>Š>ã>Õ>Õ>à>×>Í>à>à>ä>ç>ã>ç>Ý>ç>ã>Õ>Ð>Ø>Û>Ó>Ý>ã>ã>ß>á>ç>ä>D>á>ß>å>Ý>“>à>ß>Ð>ë>Ø>Ù>ç>ß>ã>ß>ç>ç>Ó>ß>Ñ>Ý>å>×>–>á>á>Ó>å>à>Ñ>á>Ý>Õ>é>Ý>ã>ß>á>ã>Ý>Ý>Û>ã>Ð>Û>å>Ý>Õ>Õ>ã>à>ç>Ù>á>×>Ä>Ù>ß>Ó>á>å>ã>ß>Û>Ù>é>›>«>¡>×>à>Ü>ç>ç>ß>ß>È>ã>Ý>Í>Û>ß>Ù>à>ß>ß>ç>å>Ø>Ø>Ç>Ý>é>Ý>ß>à>á>ã>Ó>á>á>Ý>Ç>å>µ>Ù>ß>á>ã>Ñ>å>à>Ù>á>Ù>è>à>á>ã>á>á>à>é>Ü>å>È>á>Ð>Ë>Ñ>ß>µ>×>ì>Ï>×>±>à>ä>Ü>ß>Í>Ü>à>p>à>Ì>×>U>Ü>à>ã>ã>ç>ß>ã>à>Õ>ã>à>ã>ç>Ù>ß>å>é>¨>Ï>Ì>à>Ý>Ü>á>Ï>á>á>é>á>Ë>Û>à>Ù>Ù>˜>ã>à>È=ß>Ý>Ó>Ù>ß>Ý>Ù>Ð>ã>å>ß>á>ß>ß>á>Ø>á>Ï>á>Û>á>á>å>á>Û>Ý>w>Ý>ß>Ë>¸>×>Ù>ç>Ý>Ù>ß>á>ß>á>ß>ß>’>×>ã>×>ß>Ø>×=Ù>ã>á>á>ã>ã>Ý>ß>à>ß>ã>à>à>ë>à>Õ>á>Ø>å>ß>á>Ð>ã>Ý>á>Ù>Û>á>ã>½>Ý>ä>Ø>á>ß>á>´>Ý>Ù>ß>ä>Ý>á>á>à>Ý>Ý>å>Û>Ù>ç>Ý>Ã>Ù>á>Ý>à>Ù>à>á>Û>á>à>á>á>¯>Ù>Ü>á>Ù>À>å>Ý>Õ>á>ß>Ý>á>ß>Õ>ã>Ó>Ü>Û>Û>ã>Ð>ç>Á>Õ>Ù>Ù>ã>Ý>á>Ñ>ç>á>Û>Ë>Ü>ã>á>£>Ù>Ï>Û>ß>°>Ù>Ù>Ý>Í>ß>Ý>Ù>Ø>á>å>ß>Ñ>ä>à>á>à>×>Ü>Ù>à>Í>ã>á>E>Ã>è>á>à>à>é>à>Å>á>Ù>×>Ù>Ý>à>ç>Û>ß>Ø>á>Ó>›>Û>á>à>Ý>Á>ß>ß>à>Û>Û>à>Ü>å>ä>Ø>ã>ç>Ù>á>à>ã>4>Ø>ã>à>ã>Ô>Ñ>Û>Û>à>ß>à>á>ã>Í>Ý>à>é>à>å>ã>Û>á>à>Ï>á>Û>Ý>Ó>Ø>ß>×>‘>À>á>ã>å>×>Ý>ç>Ý>Ý>ä>Ý>Û>ß>é>Ý>Ù>×>Ý>µ>¥>´>ß>á>á>å>È>à>°>Ü>à>ç>Û>á>Ý>¡>Ù>é>ã>à>Û>Ó>á>×>à>Õ>ß>Ý>Ù>ß>ß>å>å>ï>Ü>Ð>Ý>à>©>ã>Ý>Ù>ß>à>ß>à>á>ç>Ñ>‹>á>ß>å>ß>ç>Å>Ý>Ý>Û>Ç>Ó>à>Ù>à>ã>Û>`>»>×>á>á>Û>ã>á>Ù>ç>ç>ã>Ý>Ù>¡>ß>á>Ñ>ã>×>à>å>Û>ã>å>É>Ñ>ß>§>Ý>ä>ç>ä>Ó>á>ä>á>ß>à>ã>à>Ù>×>á>å>ä>ü=ß>Í>¬>ã>á>Û>Ó>ã>ã>å>á>å>ã>ç>×>à>ç>ß>ä>ç>á>á>Ó>á>Ø>Ý>á>%>Ù>Ó>ã>Ù>Ù>•>µ>ß>á>Ý>Ñ>Ü>Û>Ã>è>é>Û>Ý>à>Ý>é>Ø>è>Ý>ç>å>á>×>Ù>Ó>Ù>Ý>ß>Ý>á>á>ã>ª>ä>ã>ß>Ý>à>K>Ù>ß>å>Ù>×>Ð>ã>Ù>ß>Ó>¹>à>ç>Ý>Ý>à>ß>°>à>Ø>Ù>°>Ý>ß>ä>á>Ù>Ý>à>ä>à>È>½>à>ã>×>á>á>Í>ß>Ý>ã>ã>à>à>ß>Õ>Ý>³>å>à>à>Û>×>ß>Ù>ã>µ>Ï>Ÿ>Ý>Ý>Ø>Ø>ß>Ó>à>Ü>Û>ç>Û>Ý>á>ã>³>à>Ó>É>à>Ý>ß>Ù>×>å>Ü>Ý>Ã>Ý>Ó>Ñ>Ø>×>ç>à>Ü>Ý>å>ç>Ý>à>Ù>á>à>Û>á>á>Õ>ß>×>å>Ñ>á>Ý>Ó>ß>Û>Ù>á>Û>Ý>Û>à>Ý>«>Ñ>á>ã>×>ß>à>á>ß>ã>Á>á>Ü>á>à>á>á>Ñ>ã>Ý>Ý>Ó>ß>×>å>à>Ñ>×>Ý>ß>ß>Û>á>Ñ>á>å>à>á>Ü>Û>ã>á>Ü>å>ë=Ø>Õ>à>¿>à>å>á>ã>á>É>>à>ç>×>á>ß>Ÿ>ß>³>Ý>ç>Ý>Ý>Û>å>á>Ï>£>ä>ß>é>á>à>Ù>Ý>ß>»>¿>ß>Û>•>×>ß>ß>ç=’>ß>Ó>à>Ù>Ý>à>ß>á>Ý>Ü>Ä>ç>à>>Õ>Õ>É>Ù>í>Ù>å>ã>ß>Ý>ç>à>Ý>Ï>Ù>m>Õ>è>ã>Û>Ü>à>Ã>à>×>ß>ã>à>ä>Ç>Ý>Ó>Ù>Ø>ç>Ù>å>ß>Ù>Ý>å>×>Ý>Õ>ß>Ù>Ð>Ü>Ý>ß>Õ>å>Ý>Ø>Ó>í>½>Ù>Ü>Û>ë>×>Ù>Ã>à>Ý>á>Ý>ä>Ù>Ì>Ù>á>Û>Û>á>à>/>Ø>à>ã>Û>Á>Ý>à>å>é>Û>ß>Ý>ã>á>Õ>å>ã>Ñ>Ø>á>ã>Û>ß>Õ>ç>»>×>ß>Ì>Õ>á>Ù>Ù>è>Ø>á>à>Ù>ã>á>á>ã>ç>ß>Ü>Ð>ß>Ý>Ø>Ù>á>À>à>Õ>Ù>ß>á>Ù>à>ä>Å>Û>Ó>å>à>á>ä>à>Ù>Û>á>±>Ý>Ó>Ø>á>ß>Ü>Ý>Í>á>Û>á>ß>Ù>Ý>Û>ß>ß>ß>×>ß>å>Õ>á>á>Ð>ã>ß>ß>™>à>Ù>Û>à>½>ç>á>ä>ä>ç>Ø>ž>è>å>±>Û>¸>á>á>Ù>á>à>Ø>Ù>×>£>Ñ>Ã>Ó>ß>Ó>à>ß>Û>ä>Û>×>à>ß>É>á>Ù>Ð>Õ>ç>ß>Û>ß>é>Ù>á>à>Ã>Û>á>å>Ü>Ë>¸>)>ã>Û>µ>ß>ã>×>á>Ù>å>Ý>Ø>Ý>á>à>à>à>Ý>à>ß>ç>ã>Ë>á>ã>ä>Ý>Õ>å>ç>¢>á>á>Û>í>ý=à>è>Ý>Ù>å>á>ã>ã>Ù>Ý>Ð>Ù>Ý>ã>Õ>á>×>ä>å>ß>ã>ç>Ù>à>Ç>á>Ý>Ô>ß>å>Í>ã>Û>á>Ý>Ü>ã>È>ã>Ù>á>Ë>ì>ä>ç>Ý>á>×>Õ>Í>Ø>Ë>ç>Ü>å>á>à>Ý>Ý>Ì>³>Ý>ç>á>à>à>à>Ý>Ý>Ù>á>×>Ü>à>Ý>Ä>ß>Ù>Û>ß>Ï>à>á>×>È>à>à>Û>á>Ý>à>ä>Ë>à>Ÿ>ß>É>ß>á>á>à>ç>Ý>á>¨>å>Ý>Ý>ß>È>à>Ý>à>å>Ý>×>ã>è>ç>à>á>ç>Ñ>ß>ã>à>Ý>×>á>Ø>Ý>×>ç>Û>Ù>Ó>ã>á>á>Ü>Û>ç>ß>Ý>à>å>à>ã>ç>ß>ß>å>Ý>Õ>ß>à>Û>Ó>á>á>Ù>ß>å>Ø>ã>Ù>½>Ý>á>Ý>Û>á>Ø>ã>ß>ã>å>å>à>á>Ñ>>Ý>á>Ý>á>à>á>á>ß>á>à>ß>Ý>á>ä>à>ß>à>Û>å>ß>à>ã>Ø>ç>è>Ø>£>»>Ø>å>ß>à>Ø>Ù>Ù>ß>ß>á>Û>ƒ>ä>ß>½>Ù>á>ß>×>×>ß>Ù>è>ç>à>á>Ý>Ý>à>Ó>Ø>¡>ç>ß>Ù>ß>Ý>Ø>Ð>é=Ù>Ý>Ý>Ø>Ó>³>à>Ù>à>ç>Ù>Ó>ã>ã>ç>ç>Û>ä>á>á>Ø>Ó>à>ç>½>ß>å>Ø>å>½>á>á>á>ß>Û>å>¥>ã>à>ä>á>×>Ý>á>Ü>×>Û>å>à>Ø>Ù>á>ß>ß>Ý>Ý>Ý>Û>à>à>á>ç>ä>×>ã>Õ>×>å>U>Û>ã>á>ä>é>á>Û>Ý>ß>¥>¨>ã>à>à>à>à>à>¨>ã>å>á>à>>Ð>ß>Ø>å>Ø>Ù>Õ>Õ>Û>Ù>å>»>Ù>Ð>Ý>Ù>ã>Ý>à>Õ>Ç>ß>á>‹>Ø>×>Ñ>à>ß>ã>½>Ý>å>Û>å>å>ß>à>ç>Ù>Ù>…>Ó>Ü>×>Ý>ì>å>á>Û>Ý>Õ>¥>Ý>×>×>á>ß>ç>è>å>Ü>á>Ý>ß>Ý>ß>Ó>á>Ý>Ý>Û>Ø>é>á>á>ä>ã>è>å>å>ç>á>è>à>ã>ª>ã>Û>Ù>å>ß>Ø>Í>ã>Ï>Ù>à>á>à>Û>Û>ß>ß>ã>ã>ã>á>ã>Ý>ç>ã>Ý>Ð>á>Ù>à>Õ>Ø>·>Ó>Ý>Ô>á>Õ>à>Ø>ç>á>ã>ì>½>á>å>å>Ü>¯>Ü>à>Ý>å>ã>­>à>Ð>á>Ñ>Ù>Ý>Ó>à>ß>ß>à>ã>Ý>Õ>Û>à>Ô>ß>å>ß>á>à>Ø>»>å>á>ç>×>Ý>ß>Ý>à>á>Õ>Ž>Ù>¤>Ç>ã>Ù>ã>á>Ý>ß>á>å>ç>ß>à>å>ç>ß>á>Ý>Ù>å>ç>à>à>ç>á>ã>Û>ß>ç>Ý>Ñ>å>×>Ù>à>È>á>Ø>í>Ý>Ý>Ù>Ý>Ï>Ø>ã>È>ç>µ>¤>Õ>ã>á>Ý>ä>Ï>á>à>Ý>Ó>Ý>Ý>á>Ý>Ý>Í>ç>Ø>ß>Ø>×>Ý>¡>á>ã>å>Ð>Ü>á>à>Ü>5>á>á>ß>Ô>ç>à>å>ä>Ó>à>è>>Û>å>Ü>Û>é>Ó>á>Ù>Ð>Ý>ç>á>à>å>Ù>ë>à>á>å>Ý>Ñ>á>Ý>Ü>á>Ë>Ý>>ç>ã>á>Û>Ø>à>È>Û>Û>Ù>å>ß>á>Û>×>Û>½>ã>Ð>ß>ç>à>À>ç>à>à>à>á>á>Ð>Û>ã>Ü>á>ß>É>å>á>ß>Ù>É>á>Ù>é>Ý>Ù>Õ>å>Ý>Ý>å>à>Ó>Û>Ù>å>á>á>Ø>à>à>Ù>Ø>à>ß>Ü>ä>à>å>ç>á>ä>Ý>ã>á>ã>ß>å>Õ>è>×>á>ç>Ù>ß>Õ>Ý>à>Ñ>à>å>Ù>×>ß>Ù>Ù>à>à>Ý>Ð>Ü>Ù>ã>ä>Ë>ç>Ó>Ü>Ù>à>Ü>é>Ý>ç>ß>é>ß>á>Ä>à>Ñ>á>Û>ß>é>à>Ù>ß>Ý>é>è>å>á>§>Ý>ã>±>ß>å>Ù>Ï>á>ß>¡>ß>d=Û>Û>à>ß>Ù>ç>a>ç>ã>Ü>Ý>ß>à>Ü>Ø>á>ß>ß>á>Ì>Ý>å>ç>á>×>Ù>á>ß>á>Í>ß>ß>×>Ø>°>§>Ù>Õ>à>à> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/21.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/21.0 new file mode 100644 index 0000000000000000000000000000000000000000..9ecf0aecd5375a7687bc030d5a777131d23cd380 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/21.0 @@ -0,0 +1 @@ +ã>ã>ç>ã>§>è>é>ï>á>í>Ô>ð>é>é>ë>á>ç>ë>ç>à>ã>ç>ï>Ù>Ó>Ù>é>©>é>­>é>ã>Ý>ç>Û>ä>è>ç>ß>ç>Ð>é>Ù>Ý>è>Ñ>å>à>å>ä>Ù>é>Ó>ì>ç>ã>í>Ù>ï>°>ë>ã>å>ç>å>ë>é>á>Ý>í>ä>í>ë>Ù>Ù>é>ã>é>á>í>Ó>á>µ>á>å>é>ë>£>é>è>ã>å>ç>ã>é>è>ë>ç>ë>í>ï>é>¹>>í>ì>é>ë>í>ç>ë>ç>ã>é>ç>ë>ð>å>ç>è>Ø>ç>ç>ç>è>å>é>è>í>í>è>ë>á>÷=ç>Õ>ã>å>é>ç>Õ>ã>é>×>á>è>³>ã>é>è>Ø>é>à>à>ð>é>é>ç>Ü>ã>È>å>Ø>Ý>ã>Ð>Ð>é>Á>è>á>é>ð>å>È>G>ë>é>ç>á>¹>è>ë>ç>á>ç>è>å>è>í>Ó>ë>ñ>á>ª>è>ç>ì>ç>°>à>í>á>í>ç>Ù>é>ç>ë>Ý>è>í> >ð>Ø>ç>á>ã>é>ì>í>á>é>à>í>ç>×>ï>ç>ç>Ù>è>é>ã>í>è>ç>ç>Ù>á>è>å>ï>á>é>í>å>ã>à>í>ô>Ý>é>ç>Å>ä>ä>í>å>í>ã>è>ë>Ý>á>ç>¹>é>ç>à>è>è>é>ì>ë>ã>á>ã>é>í>è>#>ç>í>é>ç>é>ñ>ã>ë>¼= >å>è>à>ß>á>é>½>ç>à>Ÿ>ð>ã>í>ã>Û>é>Õ>í>ã>ë>Ý>ñ>›>á>ß>ß>ß>ì>¹>è>è>ã>é>Ã>ì>ã>ã>à>è>ç>å>å>ã>í>É>ñ>è>Ý>ç>é>í>à>Û>í>ë>È>è>ã>Ù>×>ç>à>í>Ý>ë>ã>é>è>å>è>ø>ë>ä>à>è>«>à>é>å>Ü>ã>(>ï>è>ë>ã>Ù>á>ã>è>á>é>Å>ã>á>ç>à>Ç>é>á>é>å>è>á>ß>á>Ý>Ý>é>ç>ã>é>é>ë>Û>é>ë>á>¹>Ø>å>ç>Í>è>å>ã>í>Ç>è>è>ä>é>Å>ë>é>ç>Ø>ë>è>Ó>é>ç>ß>í>à>ë>é>ç>ë>è>×>è>¡>è>é>á>é>ì>ã>ë>ë>ç>Ù>ë>ß>ä>ß>å>é>ç>ï>ã>è>è>ï>ã>ã>è>Ã>ã>è>Ý>ç>é>ã>å>á>å>ã>é>±>Ð>è>å>í>è>å>ï>Û>Ø>é>ç>ç>è>å>é>ã>é>é>å>á>à>ð>é>é>è>ë>³>á>é>ã>é>é>è>ë>å>è>Ð>ë>è>ã>ë>À>å>ã>Ù>ß>³>é>è>à>è>Û>Å>é>á>å>å>Ç>¸>ä>Ý>å>í>ã>à>é>å>Ç>å>Û>á>å>å>Ü>é>Ý>Ã>é>§>ï>à>á>å>à>ë>È>Ü>è>ë>Û>ð>é>è>é>é>è>ç>å>Ð>è>Ø>í>í>Ý>é>ã>é>ç>ß>ð>á>ç>è>á>ç>·>Ý>Ø>ç>è>ð>ã>ä>ç>Ó>ã>å>ç>ç>ß>Õ>ë>í>é>ç>ç>Ë>ã>ç>á>Õ>å>í>Ì>í>ç>é>™>ã>í>ë>Ù>ß>è>á>Ý>å>Ø>å>ç>°>í>í>ë>è>×>è>á>Ü>é>ï>ô>ë>á>ã>å>ç>ï>Û>á>»>ã>ç>ß>À>é>í>ï>á>å>ã>è>á>è>Ð>ð>è>é>í>]>è>è>é>ñ>Ä>è>£>í>í>ã>è>Ñ>Ó>Û>Û>è>Ü>ç>å>à>ç>í>ï>à>é>ç>*>è>ë>ã>ë>é>Ë>å>ë>é>á>á>ã>Ý>è>ë>>½>ï>è>ä>ã>í>ç>é>é>ç>ð>é>å>ì>é>¤>ã>à>Ü>ã>ß>í>í>á>Ù>ï>×>Ë>ã>ç>ç>é>à>á>é>à>ï>Õ>ç>Ó>›>á>é>è>ã>ã>ç>á>é>ã>í>ë>è>é>é>Á>Ù>á>ë>Ð>ã>ç>/>ã>ã>ã>é>ç>å>ß>é>è>è>ç>Ý>è>å>ë>ë>å>é>à>ð>í>ß>Ù>é>Û>ë>ç>é>ç>é>ó>å>ï>Ü>è>Û>å>Ø>é>å>í>Á>±>ç>é>ç>ß>ç>è>ç>è>è>é>å>é>ç>á>ç>Û>ß>é>ç>ë>å>à>é>×>é>à>ë>å>ã>ç>ä>í>ï>ç>/>ç>ã>ç>ã>è>ç>‚>ç>ë>á>á>ç>è>è>ë>×>ë>ï>à>è>Ó>è>í>ë>·>ë>å>ë>ç>å>í>Ü>Õ>è>ç>à>í>é>Ð>è>ë>ë>ç>ß>§>K>å>å>ë>ç>è>ì>ð>™>ã>ë>á>à>à>é>ë>ã>è>ã>ë>ë>ä>è>í>Ù>ð>Õ>á>Ý>è>Ø>Ù>ã>à>ï>å>Û>í>ì>à>é>é>Û>é>³>á>è>ç>é>Ø>Ø>ã>å>å>ß>Ù>è>ë>å>Ø>Û>ð>Í>Ñ>è>ç>í>¢>è>ç>é>à>ë>á>Ý>à>Á>é>Ø>’>è>ë>ì>í>ä>è>ë>³>è>Û>Ï>ï>ä>Ý>é>á>å>é>è>ë>ì>×>ï>à>ç>å>í>ß>Ø>é>Ð>é>é>¹>ì>á>ã>í>ì>è>é>à>ç>Ý>á>è>ð>>è>é>í>ã>é>è>å>á>Ü>è>Ð>é>å>é>é>é>ñ>ç>ç>>ë>å>í>ï>ï>ß>ç>ì>è>è>å>å>Ù>ã>ç>­>é>ì>Ó>ï>Ý>è>ã>ç>å>å>ë>l>é>á>ç>ï>µ>é>é>ã>é>ç>à>å>ë>á>é>è>Í>ç>á>ë>ä>Ÿ>é>è>á>å>ç>å>í>å>í>ç>Ù>à>«>Ø>ñ>Ù>ï>>è>Ü>ç>Ì>ë>À>å>ã>è>ã>ã>è>ã>ð>ï>é>ë>é>í>ï>Ù>Ï>Í>à>×>è>ã>å>ï>é>è>ë>ë>ç>ÿ=·>à>è>è>à>Ÿ>ç>é>ç>è>È>ç>ë>å>ã>è>å>ã>ï>è>Ø>á>ç>ã>é>Ø>$>é>è>ç>å>å>Í>ç>ç>ç>é>ã>á>à>ã>ß>è>å>Û>à>è>Ù>>á>ï>×>å>ï>í>ë>á>ç>è>ã>Ù>é>ç>é>á>è>Ð>é>ç>é>¹>ß>å>é>ç>ç>å>é>è>Ü>à>é>ë>ä>å>á>é>ã>ã>é>á>è>è>Ù>ç>Å>è>à>ë>Ù>ã>é>ß>í>á>à>ë>è>å>à>í>á>è>ã>é>í>è>è>í>ç>ð>ã>é>á>ã>Ð>ã>ë>é>Ó>ç>á>ï>¬>ð>Ë=Ñ>í>è>ß>à>ð>ä>å>ë>ã>á>å>ë>ä>ç>Ô>ì>ß>é>å>à>é>è>ß>ã>ë>é>é>í>à>á>×>å>à>å>ã>é>á>å>L>Ý>å>í>è>è>é>é>é>ß>è>ã>×>ï>é>ã>ë>é>ç>Ù>é>ç>ç>ã>ì>í>Û>é>á>ç>è>Ï>Ù>ç>ç>á>Ù>å>ë>É>í>å>é>è>å>ã>m>å>à>á>ç>í>ð>í>ð>ë>ß>Ý>Ý>í>«>á>ë>ç>é>å>è>ä>á>ç>ç>à>ç>ë>ç>à>å>ä>é>å>ï>é>é>l>á>Õ>è>Ø>å>á>é>ç>ë>Ý>ã>é>å>á>ã>Ð>Ý>å>ë>å>ì>ß>ì>å>ç>ë>ß>è>í>í>Ù>í>ç>ã>å>í>Ø>é>è>å>Í>Ø>à>á>ã>á>ã>á>Ë>À>­>é>Ý>è>¿>é>å>ã>ã>Ý>å>à>ç>à>é>Ø>å>ç>í>ã>·>à>Ù>ç>È>á>í>ç>à>Í>ä>Ñ>í>ç>í>³>é>è>ï>ë>ð>è>í>Ì>ë>ã>å>ï>ã>ç>ë>ç>è>ð>ä>è>ã>ç>é>Ï>è>é>ã>è>è>é>ë>å>Ý>ð>è>è>ã>Õ>é>å>í>ç>Ó>å>á>ç>ì>à>è>ð>ë>à>Ý>à>Ý>Í>é>P>ç>ç>Ý>ä>è>ç>è>è>ç>é>ç>é>ð>ç>è>¯>Ï>é>ë>ç>ç>ã>·>á>é>è>ë>ã>Í>×>é>ë>ä>·>í>ë>á>å>á>Ç>ã>í>á>ð>ë>ã>ç>ï>ã>á>é>ã>ë>ç>à>è>ó>ã>Õ>ç>ç>é>ä>á>Ý>é>Ø>ä>è>Í>á>é>ì>Ñ>ç>á>Õ>Ø>»>ã>ë>å>é>á>í>Ñ>Ü>é>á>à>¸>é>³>à>Á>é>ï>ã>ë>á>Ù>ë>è>¥>ì>ì>à>×>è>é>å>Ó>ã>é>ï>é>å>í>è>í>¥>ã>é>å>Ü>é>é>ß>è>Ý>Ô>å>é>é>é>å>Ý>ï>ã>å>é>Ý>ã>ë>è>Û>ç>ß>à>è>è>Ã>×>à>ç>å>è>Û>Ý>é>ã>ë>ã>ã>ã>0>è>è>ë>à>ã>ç>Ø>ã>å>Ã>è>á>Õ>é>é>á>ã>è>ç>ç>è>á>ã>í>»>é>á>Ó>à>é>Ù>å>ã>ä>å>é>ç>å>ç>é>è>±>Ø>é>Ø>í>ß>ã>ß>ç>å>è>á>ã>å>ç>í>ë>é>ã>é>å>å>í>ä>é>é>à>…>é>å>à>é>Ð>å>ã>ç>ç>é>é>×>å>ì>>ß>Ó>è>Ù>ë>å>á>ë>è>è>å>ç>è>ã>Õ>å>¹>ç>ó>­>à>ã>è>ë>Á>à>Ø>ç>ã>é>—>á>ë>å>ë>ç>Û>à>á>Ý>¬>Ý>Ø>å>ç>ç>è>å>Ø>Û>å>í>ã>Y>é>ç>ç>Ý>å>à>ä>ë>ä>à>å>é>ç>ã>¸>é>é>à>ð>Û>å>Ý>ß>é>Ø>é>×>è>é>°>å>Ã>À>á>è>ë>ß>Ã>á>ç>ç>í>é>ë>ç>ç>é>à>ï>é>ð>ä>è>í>é>Û>é>ã>è>Ù>ç>å>±>ã>è>å>é>é>á>é>é>é>é>ë>ç>ã>ì>ã>ë>Ñ>å>Ð>ç>å>ß>¬>×>å>ã>è>é>Ý>Û>é>ç>é>å>é>è>ï>ë>Ý>á>ì>¥>ã>è>í>á>å>å>å>é>å>í>°>à>ß>ã>á>á>ã>ë>Ë>ã>è>á>é>ì>é>¥>å>ß>ä>å>£>í>ß>å>à>±>å>ç>é>ç>í>å>é>ë>ë>à>í>è>ã>ß>ï>ë>é>í>é>á>À>á>á>è>á>å>ç>ã>á>ƒ>ñ>í>ã>÷>é>ã>á>é>é>ã>é>ä>°>ç>á>ç>å>­>é>ß>è>à>á>ã>à>Ô>ç>è>«>ß>á>à>ì>ä>å>ã>ã>å>å>à>ã>Ä>ã>Û>á>Ù>é>‹>ï>Û>ß>é>Û>Ó>å>é>é>í>ë>ë>å>ì>é>à>Û>à>ã>Û>ã>ð>è>è>é>í>é>P>é>è>í>ç>>ç>é>Ù>ó>à>å>ô>é>è>ç>ï>é>Ü>è>Ý>é>é>Ý>š>é>é>Ü>ð>è>Ø>è>ã>ß>ë>ç>é>ç>í>í>å>è>á>í>Õ>á>í>å>Û>Û>è>ç>ï>ç>é>ã>Ë>á>å>Ý>ë>ï>ç>è>ä>à>ñ> >³>µ>à>è>ã>ñ>ï>ã>å>Í>ï>ã>Ó>ã>ã>ß>ç>ç>é>í>í>à>á>Ñ>è>ù>ç>å>ë>é>ë>Ý>ë>ã>å>Ë>è>½>á>è>è>é>Û>é>ç>ß>è>à>ï>å>ç>é>é>è>é>ï>è>í>Ð>ç>Ý>Õ>Ý>ã>¿>Û>í>Ù>Ý>¸>ã>å>ç>ç>Ø>á>ã>>é>Ó>Ü>W>ç>ç>é>í>í>ì>è>ã>Ý>é>é>è>í>ß>ë>é>í>¯>Ó>Ñ>ç>å>ç>ç>Ù>í>ë>ñ>é>Ó>ß>ë>ã>à>­>è>ã>·=á>å>à>ã>é>ã>å>Ø>ï>í>ç>è>å>è>ç>ã>í>Õ>è>á>ë>ð>ë>ç>ã>ã>‡>å>ä>Ù>À>à>á>ñ>å>ã>è>å>ç>è>ç>ç>™>ß>è>ß>å>ß>>ç>ë>è>è>é>ë>å>ç>ç>é>ç>é>é>ñ>è>à>é>á>ë>é>ç>Ý>ì>å>ç>ã>ç>å>è>È>å>è>à>é>è>é>¹>å>å>å>ï>å>è>é>ç>ã>ç>è>ç>á>í>ç>Ì>ã>ë>å>é>á>ç>é>ç>è>ç>ë>é>µ>á>ç>ç>ç>Í>í>ä>ß>ë>í>å>å>ç>Ý>ë>ß>ã>ã>ã>ç>×>í>Ë>Û>à>ç>ì>ã>ç>×>ï>é>å>Ñ>á>ë>í>­>á>Ù>á>è>±>à>å>é>Ø>ã>å>á>à>ë>ë>è>Ù>í>ë>ë>é>Ý>á>à>ä>Ð>ë>ç>=>È>ï>ë>ç>è>é>ç>Ï>é>á>á>à>é>é>é>ã>å>ã>è>ß>Ÿ>á>é>è>ç>É>å>é>ç>å>å>å>à>í>ä>à>é>ï>ã>ë>ë>è>3>á>ç>ç>é>Ý>Ø>ç>å>í>å>è>ç>ë>Ø>ç>ë>í>å>é>è>å>ë>é>Ý>ç>å>é>Ù>ß>í>à>–>É>é>é>è>á>å>ë>å>ã>í>é>å>è>ñ>é>ã>Û>ç>À>¯>»>å>é>è>ë>Ó>è>¹>à>è>í>å>é>ã>­>ç>ð>ì>ç>å>ß>è>Ü>é>Ø>å>é>á>é>ç>è>ë>í>ã>Ø>á>å>±>ë>é>ã>å>ì>å>ç>é>í>Û>>ì>ç>í>ç>é>Ì>á>å>ã>Ð>Ù>ã>ã>ç>ï>ã>g>Å>Ý>í>í>å>ï>å>á>ð>é>í>ä>á>§>á>í>Ù>é>á>è>ë>ã>ï>è>Ð>Ý>í>­>ã>é>ï>é>ß>ç>ë>ç>å>é>é>é>à>ß>ç>é>é>ë=è>×>µ>è>ë>ß>Ý>ï>è>ë>ë>ç>ð>ë>á>ä>ì>é>ç>ì>é>é>ß>ç>à>ç>é>>ç>Û>ç>å>å>ž>À>å>í>è>×>ã>á>Ë>é>ð>å>ç>è>å>é>×>í>å>ë>ð>è>Ù>á>Û>ã>å>å>ç>ç>ç>é>¬>é>è>ç>è>ì>\>á>ç>ï>ã>Ý>à>é>ã>å>Ý>Ä>ç>í>á>é>é>ã>µ>é>à>ß>³>ç>ë>ç>ë>ã>å>é>í>é>Ñ>Ç>ç>í>à>é>é>Ø>é>è>é>é>å>ã>ã>à>ã>¼>í>é>ç>é>á>é>à>é>¼>Ù>>ã>å>ß>ã>ç>Ù>ç>å>å>ï>ä>ã>í>è>¸>é>ã>Ï>ç>ç>ç>ã>ß>é>è>é>È>ã>Ý>Ø>ã>Ý>é>ì>å>å>ç>ë>ç>ë>å>é>ï>å>ç>é>à>ã>à>ë>Ø>ì>å>Û>å>ç>à>ç>ç>è>å>è>ã>­>Û>ë>é>á>ç>é>é>ë>é>Å>ì>è>è>å>ë>é>Ù>è>é>è>Ù>é>ã>í>ç>×>ß>å>è>å>ß>é>Û>é>è>é>ë>á>ç>é>è>á>é>û=á>ß>é>Ì>é>é>í>é>ç>Õ>>ç>è>á>é>ç>§>é>½>é>í>ç>ç>å>è>ë>Ù>­>ë>å>ï>ë>è>á>å>é>Á>É>è>å>>á>ì>è>Ü=•>ã>Û>å>ä>é>ã>è>é>ç>ç>Ð>ñ>ä>>Û>Ý>Õ>à>ñ>á>ë>é>é>ç>ð>í>ç>Ù>ã>k>Ü>ë>é>á>ã>é>Í>ë>ß>é>í>ç>é>Ð>à>Û>à>ã>é>å>ë>ã>å>à>é>à>ç>Ý>è>à>Ø>å>ã>è>ß>í>ç>à>ß>ð>Ç>á>å>å>ë>à>ã>Í>ç>å>é>è>ï>à>Ø>á>å>ç>ã>é>ç>'>à>ç>é>ã>Ë>å>é>ë>ñ>ã>ç>á>é>é>Ý>ë>ë>Ù>à>é>é>Ø>å>à>ñ>¿>Û>é>Õ>Ý>ä>å>á>í>à>ç>å>á>é>ë>é>è>ï>ç>ã>×>ç>ç>Ý>ã>é>É>è>ß>å>é>ç>ã>é>ï>Ð>å>Û>é>é>é>è>å>ç>ã>é>µ>ç>à>ã>é>é>ç>è>Ù>ç>ä>ç>è>ä>ç>á>å>è>å>ß>å>í>Ý>í>é>Ô>é>ã>ç>£>è>ã>ä>ç>É>ç>ç>é>é>é>á>¢>ñ>ï>¸>ç>Å>è>í>Û>é>ç>à>á>ç>¦>à>Í>à>å>Û>è>ã>å>é>ä>à>à>é>Ð>ë>ã>×>à>é>é>ã>ç>ð>á>è>ï>Í>å>í>é>ç>×>½>->í>ã>½>ç>í>à>è>á>é>ç>à>å>é>ç>ã>è>å>ç>ç>ë>è>Ô>ë>è>ç>ã>Ù>é>é>­>é>ë>á>ó>>ç>ñ>è>á>é>å>é>ï>å>ã>×>ã>é>í>ß>é>à>ç>ë>é>ë>ë>ã>è>Ð>ë>è>Ý>ã>é>Ð>é>à>ì>å>ã>ë>Ï>é>á>ð>Õ>ð>ë>ï>á>é>ç>Ù>Ó>ã>Ñ>ï>è>é>ç>å>ç>á>Ø>½>á>ï>å>ë>è>å>è>ç>å>è>ß>à>ç>è>Ë>è>à>å>ã>Õ>é>í>ß>Ó>ç>ç>ß>è>ç>é>í>Ó>é>ª>å>Ñ>å>é>ç>é>ë>ç>é>°>ë>ã>ç>é>Ð>ç>ä>ç>é>á>Û>è>è>í>ç>é>ë>á>à>ë>é>ä>Ý>á>Ý>ã>á>é>å>ã>ß>é>í>í>ç>á>ë>ç>ã>é>ï>è>ç>ë>ç>ç>é>ç>à>ë>é>å>Û>í>é>ç>ç>é>á>è>ç>Ä>è>í>ç>à>é>á>é>ç>é>ë>í>ç>ç>Ù>§>è>ç>à>ë>è>í>è>å>é>é>á>è>è>í>è>å>é>å>í>ã>å>í>à>ë>ñ>á>«>Ã>ã>é>ç>è>ã>à>å>ç>è>é>ä>>ë>ç>Ä>å>è>è>á>ä>è>ã>í>ë>ç>è>è>ã>ç>Ý>á>°>í>è>è>å>è>ß>Ø>å=å>ç>å>à>Ý>¼>ç>ß>é>ð>ã>Û>ë>é>ð>ë>è>é>é>é>à>Ý>é>é>Ã>é>é>á>é>É>é>è>è>ç>ã>ï>¯>é>ë>é>é>Ý>è>è>à>à>ã>é>é>ã>á>é>ã>á>å>å>å>å>å>ã>ç>é>é>ß>ì>Ø>Ù>ë>P>ä>è>è>ë>ó>ë>à>ç>ã>­>«>é>å>é>è>è>ä>°>é>í>ë>ç>¥>Ø>ç>Ý>é>á>ç>ß>Ý>ë>ã>í>Å>ã>Ø>ã>å>é>ç>í>Û>Ð>ç>è>“>ã>ß>Û>ç>ç>í>Ç>å>í>é>é>ï>ç>ã>ì>ç>å>>Û>à>Ý>ã>ð>ë>ç>á>ã>Û>­>ç>ß>à>é>ç>í>ë>é>ä>í>á>ã>é>ç>Ù>é>ç>è>å>á>õ>è>ç>í>í>ï>í>ë>è>é>ë>å>è>°>é>á>ß>ï>é>à>Ù>é>Õ>à>è>í>è>á>à>ç>é>å>ç>é>í>è>ç>í>è>ã>Û>é>à>è>ß>á>À>Û>ç>à>é>ß>å>ã>ì>ç>ï>ñ>Á>è>é>ï>å>¹>é>é>å>í>ë>¸>å>Ý>é>Ü>Ý>é>Ø>é>ç>ç>å>é>à>Ù>á>é>Ý>è>ð>ç>è>ã>ã>Ç>é>ë>ë>á>å>å>ç>ç>ë>Û>“>à>°>Ì>é>ä>í>í>è>è>é>é>ï>é>é>é>ï>é>é>å>ç>è>ï>è>ç>ë>ë>ë>å>è>é>é>Ù>í>à>ã>å>Õ>é>ß>÷>ã>é>à>ä>Ù>ß>í>Ó>í>À>°>ß>ç>è>ç>ì>Ù>å>ç>å>Û>ç>ç>í>ã>å>Ó>í>ã>å>ß>Û>ä>Ÿ>ç>é>ð>Ø>å>ã>ç>á>G>è>ë>è>ß>é>é>ì>ç>Û>é>ï>>ß>é>è>ã>ñ>Ý>é>ä>Ý>å>ë>ë>ë>å>ç>í>è>é>é>å>×>è>å>å>ë>Ð>à>•>ð>é>å>ã>á>ã>Ù>ç>å>ã>ï>ç>ç>å>ß>á>Ä>é>Û>è>ë>ç>Í>ï>å>è>ë>è>é>Ý>å>ï>ç>é>å>Ô>ï>í>à>ã>Ó>è>à>ð>ã>ã>à>é>ç>ç>ë>ã>Ý>ã>á>í>ç>ì>ã>ç>ç>ã>à>ë>é>ç>é>é>í>è>å>í>å>è>é>í>é>ç>Ý>ë>ã>é>í>Ý>è>à>ã>ç>ß>è>ï>ã>ß>ã>å>ã>ç>ç>ä>Ø>ç>á>é>ë>Ó>ï>Ù>è>á>ç>ç>é>ç>í>ã>ó>å>è>Ð>ç>×>é>å>é>í>è>á>è>å>ó>ï>ë>é>«>ã>é>³>ç>ë>ã>Ù>ã>é>©>á>†=å>ã>è>ç>ç>ë>i>ï>ð>å>ç>ç>é>ã>á>ï>å>é>é>×>è>ë>í>é>à>å>é>é>å>Ó>è>ç>ã>Ý>¹>­>ã>à>å>é> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/22.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/22.0 new file mode 100644 index 0000000000000000000000000000000000000000..4ef20a4d24ebed41d370e3d82cbccf4ea0fc8438 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/22.0 @@ -0,0 +1 @@ +é>ç>ð>é>¥>ó>é>ð>í>ñ>Ý>õ>ñ>í>ñ>é>ë>õ>é>í>è>í>ô>à>Ý>å>ó>¥>ñ>©>ó>ç>á>ñ>ç>ç>ð>é>é>ë>Ý>ó>à>ç>è>×>é>ç>é>í>ß>ó>Ø>ï>í>ë>ñ>ß>ó>°>í>ï>é>í>ð>ñ>ð>ç>è>÷>é>ñ>õ>ß>ß>ð>ë>ð>é>õ>Ý>é>­>ï>ì>ñ>ñ>Ÿ>ñ>ð>ï>ñ>ó>é>ó>í>ñ>ë>ó>ñ>ñ>ó>»>…>ñ>ë>ñ>ð>ð>ï>í>ï>é>ñ>é>ó>÷>ì>í>í>Ý>ñ>í>ë>ï>ð>í>ï>õ>ð>ð>ø>ç>å=é>à>í>ï>ñ>ë>Ø>ë>í>Ý>ë>ñ>³>í>ð>í>á>ð>è>ã>õ>í>ñ>ð>ç>è>Í>í>à>ã>ï>Ñ>Ø>ñ>Ë>ï>ï>ñ>ó>é>Ì>D>ñ>ó>ï>ç>¿>ð>ñ>ï>ç>í>ï>í>ñ>ó>Ø>ñ>ù>é>•>ð>ï>ô>ì>¯>è>õ>è>ï>í>Ý>ó>ñ>÷>ç>ð>ó>Ÿ>÷>Ý>ð>é>ë>ð>ó>ñ>ç>ï>è>ó>í>Ø>ñ>ñ>ï>á>ñ>ð>é>÷>ð>ï>ë>Ý>è>ë>ï>ó>é>õ>ð>ë>é>ë>ñ>õ>å>ï>í>Ë>í>ë>ó>í>ó>ë>ï>ð>ç>ì>í>»>ó>í>í>í>ñ>ï>ó>ó>è>ç>ï>ô>ô>ñ>>ï>ð>ï>í>ð>ø>é>ï>œ=é=ç>ñ>ç>ç>é>ñ>Á>ð>é>—>õ>è>í>ç>ã>ñ>Û>ñ>é>õ>ã>ø>>å>å>é>ã>ï>»>ð>í>ë>ð>Ì>ð>ì>ë>ç>ï>ï>ñ>ï>é>õ>Ó>÷>ô>å>í>ï>ó>ç>ç>ó>ð>Ì>ð>ë>à>Ý>é>í>ó>å>ñ>ð>ð>ï>ð>ð>ù>ó>é>ã>í>¯>í>í>ñ>á>ç>$>õ>ñ>õ>í>Ý>ç>ñ>í>é>í>Í>é>ç>í>ç>É>ñ>é>ñ>í>ñ>ë>ç>í>å>ë>ï>í>ç>í>ï>ï>ã>í>ó>ç>±>à>ð>ï>Ñ>õ>ç>í>ó>Ð>ë>ñ>å>ð>Ç>ó>í>ð>á>õ>ï>Ø>í>í>ã>ó>ã>õ>õ>ð>ñ>ë>Û>ï>—>ó>í>ì>ï>ñ>í>ï>ñ>ñ>Ù>ï>ç>é>å>ï>ð>ð>ñ>ë>ñ>ñ>ñ>í>è>ð>À>ï>ñ>ç>ñ>ó>è>é>é>é>í>ñ>©>Ô>ñ>è>ó>ð>í>÷>à>ß>í>ñ>ï>ï>é>ë>ð>ñ>ï>í>é>ë>ù>ñ>ñ>ë>í>­>ë>ð>í>ñ>í>ð>ï>ë>ï>Õ>ð>ï>è>ñ>Á>é>í>ã>ë>­>ó>ï>ç>ð>ã>Ç>ó>ç>ë>é>×>°>ï>ã>ï>õ>í>ç>ó>é>Í>é>ã>ç>í>é>à>ð>ã>È>ñ>>õ>ì>å>ð>é>í>Ð>ç>ï>ñ>å>÷>ñ>ð>í>õ>ñ>é>í>Ø>ï>à>ø>õ>á>ð>í>ñ>ï>ã>ô>ç>ï>ï>é>é>¬>å>å>ñ>ñ>ð>ç>ë>ð>ß>ì>ð>ë>ë>ç>Ý>ð>ï>÷>í>ë>Ð>ë>ð>ã>à>ï>ó>Ó>ñ>ï>ñ>>í>ó>ñ>Ý>ã>ï>ç>å>ë>ß>ë>ï>ª>ó>ñ>ï>ñ>Û>ï>ç>ç>ï>ó>ù>ñ>è>í>é>í>ó>à>è>¼>è>í>ç>Ç>ñ>ó>õ>í>í>ë>ï>é>ï>Ó>ó>ð>í>ñ>H>ð>í>ð>ó>Ç>í>™>ó>ñ>é>ë>Ø>Ø>á>å>ð>ç>ï>ï>é>í>ñ>ñ>ç>ñ>ð>'>ó>ô>é>ñ>ó>Ï>è>ï>ï>é>ç>é>å>ë>ï>p>¹>ô>ï>ë>é>ô>ï>ñ>ñ>ð>õ>í>í>ñ>ñ>>é>ç>á>è>é>ñ>õ>ë>á>ó>ß>Ì>è>é>ï>í>é>ç>õ>í>ñ>Ý>í>×>•>ç>ñ>ñ>é>ì>ï>é>ñ>è>ñ>ð>ñ>ó>ñ>Ã>Û>ë>ó>×>ë>ó>'>ì>í>è>ï>ï>ï>ë>í>ð>ñ>ñ>ã>ï>í>ï>ñ>ð>ó>ç>÷>ï>ã>á>ó>à>ô>ñ>ï>ì>ó>ù>ë>ð>á>è>à>ì>Ü>ð>í>ó>Ã>«>ð>ñ>ë>ç>ì>ñ>í>í>ñ>í>ë>ï>é>ç>ë>ä>å>ñ>í>ð>ñ>é>ð>Ý>ó>ç>ï>ñ>è>ì>í>ñ>õ>ï>!>ó>é>ë>å>õ>è>g>ð>ñ>è>é>ñ>õ>ñ>ô>Ý>ó>õ>ì>ð>Ø>ñ>ð>í>¹>ï>é>ð>í>ñ>ó>å>Ù>ñ>ñ>é>ñ>ï>Ù>ð>í>ð>ð>ã>˜>3>í>ð>ñ>ñ>í>í>ó>›>ë>ï>è>ë>ã>ð>ð>í>ë>è>ó>ó>ì>ñ>ó>à>ð>à>ì>à>ë>ã>ß>é>ë>÷>ë>ä>í>ð>è>ñ>ñ>ç>õ>¨>é>í>í>õ>á>Ý>é>ë>ñ>ç>ã>ï>ó>é>à>å>ñ>Ð>Ø>ï>ï>ð>›>ð>ï>ð>ç>ï>é>ç>è>È>ó>à>Œ>õ>ð>ó>ó>ð>ñ>õ>³>ï>ã>×>õ>ï>å>ð>é>í>ñ>í>õ>õ>Ý>ó>è>ñ>é>ð>å>Ý>ñ>Õ>÷>ð>¿>÷>ç>é>ñ>õ>ï>ñ>ç>ë>è>é>ë>õ>÷=é>ï>ó>ç>ð>ñ>é>é>á>ð>Ó>õ>é>í>ñ>ð>÷>í>ð> >ð>è>ó>ó>õ>à>ð>ñ>ð>ï>ð>ï>Ý>ë>ë>±>í>ñ>ß>ñ>à>í>í>é>ï>ð>ó>[>ñ>é>í>ñ>¸>ð>ó>ë>õ>ï>ç>ñ>÷>è>ð>ï>Ï>í>è>ð>å>“>ð>ï>è>ï>ñ>ï>ñ>å>õ>ë>á>ã>›>à>ô>Û>ô>›>ì>å>ï>Ð>ó>À>í>ë>ë>í>ë>ð>ë>ó>ù>ð>ó>ñ>ð>ñ>Ý>Ñ>Ñ>è>ß>ñ>ë>í>ø>í>í>ñ>ñ>í>Õ=¡>é>ð>ñ>ç>Ÿ>é>í>í>ó>Ë>í>ñ>ï>ð>ð>í>ä>õ>í>ß>í>ï>í>ñ>á>>ð>ó>ë>è>í>Ð>ë>ï>í>ó>í>é>ç>ð>å>ð>ï>á>ç>ï>ß>>è>ó>Ü>ï>õ>ñ>õ>è>ï>ó>ë>à>ñ>é>ï>é>ñ>Ñ>ð>ï>ñ>³>ç>ï>ð>í>í>ï>ñ>í>è>å>ð>ó>é>ï>ç>õ>é>ç>ó>ç>ñ>ð>à>í>É>ð>ç>ð>à>è>õ>å>ó>ë>è>ð>ð>é>è>ó>è>ë>é>ð>ó>ñ>ñ>ó>é>õ>ï>í>ï>í>×>é>õ>÷>Û>í>è>ñ>>õ>µ=Õ>ó>í>è>å>õ>ï>é>ð>ð>é>í>ñ>ì>í>Û>ñ>å>ð>ñ>è>ð>ë>ç>ë>ï>ï>÷>ð>è>ç>Ý>é>è>ï>í>ï>é>í>K>ç>é>ó>ð>ñ>ó>í>í>å>ë>è>Ý>ð>ñ>í>ô>ð>ð>å>ñ>ï>ñ>ì>ð>ô>ã>ó>á>ë>ð>Ó>à>ë>ë>é>Ý>í>ï>Ñ>ñ>ë>ó>ë>ì>í>w>é>í>è>í>ó>ñ>ó>÷>ó>å>å>å>ð>›>í>ï>é>ñ>ç>ð>í>é>é>í>ç>ë>ï>ð>é>ð>ï>ï>ñ>ó>ï>ð>P>é>Ù>ó>Ý>ë>í>í>í>ó>á>í>ó>í>ñ>ë>Õ>ã>é>ï>ï>ð>é>ð>í>ð>ñ>ç>ï>ó>õ>á>ñ>í>è>ñ>ï>á>é>ð>í>Õ>å>é>ç>è>é>é>ç>Ó>Á>©>í>ã>ñ>Ã>ó>ñ>ç>ë>è>ë>ç>í>è>ð>Û>í>í>ï>ã>´>é>ä>ð>Ë>í>ñ>í>é>×>ë>Ó>ï>í>õ>µ>ï>í>÷>õ>ó>ñ>ï>Ð>õ>è>í>ñ>é>ï>ó>ì>ï>÷>é>ï>é>ñ>ó>Ñ>ð>ð>é>í>ñ>ó>ñ>í>ç>õ>ì>í>í>Ý>ñ>ç>ó>í>Ø>ï>ë>ï>ñ>ç>ð>õ>ô>è>ç>é>á>Ñ>í>D>ð>ï>ã>ï>ñ>ì>ï>ñ>ï>ñ>ð>ñ>õ>í>ñ>©>Ó>ñ>í>í>ð>ç>·>ç>ð>ð>ð>í>Ó>á>ï>ô>ç>¹>ì>ñ>é>é>è>É>í>ñ>é>ó>ó>è>ë>÷>ï>é>ð>è>ë>í>ç>ï>÷>ë>Ù>ï>ð>ë>é>é>à>ó>ß>ï>ï>Ì>é>ì>ñ>Ø>é>é>Ý>Û>»>ç>ô>í>ô>ç>ô>Ø>å>ó>ç>ç>©>ï>´>ç>»>ð>ô>ï>ó>ì>ß>ð>é>>ñ>ð>è>Û>ë>õ>í>Ù>í>ð>ñ>ñ>ð>ó>ñ>ð> >ì>ñ>í>ã>ð>í>ç>ð>ã>Ø>ð>ï>ï>ó>ë>å>ð>ë>è>ð>ç>ë>ï>ð>ã>ñ>ã>é>ð>ï>Å>Ù>é>ñ>ð>ñ>ã>á>õ>í>õ>ë>ì>è>+>ë>õ>ñ>ã>ï>ð>à>í>è>È>ñ>ë>Ù>ï>ð>í>í>ë>ð>è>ï>é>ë>õ>µ>ð>ç>Ô>å>í>Ù>ï>ë>í>í>ï>ë>í>é>ñ>ñ>­>à>ô>à>í>ã>í>å>é>í>ë>ç>ë>í>ï>÷>ó>í>è>ó>é>ð>õ>ï>ð>ñ>é>‡>ñ>ð>è>ó>Í>ë>é>í>ì>ð>ñ>Ý>ë>ð>û=ç>Ù>ð>å>ð>ï>è>ñ>í>ñ>é>ë>ë>ì>à>í>¸>ð>ó>¨>é>é>ï>ð>Ã>ä>å>ð>é>ñ>’>ç>ñ>ï>ó>í>å>é>è>à>›>ç>á>ï>í>í>ñ>ð>Ý>å>ç>õ>é>[>ñ>ð>ð>å>í>å>ë>ñ>è>ç>è>ñ>ï>í>±>ó>ñ>ç>ó>á>é>ç>ç>ô>Ý>ð>Ý>ï>ë>ª>ç>Ç>Ã>í>ï>÷>ç>È>é>ó>í>ó>ô>÷>é>í>ï>ã>ð>í>õ>ð>í>ñ>í>á>ð>í>ó>á>ð>ë>¥>è>ï>é>ï>ó>é>ë>õ>ï>í>ë>í>ð>ó>í>ñ>Ý>ñ>Ó>ë>í>ç>£>Ý>ë>ë>ï>ñ>å>ã>ï>ð>ï>ð>ó>ð>õ>õ>á>ë>ó>™>í>í>ó>ä>í>ë>é>ð>ñ>õ>©>é>ã>ë>ç>é>ç>ô>É>ñ>ð>ç>ë>ñ>ñ> >ì>ç>ë>ë>š>ï>ç>í>è>µ>ï>í>ï>ï>õ>é>ð>ó>í>ë>÷>ë>é>é>ô>ð>ñ>ó>ð>é>Ã>í>ç>ï>ç>ï>ð>ï>è>>÷>ó>é>ý>ó>è>ì>ð>ë>ï>ì>ë>°>ë>è>ì>ë> >ó>å>ó>è>é>é>ç>Û>ð>ï>¡>ã>è>é>ñ>é>ï>ë>é>ï>í>í>ì>Ã>ì>ã>é>ß>ï>‡>õ>ç>ç>ï>ã>Ù>ì>ï>ð>õ>ï>õ>í>ñ>ó>å>à>é>ë>å>ë>õ>ñ>ð>ð>ó>ï>H>ó>ï>õ>í>>ï>ñ>á>ù>é>é>ó>í>ð>é>õ>ï>å>ó>ç>ð>ð>ã>”>ï>ð>å>ñ>í>ß>ï>è>ç>ô>ñ>ð>ï>õ>ñ>é>é>é>õ>Ý>é>÷>í>å>ã>ð>í>÷>ð>ó>é>Ð>é>ç>á>ñ>ó>ð>í>é>ç>ø>>°>¥>è>ï>ï>ñ>ó>ï>í>Ó>ñ>ë>Ý>ë>è>ç>ñ>ë>í>ð>õ>í>é>×>ð>?ñ>è>ï>ñ>ó>ä>í>ð>í>Ã>ï>À>í>ð>ñ>ð>ã>ñ>í>í>ñ>é>ó>í>ì>ñ>ó>ð>ï>ñ>ð>ð>×>ñ>á>Ý>ã>í>Ã>å>ø>á>ç>µ>ë>í>ë>ë>Û>è>ï>a>ó>Ù>ç>E>ð>ñ>ð>ð>ó>ï>ð>í>ç>ñ>ð>ð>ñ>è>ñ>ô>÷>«>à>×>í>é>è>ð>ã>ì>ï>÷>ð>Û>ç>í>é>ä>›>ï>í>³=ì>í>è>å>ï>ï>é>à>ñ>ñ>í>ð>í>í>ï>ë>ó>ß>ï>ç>ð>ñ>ó>í>ç>ë>s>ë>ï>Ø>Á>å>í>ó>ë>è>ì>ï>ï>ï>é>ï>‹>á>ñ>ä>í>å>”=ë>õ>ð>í>÷>ó>ë>ï>í>ï>é>í>ë>÷>ð>é>ñ>ç>ó>ï>ó>ß>í>é>ï>ç>ï>ì>ð>Ð>ç>ï>é>ó>ï>ó>¼>í>é>ð>õ>ë>ð>ð>ï>é>ì>ñ>ë>ë>ï>ë>Ñ>é>í>í>ð>é>ì>ð>è>ð>ï>ñ>ñ>¸>ð>ë>ð>é>Õ>ó>é>ã>ð>ñ>í>í>í>ã>ï>á>é>é>í>ð>Ý>ó>Ñ>á>å>í>ñ>í>ð>Ü>ñ>ï>í>Ù>è>ñ>ð>>é>à>í>í>³>ã>é>ï>Ý>ð>ð>ç>å>ñ>ð>ñ>Ý>õ>ñ>ð>ñ>ç>é>ç>í>Û>ð>ï>5>Í>õ>ð>ë>ð>÷>ì>×>í>é>é>ç>é>ð>ó>é>é>è>ó>ç>Ÿ>í>ð>í>ë>Ï>ñ>í>ñ>í>ë>ð>é>õ>ï>é>ð>÷>ç>ñ>í>í>*>é>ñ>ð>ñ>å>ã>í>í>ñ>ë>ð>í>ñ>Û>ï>ð>÷>ì>ó>ñ>ì>ó>ï>ç>í>ì>ë>ã>ç>ï>ç>>Í>ï>ó>ñ>è>ð>õ>é>ì>ó>ë>ë>í>õ>ñ>ë>ã>ë>Ç>¸>À>ï>í>ï>ó>Ó>ñ>±>ç>ó>ñ>è>í>í>£>ì>÷>ñ>ô>é>å>í>å>ì>ã>ï>í>ì>í>ñ>í>ð>û>í>à>ï>ï>³>õ>ñ>í>í>ñ>í>ñ>ð>ó>à>>ð>é>õ>ë>í>Ð>í>í>ñ>Ó>ã>ñ>í>ì>õ>í>_>È>å>ð>ñ>ë>ì>ï>ë>÷>ï>ó>é>è>Ÿ>í>ï>à>í>è>ñ>ñ>í>õ>ñ>×>ã>ð>¬>è>ñ>ó>ó>ç>í>ó>ï>ð>ï>ñ>ï>å>è>ñ>ð>ï>Ó=ï>Ý>·>ð>ð>ç>ã>ñ>í>ó>ð>ë>ñ>ð>è>ð>õ>í>ï>÷>ï>ð>á>ð>è>í>ð>>ð>å>ë>è>é>£>Á>ð>ñ>í>ß>ì>ç>Ð>ñ>õ>ë>í>ñ>í>ð>Û>÷>ë>õ>ô>ë>ç>ë>á>å>ï>ñ>ð>í>í>ñ>°>ð>ï>í>í>ñ>Q>ë>ï>ô>é>ç>à>ë>ë>ë>ä>È>é>ð>é>í>ñ>å>³>í>å>è>·>í>ð>ï>ð>è>ï>ó>ó>ï>Õ>Ë>ë>í>è>ï>ð>Ý>ï>ï>ñ>ñ>ð>ð>í>å>í>À>õ>ó>ï>ï>è>í>è>ð>¹>à>˜>ì>ë>å>è>ó>Ý>í>ë>í>õ>è>ï>ó>í>±>ð>ë>×>ñ>ð>é>ë>ã>ñ>í>ñ>Ð>ë>è>á>è>ã>ó>ð>ì>é>ñ>ñ>í>ó>é>ñ>ð>é>ï>ð>ç>ï>ç>ð>á>ï>é>à>é>è>ç>ð>í>é>è>ð>í>§>ã>ï>ó>ë>ë>ð>ï>õ>ñ>Ë>ó>ð>ï>ñ>õ>ó>ã>ñ>ñ>ð>å>ñ>ã>ó>ë>à>ç>ë>í>í>é>ñ>ã>ó>ñ>ð>ð>ì>ï>ñ>ë>ç>õ>Ç=ë>å>ñ>Ë>í>ó>ñ>í>í>Ø>ó=í>ï>é>ñ>ï>§>ï>»>ë>õ>ë>ð>í>í>í>á>Ÿ>ñ>é>û>ï>ð>å>í>ì>Ã>Ë>í>ë>“>è>ñ>é>Ñ=>é>ã>í>ï>ï>ï>ð>ð>ì>ë>×>õ>ð>{>á>ã>Ø>ë>õ>è>ó>í>í>í>õ>ð>í>à>é>c>ã>ô>ð>è>ë>ë>Ó>ð>ç>ð>ô>ñ>ï>Ñ>é>ä>é>é>ó>ë>ñ>ð>é>é>ñ>å>ë>å>í>é>á>ë>ñ>í>å>ó>í>é>á>÷>É>è>é>ï>õ>é>í>Ó>ð>í>ñ>í>÷>ã>á>ï>í>í>é>ó>ð>>é>ï>ô>é>Ð>ï>í>õ>ø>é>ï>ì>ð>ï>ã>ó>ó>ã>ç>ñ>ó>å>ð>å>ó>À>è>ï>ß>ä>í>í>å>÷>ç>ð>ñ>ë>ð>ð>ñ>í>ó>ï>ë>ß>ç>í>å>é>ï>Ë>ð>ç>ì>í>ë>ë>ï>ø>Ñ>é>ç>ñ>ï>ï>ó>ñ>å>è>õ>¹>ñ>à>å>ð>í>ë>ð>Ý>ï>í>í>í>í>í>è>ì>ñ>í>ç>ë>ñ>å>õ>ñ>Ý>ð>ë>ë>•>ï>ë>é>ð>Ï>ñ>ï>ð>ð>ñ>è>•>÷>ó>µ>í>È>ó>÷>ë>ð>ë>è>ë>è>£>ã>Ð>á>ñ>à>é>é>í>ï>ë>ç>é>ï>×>ó>ç>Ý>é>ñ>ñ>í>ð>ó>ë>ð>ï>Ï>ï>ð>ð>é>Ý>Á>#>ó>é>Á>é>ñ>ç>ð>ç>í>í>í>í>ô>ï>ï>ð>ë>í>í>ñ>ñ>Ù>ñ>ï>ð>é>ã>ó>ï>œ>í>ñ>è>÷>ß=ñ>õ>í>ï>ñ>ô>ð>ð>í>é>à>é>ë>ð>è>ñ>ç>ó>ð>ï>ð>÷>é>ð>Ù>ì>ð>à>é>ô>Ù>ñ>è>ó>í>é>í>Ù>ï>è>í>ß>õ>ï>÷>ë>ï>ë>ã>Û>è>Ù>ó>í>ñ>ï>ë>ë>é>à>¼>è>ñ>í>ï>ï>ñ>ï>í>å>ð>å>í>í>ï>Ó>í>é>è>ï>Û>ñ>ó>ç>Ó>ï>í>ç>ë>ï>ð>ó>Ø>ð>Ÿ>ï>Ù>ë>ð>ð>ï>ð>í>ó>°>ñ>ë>ë>ð>Ø>ï>è>ñ>ð>è>å>ð>ó>ó>ð>ð>ð>ä>ë>ó>ï>ì>å>ð>ç>é>ã>ñ>ë>é>é>ñ>ð>ñ>ï>ï>ñ>ï>é>ñ>ó>í>í>ð>ë>ï>ñ>ë>å>ñ>ñ>é>ã>ó>ï>é>ñ>õ>é>ï>ë>Ç>ï>ñ>ï>ë>ï>é>ó>ð>ð>ð>ô>í>ñ>Ý>™>ð>ñ>é>ó>í>í>ñ>ë>ð>ï>ë>ë>í>ð>í>ï>í>í>õ>í>ð>ð>è>ó>ø>é>«>Å>ë>ñ>ï>ñ>é>è>ë>ð>ð>ï>é>>ó>í>Ë>ë>ñ>ï>í>é>í>é>õ>ó>ï>ï>ð>è>í>à>è>©>÷>ð>é>ï>ñ>å>Û>Ó=í>ï>é>ç>ã>¹>ñ>è>í>ó>ë>ç>í>ñ>õ>ñ>í>ð>õ>ó>é>è>í>õ>È>ì>ô>ë>ð>Í>ñ>ñ>ñ>ï>ì>ñ>§>ñ>ë>÷>ð>á>í>ñ>é>é>í>ï>ð>è>é>ð>é>í>í>é>í>ë>í>é>ð>ñ>ñ>á>í>ç>ç>ð>H>ë>ð>ï>ñ>õ>õ>ë>í>ë>¨>­>ñ>í>ì>ð>ð>é>­>õ>ñ>ñ>ë>›>á>ð>å>ñ>è>í>ã>ã>ð>é>õ>È>ï>à>ë>ë>õ>í>ð>ä>Ø>í>ð>‡>è>í>ã>ï>ð>ð>Ë>í>ñ>ë>ó>ð>ñ>ì>ó>è>é>‡>å>í>å>ç>÷>ñ>ï>ï>ð>å>­>í>ä>è>ó>ë>÷>õ>ð>ë>ñ>í>í>ï>ë>å>ñ>ñ>é>è>ë>ó>ð>í>ï>ó>÷>ð>ô>õ>ë>ñ>é>ð>­>ï>é>ç>õ>í>é>Ý>ñ>ß>è>ñ>ó>í>ë>å>é>ô>í>ð>ó>õ>í>í>ñ>ó>ë>á>ñ>å>ñ>å>è>Ã>ã>í>é>ï>å>í>é>õ>ð>õ>ù>Ç>í>ó>ñ>ë>¸>ì>ñ>ì>ô>ð>³>é>à>ï>á>å>ï>à>ï>ë>ï>ì>ô>í>å>ç>ñ>ã>ï>ø>ï>ñ>ç>é>Å>ó>ó>õ>ë>ë>ë>í>ë>ó>à>ˆ>ë>§>Ð>ñ>ç>ñ>ñ>í>í>ï>õ>ô>ï>ó>í>ñ>ð>ð>ñ>í>ñ>÷>í>ì>ñ>ñ>í>ï>í>ñ>ï>á>ó>ç>é>ë>×>í>è>û>ï>í>é>ì>á>è>ó>Ø>õ>Ã>›>á>ð>ð>í>ñ>à>í>ï>ð>à>ï>ë>ñ>í>ë>Û>ñ>é>é>è>ã>é>œ>ð>ï>õ>ß>í>ð>í>ë>5>ï>ñ>ï>ã>ó>ï>ñ>ñ>ç>í>ð>>é>í>ð>ï>ó>à>ë>é>à>í>ó>ð>ï>ð>ï>÷>ñ>ï>õ>ï>ß>í>í>í>ó>×>è>>ù>ð>ñ>ë>ç>í>Ý>é>é>é>÷>ï>ð>í>ç>ë>È>ñ>ç>í>ó>ð>Ð>ñ>é>í>ï>ð>ð>á>é>ó>é>ñ>ð>Ý>ó>ó>ç>è>Ø>í>å>ó>è>è>è>ñ>í>ñ>ñ>ë>ç>é>è>÷>í>ó>é>ñ>í>ç>è>ñ>ð>ï>ð>ë>õ>ñ>ï>ï>è>ñ>ó>õ>ñ>ñ>è>ó>è>ï>ë>å>é>å>é>ð>å>ï>÷>ë>ä>ë>ç>é>ë>ï>é>à>ï>è>ð>ñ>Û>õ>ã>í>é>í>í>õ>í>õ>ë>õ>ë>ï>Õ>í>Û>í>ë>ñ>ð>ï>ç>ð>ï>ù>÷>ï>ô>£>í>ñ>µ>ð>ð>í>Û>ï>ñ> >ë>©=ë>é>ñ>ï>í>ó>u>÷>ô>ï>ë>ë>ð>ð>å>÷>ï>ð>ð>Û>ð>ñ>ñ>ï>ç>ì>ñ>ð>ð>Ù>ñ>é>é>í>¹>¤>é>á>ð>ë> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/23.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/23.0 new file mode 100644 index 0000000000000000000000000000000000000000..b00bd88d2dca05875231b512ec395bb9d9f3f415 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/23.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/24.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/24.0 new file mode 100644 index 0000000000000000000000000000000000000000..325b3b0b9bc3228f0950402f3ae6a327df3e64f6 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/24.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/25.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/25.0 new file mode 100644 index 0000000000000000000000000000000000000000..d4137f02a747cc4bd43facd66e292343e4b7f9a2 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/25.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/26.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/26.0 new file mode 100644 index 0000000000000000000000000000000000000000..1bea8c07b2495c8dc823bbaebfd060bfcb105c0e Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/26.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/27.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/27.0 new file mode 100644 index 0000000000000000000000000000000000000000..c4a09a305526335b24cadadb2ef5595d21c9bad0 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/27.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/28.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/28.0 new file mode 100644 index 0000000000000000000000000000000000000000..902fc6d7f078a2124c58e1337c701a1f053a9036 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/28.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/29.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/29.0 new file mode 100644 index 0000000000000000000000000000000000000000..4591af13b20c3db1fd891a1c22641e6cdd5c93a2 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/29.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..70901ae0de6954844894455d3e731993af878e23 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/3.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/30.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/30.0 new file mode 100644 index 0000000000000000000000000000000000000000..24e888891bb3b909801bd7cf525f1affa145782c Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/30.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/31.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/31.0 new file mode 100644 index 0000000000000000000000000000000000000000..52a167bc4bc0b4c25adc40a15adbacb7db082ccf Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/31.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/4.0 new file mode 100644 index 0000000000000000000000000000000000000000..f6bc355368fc99adfdb284ea9995e522e20be267 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/4.0 @@ -0,0 +1,2 @@ +>>‚>…>G>ƒ>…>„>…>ƒ>s>‰>…>ƒ>ˆ>…>…>ˆ>…>‡>{>‰>„>1>…>{>‹>a>‡>1>‡>‡>>ˆ>…>…>„>h>ƒ>>h>‹>$>>…>U>…>x>>…>'>‰>7>…>‡>ˆ>€>€>…>;>‡>|>ƒ>‰>>ˆ>‡>…>…>…>>ƒ>…>ƒ>x>‡>…>‰>…>ˆ>}>]>8>…>‡>ˆ>>E>‡>‡>‡>…>{>‡>ƒ>ƒ>…>…>‡>†>‡>…>->/>€>…>…>…>…>…>‡>}>…>…>…>€>‡>…>>…>ƒ>…>…>ƒ>†>…>>…>ƒ>†>‰>ˆ>€>W=…>}>>‡>‡>ƒ>i>>†>>ƒ>ˆ>t>}>ƒ>‡>t>€>ƒ>>‡>>ˆ>…>ƒ>…>i>o>Š>…>†>=>i>‹>g>…>…>ˆ>…>…>p>w>‡>‰>ƒ>x>k>‡>‡>ƒ>y>„>…>€>‡>‡>q>‡>†>s>3>ˆ>†>>‡>#>…>…>>…>ƒ>k>‡>‡>‡>>ƒ>…>E>‡>ƒ>‡>>ƒ>ˆ>‡>ƒ>ƒ>…>|>‰>>o>…>|>ƒ>{>…>…>‡>‡>‰>ƒ>ˆ>>…>‡>ˆ>‹>…>‡>>…>‚>ƒ>ˆ>…>]>‡>…>p>>ˆ>‡>‡>‡>ƒ>‰>‡>„>w>‡>_>ƒ>ƒ>ƒ>…>‡>…>…>…>ƒ>…>†>…>ˆ>ƒ>7>…>†>€>‡>‡>‰>…>‰>!=·‡>„>y>>}>…>Y>ˆ>€>7>‰>‡>…>ˆ>ƒ>ˆ>>ˆ>A>ˆ>ƒ>‰>">u>ƒ>ƒ>>…>c>‡>}>ƒ>ƒ>k>‰>…>|>q>>‰>ƒ>…>…>…>u>‡>†>u>‚>ˆ>‡>ˆ>ƒ>…>†>…>{>…>|>€>‡>ƒ>„>…>€>ˆ>…>€>ƒ>…>…>>…>…>…>>ƒ>‡>…>ƒ>X>€>‰>„>ƒ>†>…>d>†>‡>…>ƒ>d>…>C>‰>ƒ>d>ƒ>…>‡>†>‡>ƒ>‡>}>y>w>‡>‡>ƒ>Š>‰>}>x>…>†>ˆ>3>{>ƒ>ˆ>‚>…>‡>>‹>}>>ƒ>t>ˆ>o>…>ƒ>…>…>‡>ƒ>3>ƒ>ƒ>q>…>>…>Œ>…>‡>…>>ƒ>#>…>ƒ>‡>‡>‰>>‡>†>ƒ>g>…>}>‡>ˆ>ƒ>ˆ>…>…>‡>ˆ>„>…>‡>>ƒ>E>…>…>>‹>‡>ƒ>}>ƒ>†>‡>‡>7>x>…>ƒ>†>‡>…>‰>p>>…>…>ƒ>‡>…>…>…>…>…>†>}>ƒ>‰>ˆ>ˆ>…>…>$>ƒ>‡>‰>‰>ƒ>‡>‡>‡>…>H>„>…>†>†>I>€>„>ƒ>ƒ>I>…>‡>…>…>…>!>†>†>‡>…>€>7>‡>ƒ>…>‰>ˆ>ƒ>ƒ>ˆ>w>…>ƒ>€>‡>…>t>‡>>>…>1>…>€>>†>>‰>m>ƒ>‡>„>s>‹>…>…>‰>ˆ>ˆ>y>ƒ>…>‡>‡>‡>…>ƒ>>‡>†>K>†>…>k>‡>‡>s>…>3>€>x>‡>ˆ>‡>…>†>ƒ>ª=‹>ƒ>…>ˆ>>ƒ>w>‡>ˆ>ƒ>†>u>ˆ>†>‡>y>ƒ>…>>…>‡>…>@>‚>…>‡>e>ˆ>…>ƒ>€>{>„>…>>5>‰>‹>…>ƒ>|>…>ƒ>p>„>ƒ>…>‰>€>ƒ>}>…>…>€>‰>=>ƒ>…>„>Y>o>‡>ƒ>‡>ˆ>…>ˆ>ƒ>„>h>‰>ƒ>‡>„> >‡>„>†>…>p>„>4>‡>ƒ>…>…>k>>>…>…>†>>ƒ>…>…>ˆ>ˆ>>‰>ƒ> +>ƒ>‰>…>ˆ>ˆ>g>ˆ>‰>ˆ>‰>…>…>ƒ>ˆ>ˆ>G>Q>„>ƒ>ƒ>‡>…>>…>‡>…>‡>y>…>‡>ˆ>M>…>‡>S>|>ƒ>…>ˆ>{>|>‹>s>Y>…>‡>}>>>…>ƒ>…>…>e>…>d>+>>ˆ>‡>ƒ>†>…>y>ƒ>†>‡>ˆ>‡>y>ˆ>>€>…>…>€>†>‡>]>ƒ>‡>„>‡>ƒ>‡>ƒ>‡>‰>…>‡>€>…>ƒ>€>ˆ>}>ƒ>…>„>‰>…>>‡>…>…>ƒ>‡>ˆ>‹>‡>…>„>{>…>>…>ƒ>‡>‡>‡>c>X>…>…>…>M>…>ˆ>‡>‹>…>…>>‚>t>„>ƒ>}>x>Š>ƒ>ˆ>‡>†>‡>s>ƒ>‡>…>…>ƒ>>>†>‡>…>8>…>…>‡>>‡>…> >…>…>ƒ>„>‚>‡>ˆ>ƒ>M>…>ˆ>…>…><>…>ƒ>‚>A>…>…>…>‹>‡>Š>ƒ>>‡>…>…>ˆ>‡>p>…>‹>‡>‡>‡>5>„·ƒ>…>ƒ>…>{>‡>‡>U>>…>€>>y>…>…>…>…>>‡>ˆ>…>‡>‰>ƒ>…>>ƒ>K>ƒ>\>g>ƒ>…>ˆ>…>>‡>‡>>…>ƒ>‡>„>C>‡>…>ƒ>‡>>€>i>‡>…>†>„>…>‡>ƒ>>s>‹>_>x>}>‡>‡>3>ƒ>‡>‡>w>‡>ƒ>>…>E>‡>u>>…>‡>‡>‡>…>>w>8>‹>->y>‡>…>x>‰>‡>†>…>†>‡>…>L>…>>‡>…>‡>…>…>‰>8>…>…>[>‡>‡>…>…>‡>‡>…>„>{>u>>…>ˆ>£<ˆ>€>‡>…>‡>…>…>ƒ>w>…>c>ˆ>‡>…>‡>…>ˆ>‡>…>1>…>‡>>ˆ>‰>>‡>ˆ>…>…>…>…>K>…>ƒ>,>€>‡>`>}>ƒ>ˆ>…>|>ˆ>‡>ˆ>Q>†>…>‰>…>p>ƒ>‡>…>†>>ƒ>‡>…>€>…>…>'>ˆ>…>†>X>1>‡>…>ƒ>ƒ>…>>‡>€>‡>ƒ>u>x>;>q>…>g>…>i>…>>‡>\>‡>]>„>ƒ>‡>‡>}>}>…>ˆ>…>ˆ>ˆ>…>†>‹>y>|>X>‚>>ˆ>…>…>ˆ>>‡>…>ˆ>ˆ>Ç=7>ƒ>‡>‰>{>|>ƒ>‰>ƒ>…>‚>‡>ƒ>ˆ>ƒ>…>g>p>‡>€>X>…>†>…>…>ƒ>ï=ƒ>„>…>…>…>p>…>„>…>†>‡>`>>‡>>‹>€>}>c>ˆ>4>h>>…>s>‡>†>ˆ>…>…>…>…>…>‚>ˆ>†>y>‡>ƒ>e>ˆ>€>†>S>‡>…>ƒ>y>ˆ>‡>…>„>…>ƒ>ƒ>‰>ˆ>…>ƒ>‡>}>x>ƒ>„>‡>„>x>>T>ƒ>>‡>c>ˆ>…>|>…>ƒ>€>‡>>‡>ƒ>‡>y>‡>ƒ>‰>‡>>‡>…>ˆ>ˆ>>‹>ƒ>>?>…>€>‹>ˆ>y>>ˆ>9>‹>ª=m>ˆ>…>y>‡>‡>>x>‹>‡>‰>}>…>†>‡>y>…>>‡>…>w>…>‰>e>…>…>„>‡>‡>>>p>‡>€>ƒ>>‡>‰>ƒ>€>…>|>‡>ƒ>„>ˆ>…>‰>…>…>‡>>ˆ>…>…>‚>>‡>y>…>…>„>…>ˆ>‡>€>ˆ>`>‡>ƒ>>0>‡>}>…>…>>ƒ>c>ƒ>|>…>ƒ>ƒ>…>G>…>…>ƒ>…>…>…>…>ˆ>‡>…>ˆ>ƒ>…>=>ˆ>…>†>‡>‡>u>{>ƒ>ƒ>{>…>…>†>‡>>…>…>…>„>„>ˆ>ƒ>å=…>H>†>}>ƒ>…>ˆ>ƒ>‡>e>…>…>ˆ>…>…>s>€>ˆ>‡>…>‡>…>…>…>‡>†>…>‡>…>‡>ƒ>…>…>ˆ>…>‰>„>‡>‡>‡>q>‰>>‡>s>ƒ>‰>ƒ>h>\>C>w>…>€>K>‰>ˆ>…>>‡>{>…>…>m>‰>u>„>…>ˆ>…>E>…>>‡>s>ˆ>>>…>Y>…>C>‡>ˆ>‰>P>‡>…>‡>‰>†>‡>‡>)>‰>…>ˆ>ƒ>‡>ƒ>…>„>ˆ>ˆ>…>‡>ƒ>‡>ˆ>i>…>‡>|>ƒ>‡>Š>‡>…>‡>‡>ˆ>ƒ>‡>}>…>‡>‡>‡>>…>ƒ>‰>…>ƒ>…>…>ˆ>…>†>…>A>y>‡>c>ƒ>>X>>…>…>‰>…>†>Š>…>ˆ>‡>†>ƒ>8>->…>‡>|>ˆ>…>O>„>>‡>‰>†>{>>‡>…>>K>…>‡>…>€>ƒ>4>…>…>‡>‡>‹>„>‚>‡>ˆ>…>ˆ>ƒ>…>ˆ>†>…>…>ˆ>}>…>…>†>€>ˆ>>…>w>…>‡>S>…>>…>}>ˆ>ˆ>…>ƒ>U>>…>‡>…>‡>…>{>{>‡>‡>h>>‡>y>{>A>…>‡>ˆ>‡>@>€>‡>†>,>†>k>>€>‡>ƒ>ƒ>…>…>‡>‡>…>‡>‡>…>ˆ>;>a>‡>…>‚>‡>…>}>>>P>…>‡>…>‰>…>ƒ>…>…>…>…>…>>Š>Œ>>‰>ƒ>…>…>…>>u>‡>‡>…>†>ƒ>u>…>‡>ƒ>…>‡>†>">…>ˆ>†>ƒ>‡>ƒ>>ˆ>€>i>ƒ>„>i>…>…>‚>‡>…>…>ƒ>ˆ>>ˆ>‡>;>‰>ƒ>i>->…>…>„>€>…>ˆ>W>…>ˆ>…>‡>…>5>>‰>€>‰>…>ƒ>ƒ>…>…>ˆ>‡>‡>‡>‚>†>„>†>…>…>>‡>‡>…>ˆ>ˆ>}>I>…>†>…>…>…>>‡>…>…>‡>†>!>…>…>[=ƒ>>‡>{>‡>ˆ>…>…>…>…>‡>ƒ>‡>…>a>‡>M>€>ˆ>¿=…>‡>…>…>P>_>y>€>>…>`>ƒ>ƒ>…>ˆ>…>p>->…>ƒ>*>}>ƒ>‡>…>>ˆ>€>s>{>ƒ>…>€>,>…>‰>…>>…>‡>‡>ˆ>…>€>…>ƒ>ˆ>‚>A>‡>‰>w>…>{>…>>…>…>>ƒ>„>‰>…>*>ƒ>h>,>‰>…>ˆ>€>T>€>…>ƒ>†>†>ˆ>ƒ>‡>…>ƒ>‡>…>ˆ>…>…>‰>ƒ>„>‡>…>…>‡>„>‡>9>t>…>i>ˆ>‡>>ƒ>…>…>…>‡>…>ƒ>>€>‡>„>‡>‰>>‡>€>;>„>…>}>‡>‡>„>ƒ>ˆ>…>‰>ƒ>…>ˆ>†>ˆ>…>>‡>7>‡>ˆ>‡>{>…>‡>‡>…>‰>‡>8>‡>€>†>‡>…>…>‡>u>…>ˆ>…>‡>ƒ>†>=>ƒ>>‡>…>X>‡>ˆ>ˆ>>_>ƒ>…>ƒ>…>„>>ˆ>ˆ>‡>x>ˆ>ˆ>|>‡>‡>…>ˆ>‰>…>ˆ>3>ƒ>ƒ>>ƒ>‰>Š>…>ˆ>8>‰>‡>ƒ>…>…>ƒ>ˆ>‰>‡>{>‡>ˆ>5>…>€>…>ƒ>3>>}>‡>‡>ƒ>u>…>ƒ>†>ˆ>=>>}>ƒ>†>‹>ƒ>†>‡>‡>ˆ>‡>ƒ>]>ˆ>ƒ>ƒ>|>ƒ>A>†>>s>ƒ>ƒ>W>‡>…>…>‹>‡>‡>‹>ˆ>‡>€>…>‡>‰>ƒ>ƒ>ƒ>†>†>…>‰>ˆ>->‡>…>…>…>|>…>…>>ˆ>„>‰>…>‡>…>…>ƒ>…>}>ƒ>|>‡>ˆ>ƒ>Y>‡>€>ƒ>…>„>>…>>>‡>‡>‰>…>…>ˆ>…>ƒ>…>ˆ>x>…>†>…>ƒ>ƒ>ˆ>ƒ>ƒ>>…>‡>l>>†>>ƒ>q>ˆ>…>‚>‡>‡>`>I>+>p>>†>‡>…>…>‡>€>…>…>…>…>…>ƒ>…>„>‡>€>ˆ>‚>;>i>>‡>†>ˆ>ˆ>…>‰>>ˆ>†>…>4>ˆ>x>t>…>ƒ>‰>ƒ>…>ƒ>‚>…>}>ƒ>ƒ>‡>‰>‡>…>…>ˆ>ƒ>…>h>ˆ>x>y>?>‡>S>„>‰>y>†>M>ƒ>…>>…>p>…>K> >…>y>…>è=ˆ>…>ˆ>…>ˆ>ˆ>€>ƒ>l>ƒ>ƒ>ˆ>‡>>ˆ>‹>†>)>x>x>…>…>ƒ>ˆ>{>‡>„>ˆ>‡>€>…>†>>…>>ƒ>>÷=ƒ>‡>Y>P>…>…>‡>/>x>ˆ>…>ˆ>‚>…>ƒ>‡>…>p>‡>>‹>‡>‡>†>ƒ>ƒ>)>‡>s>\>7>|>…>…>ƒ>…>„>‡>‡>‰>…>q>C>'>„>…>‡>>0>>†>‡>…>ˆ>‡>†>†>†>…>Š>…>‡>‡>ƒ>>‡>…>‡>‡>ˆ>ƒ>…>‰>…>†>>ƒ>ˆ>€>„>ƒ>‡>‡>ƒ>‡>'>…>„>ƒ>‡>‡>†>ƒ>‡>ƒ>ƒ>„>†>ƒ>‰>…>…>…>‡>‡>‡>€>„>‡>k>‡>ƒ>…>ˆ>3>‡>…>…>…>u>…>†>t>…>ƒ>ƒ>…>>>…>ƒ>‰>>…>„>ƒ>‹>}>=>‚>ˆ>…>q>‡>i>…>‰>†>|>„>‡>ˆ>1>ƒ>}>{>…>->|>‚>†>…>‡>†>p>†>…>ˆ>ˆ>t>ƒ>ˆ>…>ˆ>…>‡>y>…>>‡>‡>Õ={>‡>‡>‡>ˆ>‹>‰>l>…>„>‰>…>‡>…>…>ˆ>‚>ƒ>…>€>g>‡>…>†>ˆ>y>‰>„>…>†>ƒ>ƒ>‡>ˆ>ˆ>‡>‰>‡>ƒ>…>…>‡>g>ˆ>†>…>…>y><>>ƒ>ˆ>‡>…>‡>…>W>†>ƒ>…>…>…>‡>…>‡>ˆ>>€>>ƒ>ƒ>>…>ˆ>,>1>ƒ>ˆ>ƒ>…>‡>‰>>ƒ>ˆ>ƒ>ƒ>…>‡>€>€>…>d>3>>7>‚>…>ˆ>…>}>…>y>ƒ>‡>…>‡>u>…>;>„>ˆ>ˆ>…>ƒ>ƒ>ƒ>ƒ>…>x>…>ƒ>ƒ>…>ƒ>…>‚>‰>>|>†>‡>G>ˆ>†>ƒ>„>‡>‡>‡>‰>†>…>e>ˆ>‡>‰>„>‰>s>‡>‡>‡>]>…>‡>‡>ƒ>‡>>Ë=c>ƒ>‡>„>‡>ƒ>…>ˆ>ˆ>‡>…>‚>‡>4>…>ƒ>{>ˆ>>‰>‡>‡>ˆ>ˆ>l>{>ƒ>m>ƒ>…>‰>†>†>…>†>‰>†>…>…>ˆ>„>‡>‡>‡>†>U=>ƒ>i>…>ƒ>…>M>†>…>ˆ>…>‰>‡>…>€>w>ƒ>…>ƒ>…>ˆ>…>{>ƒ>>…>‡>O>‡>…>‡>€>‚>{>e>ˆ>ˆ>‡>K>…>ƒ>s>‡>†>…>‡>‚>|>†>‡>†>ˆ>ƒ>„>‡>‹>ˆ>y>‰>s>…>…>ƒ>‡>ˆ>E>‹>…>ƒ>…>…>X>…>>ƒ>‡>€>{>ƒ>…>†>€>u>…>…>…>ƒ>‚>…>;>‡>>}>Y>†>„>…>…>‡>ˆ>…>‡>ˆ>k>d>0>ˆ>x>…>„>s>ƒ>‰>‡>‰>‡>ˆ>†>>…>X>‡>…>ˆ>…>…>…>…>‰>4>ƒ>7>…>…>…>>ƒ>>…>†>…>ˆ>‡>†>ƒ>ƒ>=>…>>…>‰>„>†>…>l>…>ˆ>‹>y>…>o>ƒ>ƒ>‡>ˆ>ƒ>>‡>…>‡>‡>ˆ>ˆ>…>‡>{>†>‡>w>…>…>…>D>‹>>ƒ>…>>ƒ>…>ƒ>ƒ>ƒ>‹>i>+>q>‡>ˆ>ƒ>ƒ>ƒ>>ˆ>‡>e>‡>…>ˆ>‡>…>ƒ>x>…>…>‰>>„>‡>‡>…>m>…>…>ˆ>…>…>ˆ>‡>…>†>…>ˆ>>‚>ˆ>‡>|>…>i=…>€>ˆ>p>ƒ>…>†>…>…>y>·=…>…>‡>‰>€>G>†>l>‡>…>ˆ>ˆ>Y>‹>…>>5>ˆ>‡>…>ƒ>‡>‚>…>‡>c>k>ˆ>†>;>ƒ>…>‰>>3>‹>>>>…>„>‡>ˆ>„>…>>‡>{>7>>l>}>{>‡>ƒ>…>…>‡>‡>„>‹>‡>y>…>>>‡>‹>…>…>†>Q>‰>…>}>…>‡>…>G>ˆ>ƒ>…>…>‡>…>‡>„>>…>ˆ>u>…>>…>ƒ>€>‡>‚>ƒ>y>…>†>…>€>…>k>ƒ>…>…>‡>ƒ>‡>g>‡>ƒ>ˆ>„>‡>ˆ>y>‡>…>e>‡>‰>…>@=ƒ>‡>‡>‚>t>ƒ>…>ˆ>ˆ>€>ƒ>ƒ>‡>…>ƒ>…>\>{>‡>ˆ>†>>†>>‡>ü=>ˆ>(>…>…>…>ƒ>>…>†>O>ƒ>‚>†>…>‹>…>>…>x>ƒ>‡>>ˆ>Š>x>„>ƒ>}>†>ƒ>ƒ>†>ƒ>E>‡>x>‡>„>‡>‡>…>‡>„>…>S>‚>ƒ>>‡>„>…>>ƒ>…>ƒ>‡>…>„>>†>}>‡><>c>ƒ>…>…>‡>‹>_>‡>‡>…>9>‡>‚>…>…>>>‡>…>…>‡>…>>‡>‰>I>ƒ>;>…>‰>>…>‡>„>ƒ>ƒ>9>|>Q>…>‡>‚>…>…>…>…>€>…>…>‡>€>‰>@>y>>‡>†>>…>…>ˆ>…>‡>m>„>‡>‡>‰>}>H>°=…>ƒ>€>>ˆ>‡>ƒ>‡>…>ƒ>{>ƒ>ƒ>…>…>ƒ>…>ˆ>ˆ>‡>…>ƒ>†>ƒ>…>k>>…>ƒ>/>ˆ>>…>†>í=ˆ>‡>ˆ>ˆ>†>ˆ>‡>y>†>…>€>…>…>ˆ>ƒ>‡>}>ƒ>‡>…>†>‡>€>ˆ>c>‰>ˆ>s>ƒ>‰>p>‡>ƒ>‡>†>ƒ>„>…>ˆ>…>‡>1>‡>ˆ>ˆ>‡>…>…>ƒ>(>‡>…>‡>}>…>ˆ>ƒ>‡>>>/>‡>‡>…>ƒ>>ƒ>‡>ƒ>ƒ>}>>ƒ>‡>‡>/>…>_>>‡>}>ˆ>…>{>€>ˆ>‡>…>‡>Y>‰>…>x>„><>‡>\>‡>‡>…>…>„>ƒ>ˆ>U>…>…>y>…>[>‡>…>…>…>ƒ>‡>…>‡>‰>…>‡>„>„>ƒ>„>‡>w>…>‰>,>>€>ˆ>†>ƒ>>‰>…>L>ˆ>ƒ>‰>‡>‡>‡>‡>ƒ>>…>‡>>„>‚>w>‡>ƒ>…>ƒ>Š>ˆ>€>‹>…>ˆ>>‡>\>>‡>‡>>ƒ>€>‡>†>‡>…>ˆ>ƒ>†>}>5>…>>‡>ˆ>†>„>‡>…>ˆ>ˆ>ˆ>|>ƒ>†>>ƒ>…>ƒ>ˆ>…>ƒ>ˆ>„>…>…>„>!>4>ƒ>„>…>‡>€>|>>†>…>…>…>/>‡>o>c>p>…>…>…>ƒ>…>‰>ˆ>‰>‡>…>…>ˆ>‡>ˆ>ˆ>@>…>i>…>„>h>>0>å=ƒ>ˆ>‡>i>}>(>‡>ˆ>‹>‰>ƒ>x>€>ˆ>>ˆ>‚>…>‰>…>ˆ>>‹>…>>‚>‡>ƒ>ˆ>|>‡>‡>…>„>ˆ>ˆ>3>„>‡>…>…>>…>‡>ƒ>ˆ>ƒ>‡>†>ƒ>†>‰>‡>ˆ>>y>‡>…>…>‡>‡>‡>w>†>ˆ>…>M>…>ó=…>ˆ>‡>‡>‡>ˆ>…>…>ƒ>/>E>‰>‡>ƒ>…>‚>…>h>>‡>…>‡>7>>‡>{>‡>ƒ>…>…>ƒ>>‡>†>%>€>€>>…>ƒ>…>ˆ>ƒ>s>„>…>4>€>…>q>‡>…>‰>k>€>ˆ>>ˆ>ƒ>„>…>…>…>ƒ>9>ˆ>ƒ>|>…>‡>ˆ>…>>y>…>=>>…>…>…>†>†>…>†>ƒ>…>ƒ>…>‡>…>i>‡>‡>€>ƒ>{>‡>ƒ>…>…>Œ>‡>…>…>‹>ƒ>…>ƒ>‡>I>‰>…>>‡>…>‡>…>ˆ>s>„>‡>…>…>…>„>€>‹>‡>ˆ>ƒ>ƒ>‡>ƒ>…>‡>‡>s>ˆ>>…>…>>x>…>€>`>†>ƒ>‡>ˆ>†>…>…>…>q>‡>‡>ˆ>ƒ>;>ˆ>‡>ˆ>‡>ƒ>3>‡>p>…>>l>†>>‡>ƒ>…>‡>…>†>s>…>‰>…>…>‡>…>…>ˆ>†>M>ˆ>…>‡>>‡>†>ƒ>…>†>G>8>H>5>U>…>…>„>‰>†>ˆ>>‡>ˆ>‡>…>ˆ>‡>‡>ƒ>‰>…>ˆ>…>‡>ƒ>‡>…>…>†>ˆ>‡>ˆ>u>ˆ>ˆ>|>‡>>„>…>ˆ>†>ƒ>s>…>>>…>y>†>S>=>|>‡>ƒ>‡>‰>q>‡>‡>x>E>‡>…>…>‡>…>\>‡>ƒ>„>‡>…>†>\>‡>‡>‡>ƒ>‹>…>…>„>)>ƒ>ƒ>ˆ>8>…>‡>…>…>x>‡>‰>"=|>…>†>ƒ>‡>†>‰>a>‡>ƒ>…>†>ˆ>…>…>‰>…>‡>„>…>{>…>†>†>‡>>…>#>‡>‡>‡>…>ƒ>‚>ƒ>‡>>ƒ>‡>…>‡>‰>…>‰>E>…>…>ƒ>…>u>->…>…>‡>ƒ>…>ƒ>>ƒ>…>…>‡>†>u>ˆ>†>>ˆ>c>>ƒ>ˆ>…>…>‚>…>‡>ƒ>…>‡>‰>‡>‡>ƒ>‡>…>…>‡>>S>ƒ>‡>ƒ>…>ƒ>‰>…>…>‡>‡>…>…>…>‡>‡>‡>…>…>{>…>ˆ>…>…>>†>‰>y>†>‡>…>…>€>>‰>ˆ>„>‡>†>‚>p>„>†>}>‡>…>…>‡>€>‡>…>…>‰>‰>ˆ>>ˆ>#>ƒ>>ˆ>ƒ>ˆ>…>†>€>†>„>>†>…>‡>=>ƒ>‰>k>…>…>…>y>…>‰>3>ƒ>Û7…>…>ƒ>‡>‡>‡>G>>ˆ>…>>>†>…>ƒ>‰>>ˆ>y>U>…>…>‚>†>‡>…>ˆ>p>‡>>ƒ>>>…>h>3>>H>ˆ>‡> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/5.0 new file mode 100644 index 0000000000000000000000000000000000000000..f60ba20b6a24b5c17e77c47bb8b23b59577305ad --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/5.0 @@ -0,0 +1,2 @@ +Œ>>>>->>“>>‘>>€>”>•>>•>>>•>>“>‰>‘>•>7>>>—>c>‘>0>•>>‹>•>•>>‘>|>‹>>p>—>/>ˆ>>Y>“>}>>”>9>—>8>>>”>>‰>”>1>“>‹>>”>>”>“>>>”>>“>•>‰>‡>“>“>•>”>’>‡>o>,>”>”>‘>>&>“>‘>•>>>“>>>“>‘>’>—>’>”>%>#>‘>>‘>>‘>—>‘>‰>>”>>>“>“>>Ž>‰>•>“>‘>”>>>‘>>>“>•>‰>ã=‘>ˆ>>‘>”>>s>>•>Œ>>–>>…>>“>>Œ>>>“>>‘>•>‹>>u>ƒ>›>‰>“>@>u>•>k>•>“>•>‘>>y>y>•>•>>…>q>’>“>Œ>…>“>>‰>’>”>€>”>—>ƒ>,>”>“>Œ>”>>>“>‹>”>>{>•>”>‘>‰>‘>“>>™>“>>‹>‘>“>–>Ž>“>“>Œ>“>>y>>ˆ>’>…>•>•>‘>“>”>“>‘>‰>>“>”>—>‘>‘>>>Œ>>”>–>p>“>>q>>—>”>>•>>“>“>>…>•>`>“>>‰>Ž>’>“>“>“>>‘>“>>”>“>3>•>”>Œ>•>“>•>>•>ƒ=Ù8”>“>…>>‰>“>\>–>ˆ>&>˜>>”>“>>“>ˆ>“>W>—>‰>‘>,>>>‘>‡>‘>h>“>Œ>>“>y>“>‘>‰>…>‹>–>>“>‘>>>‘>‘>ƒ>>—>“>>>‘>”>>ˆ>>‹>‹>”>>‘>>’>>>‹>‘>>“>>“>>“>…>>‘>”>‹>w>ˆ>—>>•>>>€>>”>>‘>d>>W>–>>{>’>”>>‘>‘>‹>>‹>‹>ƒ>•>‘>”>—>‘>ˆ>Œ>‘>’>”>%>‰>>>>‘>>>‘>‡>‹>Ž>}>•>|>‘>“>•>>”>>0>>“>w>‘>>‘>•>“>”>“>‰>>&>>>>“>“>>‘>”>>p>>†>>“>‹>•>“>”>•>>>•>•>>‘>H>‘>>‰>“>”>>‡>Œ>“>”>•>!>ƒ>>Ž>”>‘>•>•>>‹>‰>”>>>Œ>>‘>‘>>“>ˆ>“>•>•>>‘>‘>>•>’>”>”>Ž>“>”>‘>“>P>>>>“>@>…>>‹>>8>“>‘>‘>•>Ž>>•>>“>>Ž>,>“>‹>Ž>—>“>>>“>>>>>>’>ƒ>”>Š>3>>">‘>Œ>‹>‘>>‘>}>>“>‘>‡>•>‘>“>“>—>“>…>‹>>•>>™>“>‰>‰>>>X>>—>€>>>ƒ>>&>‰>…>‘>“>“>>‘>‘>3>“>“>>•>‹>‹>‹>“>–>>”>ƒ>•>—>>ƒ>Ž>>ˆ>‘>“>“>;>>•>>u>>>>ˆ>‰>“>”>‘>>“>‘>“>>‹>”>>{>>‘>“>“>>>‰>•>>‰>“>E>”>‹>>e>„>•>>”>>>>‹>>l>”>>‘>“>3>“>‘>>>t>>>—>>>‘>w>‹>>>“>>>“>>>’>”>‘>‘>>9>“>•>>’>‘>q>“>•>“>—>>‘>‹>—>“>S>X>‘>“>‹>‘>‘>‹>>“>“>•>ˆ>‘>“>’>K>>>e>‡>>”>>ˆ>‰>•>…>`>>>‰>>‡>>“>“>“>h>>p>>‰>•>”>>>“>…>‘>“>–>”>•>ˆ>‘>„>‹>>‘>‡>“>>i>Ž>‘>“>”>>“>‰>–>—>‘>‘>Š>>‘>‘>”>Ž>>‘>“>“>>>”>“>‘>’>•>—>•>‘>”>>‡>>Ž>‘>‹>”>>“>k>[>“>‘>>`>“>•>‘>“>>“>>>…>Œ>“>>…>—>“>“>‘>“>>‡>“>>’>>>>“>”>”>>D>>”>>†>˜>>(>“>’>>>>—>“>>W>‘>˜>>’>H>’>•>>H>“>“>“>–>“>˜>Œ>‡>•>>‘>•>>s>“>“>•>‘>’>>Ð=‘>”>>’>‰>“>“>W>>“>‹>Œ>ˆ>>‘>“>>‹>”>•>”>‘>•>Œ>’>‰>>_>>g>s>>Ž>”>‘>‰>‘>>>”>“>>>A>>”>>‘>ˆ>>|>”>>“>>>”>ˆ>‰>x>—>c>„>‹>‘>–>>•>“>”>…>“>>>“>K>“>…>>>”>•>“>”>‹>‰>->“>)>…>“>>†>•>‘>‘>“>‘>˜>”>_>>ˆ>‘>>>”>Ž>“>E>‘>”>c>—>>>>‘>‘>>‹>‡>‹>>‘>—>›=”>>•>>”>“>‘>>‡>‘>m>•>•>•>“>>–>’>—>E>>‘>>>–>Œ>“>•>‘>“>”>”>\>>>>‹>“>k>Œ>>>“>>>“>“>_>’>>“>>y>>‘>’>“>‹>‹>”>‘>>”>Ž>>”>>—>e>'>“>“>‹>>•>>•>‡>•>>>‰>>>”>p>“>m>‘>>“>q>“>\>‘>‹>“>•>‹>Œ>”>—>“>‘>“>>’>•>…>ˆ>d>>Š>“>Ž>>‘>>•>“>‘>“>ý=>>“>”>…>…>Ž>—>’>‘>‡>“>>”>>>€>‡>“>‹>`>‘>“>’>‘>•>&>>>>>>€>>“>“>“>>k>ˆ>‘>‡>‘>>ƒ>{>•>7>i>>•>>“>—>•>“>“>‘>•>”>>“>”>Œ>”>“>k>‘>Œ>“>G>“>‘>>‡>—>>”>“>>>’>•>’>>>“>‰>‚>“>>”>‘>…>>Q>”>&>”>p>‘>•>…>“>>‹>“>>‘>>“>‡>>Ž>”>”>ˆ>>“>“>”>>”>>‰>@>‘>‹>–>”>ˆ>‰>—>>•>á=>—>”>‡>“>“>‘>Œ>“>˜>—>>“>“>”>}>‘>‰>•>‘>‡>Ž>“>y>>‘>•>”>“>‹>>€>•>‹>>>“>“>>‡>>‹>•>”>–>“>“>•>>>’>>‘>•>>>>”>‰>“>“>>‘>—>”>ˆ>“>k>‘>>>0>‘>‡>>>‹>“>p>“>‰>‘>>>>U>>>Œ>’>>Œ>>—>“>>”>>•>3>‘>—>“>“>–>…>‹>Œ>>ˆ>>>>>Ž>‘>Ž>’>‘>>“>‘>&>“>E>“>Š>“>>’>>•>q>>“>”>>>>Ž>‘>‘>•>‘>>>“>>“>>“>“>”>>>‘>“>”>‘>‹>>“>“>x>‘>ˆ>‘>€>>‘>‹>p>e>P>†>Œ>>H>•>•>>‹>”>‰>”>’>>”>€>>“>“>‹>E>‘>‹>—>{>—>ˆ>>>l>>D>•>”>“>X>”>‘>•>˜>‘>“>‘>&>•>>–>>“>‹>“>>“>•>>’>‘>’>•>p>>”>ˆ>Ž>’>“>“>>‘>—>“>“>‘>†>>“>”>”>Š>>“>”>“>>“>”>“>>>>K>€>•>t>>>k>“>‘>‘>“>“>•>“>>”>–>‘>>%>0>>–>ˆ>•>>S>>>”>“>”>‡>‹>”>–>>Q>’>•>“>Œ>>0>>“>‘>•>•>>>“>•>•>“>‘>>•>>>“>‘>…>‘>‘>>‹>“>>—>„>“>“>W>>‹>‘>…>•>”>‡>‹>Y>ˆ>‘>“>‘>“>•>ƒ>…>’>>w>0>‘>Œ>‹>4>“>”>•>—>X>ƒ>•>>>‘>ƒ>>‡>”>>>>>•>”>“>”>”>“>”>5>q>“>–>‡>—>‘>†>1>‰>[>‘>’>’>“>‘>‹>“>>‘>”>>>“>—>‰>—>‘>“>‘>‘>>…>‘>>>‘>>>”>>>‘>“>>8>’>•>‘>‹>“>‘>‡>“>‡>s>“>>w>“>‘>Ž>—>‘>>>“>‹>“>•>4>•>>€>1>•>>>>>“>l>‘>“>—>”>‘>(>‰>“>†>•>>Œ>Ž>>“>“>’>“>‘>>”>‘>”>“>‘>“>“>“>>>•>‹>e>>”>>“>‘>Ž>“>“>‘>>>>“>’>ñ=>>•>…>‘>—>>>‘>‘>“>>>‘>m>“>S>Ž>•>>>‘>‘>”>Q>p>‰>‡>‘>•>a>>>>•>•>€>A>>‰>&>‡>>‘>•>‹>•>>>ˆ>>”>‹>/>‘>•>>>‘>>”>”>>‹>Ž>>‘>>>”>•>‰>>‡>>‰>’>>ˆ>“>‹>”>>>Ž>{>8>—>>>>Y>‹>Ž>>•>‘>”>“>‘>“>‘>˜>—>•>“>“>•>>>”>>˜>>“>“>>ˆ>>„>“>–>‹>>“>>‘>–>>>>>>>“>’>‰>‘>‹>+>‰>>…>”>“>Œ>Ž>•>”>•>”>•>“>“>”>”>>’>$>•>“>”>‡>Ž>•>‘>‘>‘>•>>Ž>>”>‘>“>>‘>ƒ>‰>•>>‘>>‘>=>Š>‰>‘>>(>“>•>•>>a>“>”>‘>“>—>‹>“>‘>“>‰>˜>•>‡>‘>”>“>“>—>>>A>>>>‰>•>“>>>9>”>“>>>‘>‘>>‘>‘>>>“>0>‘>>>>>‹>‹>‘>”>‰>…>>>”>>>‰>Œ>>’>“>>“>>>“>>>u>>Œ>”>>“>@>“>Š>>•>>`>•>‘>“>—>”>>”>”>’>ˆ>‰>‘>•>>>‘>”>“>‘>“>“>#>•>‘>“>>†>>“>‹>“>>“>“>”>>”>“>•>ƒ>“>‡>‘>•>>[>”>>>‘>‘>’>“>>‹>•>“>•>‘>“>“>>Ž>“>>€>’>•>>>‹>•>>>>>’>y>Œ>>‹>>>•>>>‘>•>`>K>>>>‘>•>—>’>•>ˆ>‘>“>>>>‹>>>“>‰>—>>H>x>‹>—>“>‘>“>’>•>‰>>>>G>•>>ƒ>>>‘>>>“>>•>‰>‘>‹>”>“>•>—>>•>>“>w>‘>ƒ>>O>>Q>>•>‡>>I>>•>‹>>w>”>W>9>“>ƒ>>>”>“>˜>‘>•>“>Œ>>…>‘>‘>‘>˜>>“>—>•>!>…>‡>>“>‘>“>‰>•>“>“>”>‹>‘>‘>>“> >>‘>õ=‹>‘>i>k>•>“>>=>…>—>“>•>Œ>•>>>“>}>‘>“>•>”>‘>>>>1>”>ƒ>m>5>‡>“>˜>‹>>“>“>Ž>—>‘>Œ>D>3>•>>>>0>>‘>“>‘>‘>’>”>>>‘>‘>‘>•>”>‘>>“>‘>‘>‘>–>‹>‘>”>>’>ˆ>>“>Œ>>>Œ>”>>•>>>‹>‘>‘>‘>>>‘>>“>>•>>”>“>>>“>“>“>‡>Ž>‘>€>—>’>>“>3>‘>“>>>…>“>“>>‘>“>>’>>>“>‹>”>>”>‹>‰>—>…>Q>>•>‘>…>’>€>—>—>>‡>Ž>“>“>%>>ˆ>ˆ>>>‰>Ž>‘>>“>•>ƒ>>‘>‘>‘>…>‘>‘>>>Š>>‡>‘>‰>‘>”>>>”>>‘>’>•>•>p>Ž>’>”>>•>•>‘>•>‹>>‘>‰>l>>‘>Ž>‘>{>”>‘>>”>>>>”>‘>>“>•>>’>”>“>k>‘>•>>>ˆ>C>>Ž>•>>Ž>>>]>>‘>–>>“>’>>‘>“>ˆ>Š>‹>>>>’>”>+>5>“>•>‘>>”>—>‰>‘>’>>>>—>>‹>Œ>{>;>>8>>>“>>€>“>„>ˆ>”>“>>ˆ>‘>$>>”>“>•>‘>‰>>‹>•>…>‘>>>>‘>>“>–>Ž>ƒ>•>”>D>’>•>‘>>”>‹>>“>>>y>“>•>•>Ž>“>}>>”>>i>‹>>>>“>>>d>>“>‘>•>>‘>“>“>–>“>>—>*>>”>…>—>>•>•>”>”>—>s>‡>‘>u>‘>“>•>“>‘>>“>•>>“>“>‘>>“>>•>•>µ=>>o>>>>\>“>’>”>“>“>“>“>‹>‡>“>>>”>”>•>…>‘>#>>“>O>>“>“>>>>h>•>“>‘>W>“>‹>€>•>“>”>‘>>>“>“>”>”>”>>”>•>‘>ˆ>”>…>’>—>>“>•>C>•>“>>>“>U>>>•>>>„>‘>>•>…>€>’>>‘>“>>‘>1>•>‡>‹>]>>>>’>‘>•>‘>•>‘>€>e>H>“>…>>>ƒ>‘>—>”>“>”>>>>>]>”>“>“>“>>>>“>/>>0>>>‹>‰>‘>>>”>“>–>>“>‘>’>5>‘>Œ>‡>“>>>>{>•>•>•>>>€>‹>‰>‘>—>>‘>“>”>•>—>”>“>>—>ˆ>“>–>†>“>‘>•>G>•>‹>‘>“>>>“>>Ž>Ž>—>ƒ>(>>“>•>‹>’>‘>>–>“>h>’>“>•>”>‘>>…>>“>•>Œ>>“>•>•>>>”>“>’>‘>”>‘>—>’>‘>’>“>>’>“>‰>“>Ý=>…>–>p>>“>•>•>‘>…>õ=Ž>‘>>“>>G>>o>“>”>>“>u>•>•>‹>#>—>”>”>‘>”>‹>“>>`>s>“>”>">>”>•>>\>“>‰>>‰>>“>‘>”>”>>‹>“>…>Y>>{>‹>ˆ>™>>•>•>“>>’>‘>“>…>>>>“>—>>“>”>U>—>>‹>“>“>•>C>•>Œ>‘>“>‘>’>“>>>Ž>—>>‘>>>>…>‘>>>…>”>>>…>“>p>>“>>•>>“>e>“>>–>‘>”>“>‰>Œ>>}>“>‘>>È=‘>“>>ˆ>ƒ>Ž>“>“>“>‰>’>>‘>‘>>”>y>…>‘>•>”>Œ>>‹>•>&>‹>>->’>‰>‘>>’>“>>o>‘>>>“>“>“>>>‚>”>“>>>“>ƒ>>>Œ>“>Ž>>‘>>@>”>…>“>”>”>“>‘>•>>>\>>‹>>“>‘>‘>>>>>•>“>>>>ˆ>—>W>w>‘>‘>‘>‘>”>i>‘>>‘>,>”>>>“>‰>>‘>>•>“>>A>—>•>S>>9>>”>Œ>“>‹>“>>>>†>k>>”>‡>>>‘>“>>>>‘>‰>“>I>>>>>>”>”>>‘>”>}>>“>“>•>…>C> >“>>Š>>•>’>>>”>‘>†>’>Œ>>>Ž>‘>•>•>”>‘>Œ>—>•>•>ƒ>ˆ>‘>>>“>>>“>>•>”>“>•>•>•>“>‹>>”>ˆ>>>’>‘>>…>•>“>>“>“>Š>“>h>”>—>€>‹>”>|>“>“>•>“>‹>>“>”>>“>?>—>•>•>‘>‘>”>>1>‘>Œ>“>>>•>‘>‘>‰>Š>->’>“>>>>>•>>>‰>Œ>‘>‘>‘>)>”>u>Ž>“>…>•>“>‰>…>“>‘>>“>h>”>‘>ƒ>>&>>c>>•>>“>>>“>`>>‘>‡>>c>‘>•>“>”>“>>‘>”>“>“>“>“>>Ž>“>‘>…>Ž>•>G>‹>„>“>>>‹>—>’>o>‘>>•>”>>‘>“>>‘>>>>>>ƒ>”>‘>>‘>”>’>>˜>‘>‘>>’>e>‹>”>“>Š>“>‹>>“>>>‘>>”>ˆ>&>Œ>>>“>”>•>“>‘>”>”>•>ˆ>‘>“>‡>“>—>>—>“>>‘>‘>>“>‘> +>&>>•>>“>‰>Œ>Ž>”>‘>•>>!>“>†>i>>‘>>”>>>“>•>•>”>•>>“>“>’>>/>—>„>>Œ>ƒ>>8> >>•>>w>‰>%>‘>“>‘>“>>ƒ>>•>—>—>>•>‘>>‘>>•>“>ƒ>‰>“>Ž>“>…>—>”>“>>>•>>•>˜>”>”>>“>•>Œ>“>>>•>>”>‘>”>>>‡>‘>>“>—>>’>ˆ>>”>‹>d>“>$>>•>”>“>“>“>‘>>>/>5>”>“>’>>‹>‘>i>‹>“>>”>8>‡>“>…>“>‰>>‘>>>>”>%>‹>‹>ˆ>“>>—>•>‹>ƒ>”>>0>†>>}>“>‘>”>p>Œ>”>‘>”>‘>‘>>•>>Œ>4>>>>‘>•>”>>>‹>‘>'>>>>>“>‘>‘>”>>“>‹>>>‘>}>“>‘>>>…>•>>‘>“>‘>“>’>’>‘>‘>—>>“>5>”>>‹>“>>“>>“>}>>‘>‘>>>‹>‹>‘>>’>>>‘>>•>•>“>>>‰>”>>>s>‘>‰>u>>>“>>”>>“>’>t>“>“>>>->‘>—>‘>•>>,>‘>{>“>Š>y>>‰>•>‘>”>>”>”>‚>>•>“>”>—>“>>•>>K>‘>”>•>Ž>•>>>’>‘>S>9>U>>\>‘>“>•>›>’>“>>‘>“>“>>—>“>—>>•>”>˜>“>”>“>—>>”>Ž>“>•>“>€>•>“>‰>“>>>>•>>>ˆ>“>‹>‰>>ƒ>”>U>>ˆ>“>>Ž>“>{>‘>“>‡>K>“>>“>’>”>g>“>>‹>>˜>>t>“>‘>˜>‘>•>‘>>>,>>>”>L>“>’>”>—>€>•>—>Ç=ˆ>>“>>•>‘>•>w>>“>“>>“>‘>>˜>’>’>“>’>‡>‘>–>“>‘>‹>Ž>1>“>”>”>>‹>>>Ž>>“>‘>Ž>•>“>>“>I>>>>>Œ>0>•>‘>“>>>”>#>>‘>>—>”>>—>“>Ž>”>s>“>Œ>“>>“>>”>>>“>’>—>“>‘>>”>‘>>”>Œ>o>‹>•>>>>—>’>‘>’>>>“>>>‘>”>>”>‹>“>”>>Ž>‡>>—>ƒ>“>”>>”>‰>Œ>”>•>>“>>>€>”>‘>>•>‘>>“>>”>—>>—>”>•>Œ>“>#>>…>‘>>“>‘>•>‹>“>>>–>”>•>>>”>u>‘>•>‘>ƒ>—>“>>’>µ7>’>>>‘>•>_>‘>•>“>>Ž>‘>“>‘>“>‹>’>‹>c>“>‘>‘>‘>”>>’>>‘>‰>>>>>t>>>[>‘>Ž> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/6.0 new file mode 100644 index 0000000000000000000000000000000000000000..f035964416bab6f0a9863b5c58ce87c588950e18 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/6.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/7.0 new file mode 100644 index 0000000000000000000000000000000000000000..fe1e68097a9e4c20c2351468196e6c7c58075a2f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/7.0 @@ -0,0 +1 @@ +”>—>œ>”>9>™>™>–>‘>—>>Ÿ>œ>—>œ>–>”>œ>Ž>œ>>š>˜>h>>>—>c>˜>=>œ>™>>˜>˜>‘>™>>Ž>—>l>œ>W>„>˜>]>”>ƒ>>—>d>Ÿ>Q>–>“>•>‘>‰>›>I>œ>“>˜>™>™>œ>—>”>‘> >>™>—>>‡>>—>›>™>™>€>ƒ><>™>œ>›>›>;>œ>>˜>“>“>•>›>—>œ>˜>>¡>œ> >A>8>ž>—>—>™>›>>™>>>œ>“>•>>˜>—>š>‹>–>“>˜>˜>™>”>Ÿ>˜>”>—> >>K>Ÿ>ˆ>“>™>˜>˜>>”> >‹>’>ž>|>ˆ>™>œ>„>˜>>“>™>•>›>˜>>˜>q>>‘>ˆ>“>P>u>›>m>>˜>¢>™>’>y>e>—>˜>•>…>m>—>›>—>>›>•>>›>Ÿ>}>›>š>>E>›>™>—>œ>5>˜>œ>>˜>–>€>Ÿ>Ÿ> >‹>œ>—>%>£>•>—>>›>> >—>>˜>>>‘>{>œ>‹>–>>œ>–>˜>Ÿ>›>˜>š>‰>–>›>™>>›>™>—>‘>—>“> >¥>>œ>™>u>‘> >œ>•>œ>—>™>œ>‘>>>e>™>™>>•>—>š>œ>›>—>“>™>œ>œ>œ>I>˜>Ÿ>–>˜>˜>£>˜>œ> >á=˜>™>‰>Ž>Ž>›>c>¡>>D>¡>—>œ>™>‹>›>‡>œ>>¡>Š>¡>G>ƒ>>—>ˆ>™>h>™>’>“>”>…>˜>™>‹>‰>>˜>—>“>™>™>€>œ>œ>‰>—>>—>—>>œ>›>>>™>ˆ>>™>•>>“>œ>š>”>‘>œ>š>¡>—>‘>>œ>‡>‘>—>œ>>‰>>œ>—>>”>“>ˆ>—>>˜>—>d>>y> >’>l>›>>˜>˜>›>—>‹>’>>>œ>˜> > >™>•>Œ>>Ÿ>•>H>…>•>œ>>˜>“>>>ˆ>˜>›>>˜>}>œ>•>™>‘>™>“>L>—>›>€>›>‹>œ>˜>•>›>–>‹>˜>E>˜>–>>›>™>–>˜>™>>{>›>>—>>—>›>œ>¡>”>˜>™>¡>œ>‘>>S>›>—>>˜>œ>•>‰>>—>™>œ>=>…>˜>—>>—>˜>£>Š>ˆ>>—>—>˜>‘>‘>™>>˜>˜>‰>”>¡>Ÿ>œ>—>™>7>˜>œ>›>Ÿ>‘>˜>›>Ÿ>›>X>•>—>•>œ>E>‰>˜>>“>H>›>‘>™>>Ž>C>Ÿ>‘>™>•>‹><>˜>>–>>>—>—>•>t>˜>‘>Ž>—>”>ƒ>›>>P>›><>œ>‘>>—>“>˜>{>‘>œ>˜>>œ>™>œ>>™>˜>ˆ>–>‹>™>>œ>œ>>”>›>œ>€>>ž>‘>>—>…>—>;>‹>ƒ>›>™>Ÿ>•>˜>—>‰>œ>œ>š>¡>>‹>–>Ÿ>Ÿ>—>›>{>”>>”>‡>”>™>>˜>–>˜>T>˜>ž>—>|>—>˜>“>>>—>£>›>5>>>•>˜>Œ>>Œ>‡>—>œ>›>Ÿ>“>”>Œ>™>™>>“>O>—>’>>g>Ž>œ>—>—>>“>•>•>˜>x>¡>”>™>œ>a>—>™>œ>™>k>”>5>>—>˜>˜>x>>>˜>—>‘>›>œ>‘>—>>¢>–>—>>g>œ>™>™>˜>›>s>“>™>œ>“>•>›>>›>›>\>U>¡>š>>œ>œ>>•>œ>›>>‘>”>›>œ>L>˜>>s>>—>›>œ>>‰> >ˆ>X>“>›>”>—>Œ>˜>˜>Ÿ>>s>˜>p>G>“>ž>›>>>œ>‡>>•>>˜>œ>™>>>“>˜>œ>ˆ>š>˜>x>“>—>—>>•>™>Ž>›>™>œ>”>Œ>™>•>•>>š>˜>’> >˜>—>>”>>£>œ>›>›>> >™>>‰>•>‹>—>>š>–>>i>`>œ>›>™>{>”>>—>—>•>›>™>•>ˆ>>œ>‡>‰>›>œ>˜>œ>•>™>>˜>•>™>™>‘>”>˜>•>Ÿ>—>`>›>›>˜>> >”>T>–>™>“>’>•>>•>˜>l>—>¡>>™>a>œ>œ>>W>›>›>Ÿ>œ>—>¡>>‰>œ>š>“>>›>p>˜>—>œ>˜>™>7>G>—>˜>˜>”>“>˜>›>Y>•>›>“>>>—>>—>˜>>Ÿ>Ÿ>›>š>>‹>›>Š>—>}>‘>i>y>•>‘> >“>>›>—>> >›>•>—>H>—>˜>•>—>Š>Œ>‹>š>˜>™>“>•>>•>ˆ>{> >k>>“>•>—>3>›>˜>—>‰>>>>—>U>œ>‡>P>˜>˜>›>¢>—>“>œ>8>—>T>…>¡>—>ˆ>>•>˜>œ>™>>™>q>›>‹>>”>—>—>“>˜>a>™>›>e>>>˜>•>›>Ÿ>“>‘>‘>Œ>“>–>>%>œ>”> >—>œ>—>—>“>‡>—>l>š>›>˜>™>˜> >™>¡>m>˜>™>•>> >‘>˜>>™>›>˜>>p>•>‘>9>>œ>q>˜>>—>–>“>•>™>™>p>Ÿ>•>œ>˜>q>—>>–>œ>•>‹>¡>™>‘>˜>—>E>Ÿ>—>œ>{>8>˜>”>>“>™>—>›>‰>Ÿ>›>…>„>->€> >>œ>e>“>>>‡>£>[>—>>˜>¡>>“>™>¡>œ>—>Ÿ>œ>š>¡>„>ˆ>h>‘>>›>>–>œ>˜>¡>›>›>—>8><>‘>˜>œ>†>‚>’>¢>™>›>„>›>™>˜>“>’>‘>…> >>o>”>>•>š> >m>œ>—>—>“>œ>y>–>˜>˜>œ>›>€>>˜>‡>›>˜>‡>Œ>“>S>]>>>†>˜>£> >Ÿ>–>›>œ>™>>›>˜>˜>“>•>h>˜>”>>L>™>—>“>>Ÿ>—>¡>—>>‘>‘>Ÿ>’>“>>ž>>‰>>‘>Ÿ>™>‡>>U>˜>P>›>p>™> >‡>˜>“>Ž>˜>˜>‘>“>œ>>˜>˜>¡>›>”>›>›>œ>Ÿ>˜>œ>>‰>[>™>•>œ>•>>>¥>)> >3>u>ž>›>‰>—>œ>˜>•>>›>>>™>—>>}> >>>š>Œ>˜>š>…>›>˜>œ>—>œ>>”>…>–>‘>>”>>›>Ž>„>“>>œ>™>˜> >š>›>>—>—>>œ> >”>Ÿ>“>™>‹>˜>•>˜>—>Ÿ> >‰>˜>|>›>“>„>P>—>>˜>‡>>—>k>™>>™>—>œ>™>p>”>“>“>™>—>œ>™>Ÿ>›>—>˜>‘>ž>C>›>›>—>˜>™>>>>˜>Œ>˜>—>˜>—>>™>”>œ>™>¡>˜>›>\>“>`>˜>>›>“>™>™>œ>y>—>™>™>›>—>|>>™>˜>›>™>“>˜>—>™>›>—>œ>™>œ>>—>›>˜>›>Ÿ>Œ>—>›>ž>{>>‰>•>‹>“>•>>s>e>W>ˆ>‹>˜>S>›>œ>˜>‘>‘>Ž>>—>‡>Ÿ>…>’> >™>>M>•>>™>€>™>•>>•>s>•>X> >œ> >Y>>•> >Ÿ>—>>—>K> >˜>™>™>”>>›>’>•>œ>—>•>˜>›>œ>s>˜>Ÿ>“>—>š>£>œ>™>—>¡>™>˜>œ>€>›>›>¡>›>ˆ>“>–>™>œ>“>ž>œ>>‘>˜>›>p>‡>˜>†>˜>>y>—>œ>•>•>˜>™>Ÿ>™>œ>ž>™>™>;>M>•>>‰>˜>›>\>–>˜>›>˜>›>ˆ>‹>Ÿ>œ>‘>X>˜>˜>œ>”>>H>š>œ>—>Ÿ>›>>”>œ>Ÿ>™>—>˜>˜>™>›>˜>¡>˜>‹>™>¡>•>•>—>•>>‡>š>˜>X>‘>™>—>…>¦>˜>…>>Y>‰>—>›>œ>˜> >|>‰>›>˜>ƒ>[>—>œ>‹>;>™>>š> >>ƒ>Ÿ>™>0>›>‡>>ƒ>™> >”>>™>›>>œ>š>¡>›>›>K>ƒ>™>¡>Œ>˜>˜>ˆ>q>>h>>™>š>>™>>™>”>œ>™>>˜> >›>‰>œ>“>™>—>˜>I>>—>™>”>Ÿ>’>…>›>˜>™>˜>›>•>s>˜>Ÿ>Ÿ>> >—>ˆ>™>…>k>™>•>x>˜>˜>•>•>™>›>”>›>’>—>œ>C>˜>”>y>_>›>>—>“>‘> >>•>œ>>Ÿ>™>E>‰>˜>>œ>•>”>“>”>•>›>”>›>—>•>¡>›>›>’>>“>™>™>—>›>•>>>™>˜>•>œ>˜>˜>—>—>>—>•>K>œ>›>]>‘>Œ>œ>‚>—>œ>˜>‘>—>—>™>—>™>—>q>˜>[>>Ÿ>9>”>•>—>Ÿ>Y>€>‡>>“>Ÿ>i>>œ>‘>œ>•>>>>>=>>>˜>™>•>›>˜>„>ˆ>—>œ>“>H>˜>˜>—>>™>“>–>›>“>>>˜>—>‘>8>>™>>›>‰>‘>‹>”>‘>>™>‰>™>—>1>‘>m>K>™>•>œ>•>Y>>”>•>Ÿ>œ> >›>—>˜>—>™>š>›>œ>•>›>•>>›>“>>˜>˜>—>0>”>œ>“>™>>>˜>œ>—>•>œ>—>•>”>“>™>‹>›>—>‘>™>‘>H>‰>—>‹>›>Ÿ>“>“>>˜>Ÿ>–>Ÿ>š>¡> >›>“>>@>›>œ>Ÿ>Œ>”>—>™>—>›>Ÿ>1>”>‘>œ>˜>˜>•>>}>‘>œ>“>—>™>œ>S>>‹>”>š>g>›>˜>Ÿ>>d>—>œ>™>˜>œ>>™>¢> >>¡>œ>…>“>œ>–>œ>Ÿ>™>—>P>“>”>›>‹>›>˜>˜>›>U>£>›>—>—>œ>˜>”>›>™>‘>—>œ>E>—>“>–>’>!>—>‹>œ>˜>‘>>“>‘>˜>˜>>>•>š>›>™>”>Ÿ>>>›>›>–>‘>—>“>˜>>˜>]>™>>>›>>h>Ÿ>›>”>Ÿ>™>™>”>™>>Œ>>‘>—>‰>–> >˜>˜>›>œ>›>?>>—>Ÿ>”>ˆ>˜>˜>>œ>’>›>œ>>•>˜>—>Ÿ>…>–>‡>—>›>>[>™>”>‹>>—>“>˜>‹>> >Ÿ>>•>>œ>˜>—>–>œ>>˜>™>—>”>“>œ>š>™>—>›>—>q>>˜>‘>˜>>>—>–>˜>¥>i>U>->…>”>™>œ>¡>—>>…>™>˜>“>•>˜>>—>•>™>“>œ>“>q>y>’>¢>™>›>œ>˜>›>>™>˜>“>>˜>€>‰>—>›>›>>™>š>>•>‡>—>—>›>›> >ž>›>£>”>—>y>™>…>…>p>’>U>Œ>¥>‰>˜>P>›> >>›>}>”>‚>l>œ>‡>—>A>£>Ÿ>Ÿ>š>¡>—>>”>Š>—>™>œ>¡>”>œ>™> >8>…>ƒ>—> >—>œ>…>œ>™>™> >‰>™>—>‘>•>8>”>’>!>‘>•>ƒ>…> >›>˜>W>“>>—>>—>›>”>”>œ>{>™>—>Ÿ>¡>™>>“>“>S>›>Œ>t>@>>•>Ÿ>“>“>™>›>“>›>œ>™>Q>]>>>>‘>8>‘>œ>>™>š>œ>—>˜>™>™>—>—>›>¡>>>>‘>¢>•>˜>“>™>•>™>˜>>”>Ÿ>‹>”>•>>›>š>˜>;>—>>›>š>˜>”>›>˜>”>˜>™>>‘>Ÿ>œ>Š>›>—>œ>›>’>—>›>…>¢>™>›>˜>I>˜>•>˜>”>…>Ÿ>œ>…>—>˜>˜>™>”>>›>‰>—>—>—>“>ˆ> >>|>”>˜>œ>>›>>Ÿ>™>™>‡>”>¤>Ÿ><>™>‡>Œ>—><>Ž>‹>œ>Š>›>—>ˆ>“>œ>œ>—>>˜>š>›>˜>‰>•>>œ>>›>ž>k>{> >™>–>œ>>›>w>˜>™>˜>>›>¡>£>™>”>—>›>>i>‘>œ>—>–>x>™>™>—>™>”>™>˜>›>Ÿ>•>™>>“>>›>Ÿ>a>—>>—>›>‰>c>>“>œ>—>•>›>™>o>•>—>™>˜>›>œ>˜>>—>…>•>>—>>—>œ>“>I>S> >¡>Ÿ>”>™>¡>•>™>œ>“>“>˜>>>”>‘>‰>O>>D>”>˜>>™>{>™>}>>—>Ÿ>”>˜>—>A>—>œ>Ÿ>›>›>>–>>™>ƒ>—>•>>˜>Ÿ>›>›>™>—>€>›>œ>S>œ>>“>–>™>—>œ>™>>“>>Ÿ>›>¡>˜> >{>>—>—>i>‹>•>—>“> >“>]>`>‘>›>œ>›>™>™> >¡>>¥>•>™>E>•>œ>‹>Ÿ>•> >>œ>œ>›>q>ƒ>™>m>—>–>>˜>—>™>>Ÿ>˜>›>™>œ>“>>™>Ÿ>˜>?>”>•>ƒ>”>—>”>w>ž>›>˜>™>—>™>>•>>›>—>—>œ>˜>œ>>˜>_>“>›>Y>”>“>›>>“>w>h>œ>›>˜>s>š>”>y>¢>œ>˜> >“>”>Ÿ>‘> >™>Ÿ>›>¡>•>™>…>š>>˜>ž>—>—>›>G>œ>˜>—>–>—>h>“>˜>ž>—>—>ˆ>›>Ž>—>…>p>œ>–>˜>>Ž>™>=> >†>>]>—>‘>Ÿ>>”>—>—>œ>›>|>c>}>›>Œ>“>œ>>—>œ>—>>—>—>“>>”>_>>›>™>™>>•>“>Ÿ>A>‘>H>•>—>>>Ÿ>‰>—>•>•>Ÿ>™>•>–>›>K>˜>>…>œ>>>˜>ƒ>™>œ>œ>|>•>€>‹>>>›>™>”>•>Ÿ>›>>Ÿ>œ>˜>£>>™>œ>‹>˜>˜> >i>›>>—>“>’>™>™>™>˜>>™>‹>C>…>>›>”>›>›>—>™>›>d>œ>–>Ÿ>œ>œ>—>‰>—>>—>>—>˜>œ>™>>”>˜>œ>œ>š>œ>“> >œ>›>œ>˜>™>>>>™>E>š>‰>¡>p>—>›>Ÿ>›>™>|><>—>œ>“>œ>”>M>—>i>™> >“>—>…>œ>œ>>3>£>”>›>™>›>>›>˜>c>i>>˜>?>‘>>›>E>>•>‹>™>>•>™>>Ÿ>›>“>‹>£>>m>c>|>Ž>‰>¤>’>Ÿ>›>—>–>Ÿ>œ>ž>‡>“>I>>œ>>>š> >Y>Ÿ>>Ž>Ÿ>š>Ÿ>T>Ÿ>‘>™>›>œ>“>˜>•>>–>›>…>Ÿ>>›>’>ƒ>—>—>˜>>>—>>‹>Ÿ>p>“>“>—>Ÿ>•>™>o>œ>>Ÿ>—> >™>…>‘>•>‰>˜>›>—>5>‘>˜>œ>>„>“>—>Ÿ>›>>•>—>œ>—>‘>œ>>ˆ>˜>>—>>“>Œ> >Q>>•>P>”>“>‘>˜>>™>›>‰>”>˜>™>—>š>Ÿ>›>—>…>š>¢>>—> >ƒ>™>‘>>¡>•>•>œ>Ÿ>S>™>ˆ>Ÿ>š>>›>™> >˜>>T>•>‰>>Ÿ>•>•>—>“>—>”>Ÿ>—>”>“>™>Œ>Ÿ>‹>>˜>›>>›>ž>x>˜>–>—>=>œ>—>œ>˜>…>”>™>˜>˜>—>“>e>¡>›>S>”>Q>œ>Ÿ>>›>•>—>>>7>‰>x>>˜>ƒ>—>”>•>>”>”>—>–>„>›>q>‚>•>œ>›>•>ž>>”> >›>w>˜>¡>›>>…>M>Y>>“>‡>˜>ž>™>˜>™>>™>ƒ>—>>™>—>“>”>œ>›>¡>™>>›>›>—>>Ž>˜>˜><>ž>˜>“>›>T>›>¡>˜>˜>¢>›>›>™>”>›>ˆ>“>•>›>”>˜>‹>™>œ>—>ž>œ>“>™>k>˜>œ>‡>“> >}>œ>˜>›>™>>˜>“>>˜>Ÿ>c> >Ÿ>œ>˜>˜>—>“>K>—>>™>“>™>Ÿ>›>™>Š>>@>—>>™>’>š>”>™>>>>‘>”>œ>—>I>œ>…>‘>œ>Š>¡>›>>€>>›>›>œ>‡>œ>™>|>“>C>—>k>”>>•>™>˜>—>›>a>˜>˜>>>q>˜>›>œ>¡>—>“>˜>›>>—>œ>>“>”>™>˜>‰>‘>›>u>>Ž>Ÿ>”>—>>Ÿ>œ>>—>“>œ>™>—>—>›>—>œ>›>˜>—>œ>—>…>•>™>>—>›>™>•>¡>ž>•>—>›>a>>>—>>œ>>˜>“>™>œ>œ>>˜>‰>=>‘>•>™>™>™>›>—>™>œ>˜>›>>›>›>‘>“>>•>>˜>–>œ>“>•> >˜>1>@>•>›>“>Ÿ>>”>“>›>›>›>•>@>™>‘>\>…>˜>“>œ>>“>™>œ> >š>œ>‘>—>œ>˜>—>A> >>”>“>>‘>Y>L>–>œ>“>>Š>E>›>œ>œ>œ>“>‰>™>Ÿ>¡>Ÿ>•>>>™>“>>œ>œ>>>˜>’>œ>ˆ>Ÿ>œ>™>•>—> >3>œ>Ÿ>˜>>>œ>›>Ž>–>—>™>›>“>–>œ>œ>•>•>>“>>›>œ>›>>“>‘>œ>>„>—>Q>˜>Ÿ>›>š>œ>>—>—>—>H>8>™>˜>˜>•>“>–>i>•>Ÿ>•>˜>]>‹>—>†>›>>•>“>–>>>>M>“>Š>>›>•>›>–>>|>—>—>S>ˆ>‘>…>œ>›> >i>> >—>›>˜>™>“>>>>E>‘>“>…>—>œ>›>˜>‘>>—>9>•>>>œ>—>›>œ> >>œ>“>—>”>˜>…>Ÿ>™>>“>> >•>œ>˜> >£>>–>Ÿ>—>Ÿ>‘>–>D>œ>“>> >“>˜>“>›>u>—>•>›>˜>”>‘>Œ>™>™>˜>›>˜>™>—>>œ>˜>€>›>“>˜>—>>k>™>™>‡>˜>>•>•> >›>¡>ž>p>š>œ>>”>?>—>˜>˜>Ÿ>œ>A>˜>€>˜>>‚>˜>‹>ž>“>>”>š>™>ƒ>•>>™> > >>—>˜>‘>O>™>> >‘>—>˜>•>œ>›>o>Q>s>C>_>œ>–>š>>—>œ>•>œ>>“>•>¡>›>Ÿ>•>œ>™>Ÿ>›>˜>—>œ>˜>›>>—>™>–>…>›>•>>š>M>“>‘> >—>•>“>™>>Œ>š>>œ>Y>H>‹>›> >˜>Ÿ>€>—>™>>c>›>—>Ÿ>›>—>l>Ÿ>‘>˜>”>¡>˜>> >—>Ÿ>Š>™>—>›>“>X>“>›>™>p>Ÿ>›>>œ>|>˜>Ÿ>C>Ž>˜>˜>•>¡>“>ž>ˆ>‘>—>¡>>>Ÿ>•>Ÿ>œ>—>Ÿ>”>‡>˜>œ>˜>š>…>—>=>œ>›>œ>>>’>>”>‘>—>Ÿ>•>Ÿ>™>>œ>S>—>—>˜>œ>“>K>›>™>™>“>˜>¡>`>”>›>—>œ>—>€>›>£>—>˜>s>›>“> >>›>‘>œ>—>—>Ÿ>™>•>”>“>“>™>—>–>>‘>…>’> >–>“>¡>œ> >˜>—>™>”>œ>˜>—>›>>‰>›>>™>˜>>’>ˆ>”>—>ˆ>˜>Ÿ>–>—>>>—>˜>˜>™>“>•>‹>> >y>Ÿ>•>—>˜>>™>œ>˜>¡>Ÿ> >“>ž>G>•>>™>—>›>š>›>”>˜>>”>¤>›>>/>“>›>u>›>›>•>>˜>œ>D>”>ƒ<”>›>—>˜>—>>`>Ÿ>œ>˜>•>•>›>˜>“>>“>›>˜>€>š>›>˜>—>›>>š>˜>˜>‰>‘>™>•>‘>s>7>”>x>›>> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/8.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/8.0 new file mode 100644 index 0000000000000000000000000000000000000000..251992a1f4d10d7615aa3c7e772cd4300b48fb33 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/8.0 @@ -0,0 +1 @@ +˜>˜>ž>“>+>Ÿ>œ>œ>˜>™>€>¤>¡>™> >—>™>ž>“>£>”>Ÿ>œ>k>>‘>œ>\>œ>8> >ž>>>œ>‘>Ÿ>Œ>‘>™>q> >]>…> >\>—>ˆ>>™>l>£>M>˜>š>™>˜>‰>Ÿ>@> >“>™> >™>¡>›>›>”>¡>—>>Ÿ>>…>£>œ>ž>Ÿ>œ>>Œ>9>œ>>Ÿ>Ÿ>8>¡>£>œ>˜>™>•> >›>ž>œ>£>¦> >¨>@>1>¦>œ>> >Ÿ>Ÿ>Ÿ>•>“>¡>”>œ>¥>ž>—>›>>›>™>˜> >œ>›>¡>Ÿ>˜>›>¤>™>S>¤>‰>—> > >Ÿ>y>˜>¥>‰>—> >€>ˆ>Ÿ>¢>…>>“>”>›>—> >ž>“>—>w>‘>’>ˆ>˜>P>y>œ>k>ž>>¥>¡>˜>u>W>›> >˜>‰>d>>¢>™>“> >™>>>£>>Ÿ> >>=>¡>Ÿ>—>£>)>œ>Ÿ>’>›>œ>…>£>¡>£>>¡>›>>«>•>œ>“>œ>>¤>›>“>>“>¤>—>}>¡>>™>>œ>>˜>¡> >›>>‹>˜> >>¢>›>>–>•>—>—>¤>¨>>¤>>s>“>¤>¡>›>¡>>ž>¤>˜>“>¤>d>œ>Ÿ>”>™>˜>Ÿ>¡>Ÿ>œ>—>Ÿ>£>¡>>I>>£>>›>>©>›> > >#> >œ>Š>>‘>£>]>£>>7>¨>—> >›>> >‰>Ÿ>ˆ>§>‹>¤>A>…>”>—>Œ> >c>ž>™>›>—>ˆ>œ>>‘>Œ>>Ÿ>>˜>>Ÿ>|>§>£>‹>œ>£> >œ>”>¤>£>>”>›>>‹>Ÿ>˜>Ÿ>—>¡>™>–>—>›>™>©> >“>”>œ>…>”>> >>Œ>x>>>£>˜>•>>›>¡>œ>œ>]>‘>>¡>–>q>>£>™>Ÿ>ž>•>‹>™>>>Ÿ>>£>£>Ÿ>›>>¡>¤>—>=>ˆ>›>¡>Ž>>”>“>¦>…>œ>Ÿ>>œ>‡>Ÿ>>Ÿ>”>>”>K>–>>>œ>> >Ÿ>™>Ÿ>™>‹>Ÿ>=>œ>ž>Ÿ>ž>œ>˜>œ>£> >{>ž>>—>¥>™>¡>£>¨>›>Ÿ>>¥>>‘> >T>¡>œ>>Ÿ>¡>•>‰>“>™> >¡>*>ƒ>Ÿ>—> >œ>>©>‹>Œ>>ž>™>›>•>•>>£>ž>>>˜>¥>£>Ÿ>™>>,>—> > >¤>•>™>Ÿ>¤>£>\>˜>›>›>›>=>Œ>›>‘>—>9>Ÿ>”>œ>Ÿ>>?>¢>“>Ÿ>™>>5> >>™>¡>¥>™>›>›>y>—>”>>>—>…>>“>S>¡>-> >—>>œ>˜>œ>†>‘>›>œ>‘>Ÿ>¡>>£>¡>>‹>›>‹> >>£> >Š>™> > >„>>¤>–> >>ˆ>™>,>>‡>›> >¥>•>™>œ>‘> >œ>Ÿ>§>‘>> >¡>Ÿ>>¡>x>›> >˜>ˆ>™>š>ƒ> >˜>>O>Ÿ>£>Ÿ>{>—>š>—>>Ž>›>¬>Ÿ>#>>¡>>>Œ>¦>>‡>˜> >Ÿ>¡>—>š>Œ>œ>œ>>˜>Q>˜>—>”>p>•>¡>œ>œ>“>˜>—>—>>q>§>™>œ> >i>™>Ÿ> >¡>p>™>(>¡>Ÿ>›>Ÿ>€>>‘>™> >’>>¤>”>™>¤>©>™>œ>”>y> > >œ> >¢>u>›> >¡>š>™>œ>”>Ÿ>¡>[>U>¢>>•>œ> >”>—>£>Ÿ>©>›>›>£>¡>K>™>>s>>™> >¡>”>>§>‰>`>—>Ÿ>˜>œ>Œ>›>™>«> >m>œ>s>=>—>¡>Ÿ>>>£>Œ> >œ>¤>>¢>ž> >ƒ>—>> >…> >™>u>—>>ž>¡>›>¡>”>Ÿ>Ÿ> >˜>>¡>œ>œ>¥>¡>˜>“>§>¡>œ>“>>”>£>> >¡>¡>¦>œ>¡>‰>>‘>™>>Ÿ>˜>£>a>]> >œ>™>ƒ>š>£>—>œ>™>Ÿ>›>•>Œ>”>>‡>>¡>¥>>¡>š>Ÿ>> >›> >>—>œ>˜>Ÿ>£>™>]> >¢>›>‘>£>—>Y>> >“>–>™>¤>œ>œ>q>>¨>“>ž>i>> > >T>Ÿ> >¥>Ÿ>ž>£>>Ž> >›>—>¥>ž>q>Ÿ>>¡>Ÿ> >)>U>™>œ>¡>œ>–>>¥>X>›> >”>•>>˜>£>>™>>¥>£>¡> > >Ž>¢>‹>›>ƒ>•>m>}>—>—>§>˜>> >Ÿ>—>¦>£>•>œ>H>›>›>™>™>>>>œ>›>œ>—>™>¥>–>‰>y>¥>i>ƒ>›>—>>)>¡>¡>›>ˆ>§>‘>“>›>S>¥>‰>D>—>>>©>œ>˜>¨>8>›>Q>ˆ>¥>˜>‹>©>™>›>œ>Ÿ>£>Ÿ>{>£>>Ÿ>™>œ>š>•>Ÿ>g>œ>Ÿ>a>§>”>>˜>>£>™>‘>—>Ž>˜>›>¥><> >—>£>›>£>ž>™>˜>‰>›>l>£>›>>¡>œ>¨>>¥>`>™>Ÿ>˜>¦>¦>”>¢>Ÿ>>¥>> >o>›>”>1>—>£>x>>>œ>›>˜>˜>œ>£>k>¥>˜> > >y>>¡>˜>£>˜>‘>¥> >’>š>œ>?> >˜>¡>ƒ>0>œ>˜>”>—>£>Ÿ>¥>>¤>¡>‚>ˆ>>>§>> >i>—>“>Ÿ>‡>©>[>™>‘>™>¥>‘>—>¤>§> >—>¦>¡>Ÿ>¨>‰>‰>g>”>“> >“>™>£>œ>¤>¡> >™>;>&>—>>¡>Š>€>•>§>Ÿ> >…>> >–>•>š>—>‹> >“>q>•>¢>›>Ÿ>£>t>¡>œ>™>•>>u>™>œ>>¥>ž>ƒ>>>‰> >Ÿ>Š>’>˜>T>Q>•>§>ƒ>›>§>¤>¥>™>Ÿ>¡>œ>> >>>™>š>c>™>˜>£>K>>—>™>•>¤>>«>›>‘>—>—>£>˜>—>‹>¡>‘>>¤>–> >>ˆ>•>P>œ>Y>Ÿ>w>>¢>‰>Ÿ>—>>Ÿ>>“>•>£>>œ>œ>«>¡>™>œ>¢>¡>¡>›>¥>‘>Œ>[>™>š>¢>›>˜>“>¨>>£>;>|>¦>>ˆ>™>¡>™>™>¨>¡>£>”>œ>›>£>x>£>>>œ>‹>œ>Ÿ>‰>œ>›>£>™>>‘>—>†>>˜>’>™>¥>>”>{>˜>“>¡>Ÿ>>¥>¡> >•>™>™>>£>§>—>¡>š>Ÿ>>™>›>›>Ÿ>£>¨>> >ƒ>œ>‘>‰>M>›>“>˜>‰>>›>e>£>>¡>›>¡>>‚>™>”>”>œ>˜>Ÿ> >¤>¡>›>>–>¤>@>¢>¡>>>œ>•>“>>œ>‘>™>™>>™>>›>™>¡>œ>¨>œ>>o>™>c>œ>“>™>”>>> >€>œ>¤>Ÿ>>˜>|>‹>>ž>¡>¡>˜>œ>>¡>>™>Ÿ>ž>£>“>œ>¡>>Ÿ>§>‰>œ>£>Ÿ>x>‘>‰>˜>>˜>—>”>q>_>P>‰>>>L> >¡>˜>”>•>’>¢>Ÿ>‰>¤>>‘>¡>>”>E>>”>>>œ>™>’>—>y>™>X>£>£>¥>`>¡>Ÿ>¨>¦>>£>™>E>¤>—>œ>œ>™>”> >–>œ>¥>˜>™>>> >s>œ>¡>™>—> >©>¡>›>˜>¤>£>™> >>ž>>§>Ÿ>‰>˜>˜> >£>˜>¡>£>£>”>›>>s>ƒ>›>ƒ>œ>“>€>>¢>™>™>> >§>>>¢>>>1>T>˜>Ÿ>>œ>œ>T>™>›>Ÿ>œ>£>‹>‹>¡>Ÿ>“>U>›>œ> >—>‘><>›> >œ>£> >“>›>¡>¡>Ÿ>¡>š>›>™>›>>¥> >‹>ž>£>š>˜>š>•>£>‰>>™>Y>—>›>™>ƒ>¨>œ>‡>>Y>>œ>œ>¡>›>§>€>>¢>™>‡>U>™>¬>>4>Ÿ>Ÿ>Ÿ> >‡>ˆ>§>š>1>£>>”>…>Ÿ>£>—>‘>™>¡>©>Ÿ>Ÿ>¡> >¡>L>‡>Ÿ>£>>œ>›>‰>>“>m>¡>>Ÿ>£>›>“>ž>˜>> >‘>˜>£>¡>Œ>Ÿ>”>>>œ>D>>™>>š>£>”>‡> >¡> >>¢>˜>l>œ>¢>¡>>¥>Ÿ>‰>›>ˆ>m>œ>˜>y>>>œ>˜>œ>£>›>Ÿ>•>›>¡>@>ž>™>|>m>Ÿ>“>—>˜>–>¡>“>œ>¡>¡>£>>@>‹>¡>Ž>Ÿ>™>˜>—>˜>œ> >—>£>˜>˜>¥>¡>ž>—>£>—>Ÿ>œ>œ>›>˜>‘>ƒ> >™>–>Ÿ>§>—>˜>›>>>š>G>¡>£>[>>Ž>Ÿ>‚>œ>¥>œ>•>›> >›>œ>œ>š>q>Ÿ>W>”>¥>7>˜>™>˜>§>[>>‰>“>—>£>c>–>¡>”>£>˜>ƒ>ˆ>”>“>3>Œ>‘>>ž>™>£>™>…>‰>—> >—>C>›>œ>œ>—>>—>›>>—>‘>“>›>™>”>,> >Ÿ>>Ÿ>>•>Š>™>“>>œ>‹>œ>œ>>—>k>I>Ÿ>›>¤>™>\>“>•>˜>¡>Ÿ>¥>ž>>>›> >>Ÿ> >™>£>>“> >š> >œ>œ>ž>!>—>¡>•>¡>¡>>›> >˜>›>£>™>š>™>˜> >>¡>˜>“>>“>8>‰>œ>>¡>Ÿ>™>•>Ÿ>œ>£>˜>¥>›>«>¤>>—>Ÿ>3>¢>›>¤>‘>–>™>Ÿ>Ÿ>Ÿ>§>>—>”> >œ>˜>™>¡>}>”>>™>˜> >¤>P>>‹>>ž>)>¥>›>Ÿ>>c>Ÿ> >™> >¡>‘> >¨>¥>–>¦> >…>—> >™>¤>¤>œ>›>P>•>˜> >Œ>>œ>™>>M>§> >˜>˜> >>˜>Ÿ> >•>œ>>C>˜>–>—>˜>>›>>¡>ž>”>>—>•>Ÿ>œ> >>˜>˜>¦> >•>£>“>•>¡>Ÿ>˜>¡>>•>>>>d>>”>„>¡>‘>o>¡>œ>˜>¥>£>Ÿ>—>›>¡>>>—> >‹>—>¥>Ÿ>›>¥> >¡>3> > >£>˜>„>˜>œ>–> >>ž>¡>£>›>™>›>£>‹>>ˆ>>Ÿ>>[>Ÿ>”>>£>˜>˜>Ÿ>>>§>¥>Ÿ>™>¡>¡>˜>œ>—>>ƒ>œ>£>›>•>>¡>Ÿ>Ÿ>—>>œ>x>‘>™>>>>¡>œ>™>™>«>c>]>>Š>™>> >¥>—> >…>Ÿ>Ÿ>—>•>™>•>™>œ>ž>—>¢>”>y>w>•>­>™>Ÿ>¢> > >•>>>™>Š>>}>Œ>œ> > >>™>>>Ÿ>‰>œ>> >Ÿ>¡>¡>œ>¨>›>œ>y>>ƒ>ƒ>w>“>P>‘>¬>‹>œ>L>›>£>“>>w>•>‹>„> >‡>—>H>¨> >£>Ÿ>¥>™> >˜>>Ÿ>Ÿ>>§>—> >Ÿ>£>/>…>ƒ>˜>£>™>£>‰>¡>Ÿ> >£>‹>™>›>”>š>)>•>•>>—>ž>‡>‹>¥>>œ>c>˜>¤>>¡>›> >™>—>¡>€> >œ>¥>§>>”>›>—>M>¡>>t>?>>˜>ª>“>”>¡>¡>˜>¡>¡>Ÿ>K>k>¡>•>”>˜><>“>¡>£>>¡>¡>>>œ>œ>œ>>Ÿ>©>¤>> >•>§>œ>¡>“>Ÿ>™>Ÿ>™>‘>˜>¡>‹>—>™>•>Ÿ>œ>>4>™>˜>¡>Ÿ>¡>›>›>ž>˜>œ>Ÿ>œ>”> > >>>™>¡>>˜>›>¢>ˆ>¤>œ> >¥>L>š>›>>—>‡>¥>Ÿ>…>›> >>Ÿ>™>‘>¡>Ž>›>—>ž>›>‹>¤>x>€>”>ž>Ÿ>“>>ƒ>¤>>œ>ˆ>–>­>¤>4>Ÿ>‰>’>›>9>>>¡>>œ>›>Œ>™>Ÿ> >>‡>œ> >>>>—>”>£>>¢> >m>{>¨>>š> >¤>>u>¡>Ÿ>›>”>£>©>©>Ÿ>—>œ>›>“>_>—>Ÿ>™>™>y>Ÿ>œ>˜>>•>>™>¡>¡>›>œ>£>š>¤>>¤>X>˜>¥>™>ž>>e>—>™>¡>›>>¡>œ>o>œ>œ>£>™>—> >Ÿ> > >‡>™>”>™>”>>>˜>8>L>£>¨>¡>˜>>¨>˜>›>¤>—>”>œ>§>“>—>“>‹>P>>@>™>>ž>›>}>>w>>>¢>—>>›>1>œ>¥>¦>> >‹>œ>”>›>ƒ>˜>›>•>>¦>ž>>¨>™>ƒ> >Ÿ>M> >¡>—>>Ÿ>—> >>Ÿ>—>™>§>¡>¥>>¥>}>”>œ>˜>l>>™>—>–>£>“>s>c>‘>¡> >>›>Ÿ>¡>¨>£>ª>›>>A>™> >Ž>¡>š> >£>Ÿ>£>¡>s>…>>c>™>›>£>›>—>œ> >¤>>œ>¡> >—>“>>¤>š>D>•>˜>€>˜>™>›>>£>¡>œ>Ÿ>>£>ž>˜>•> >›>™>£> >¢>‡>œ>g>˜>œ>Q>™>™> >•>—>h>c>£> >>}>¡>™>y>§>¡>›>£>”>˜>£>Ÿ>¥> >£>Ÿ>¤>—>™>ˆ>>>œ>¥>›>Ÿ>¡>D>Ÿ>Ÿ>›>˜>Ÿ>[>•>–>£>˜>˜>…>¡>”>›>‡>s> >™>›> >”>œ><>£>>>Y>—>—> >¤>™>Ÿ>™>¡> >>a>„> >>™> >ƒ>œ>>œ> >>œ>—>’>”>X>¥>Ÿ> > >‹>>—>¤>=>”>=>›>œ>“>‘>£>>˜>—>š>¥>›>>> >@> >>‰>Ÿ>•>“>—>>¡>¡>ž>€>š>…>>’>•>Ÿ>>™>œ>Ÿ>£>¡>¡> >>¥>> > >Ž>›>›>«>k>œ>”>—>˜>”>›>Ÿ>Ÿ>>—>¡>>9>ˆ> >¡>•> >Ÿ> > >œ>i> >>£> >Ÿ>›>>›>£>>>Ÿ>™>¡>£>…>—>œ>¢>Ÿ>Ÿ> >˜>¢> >> >>>Ÿ>¢>“>£>S>™>Œ>§>o>œ>¡>¨>Ÿ>Ÿ>><>™>>™>£>•>H>œ>h>>§>”>™>>¥>¡>”> >¨>•> >¡> >“>œ>œ>a>k> >œ>5>—>¤>>=>…>œ>Š>Ÿ>”>™>Ÿ> >¥>ž>•>ˆ>¨>‘>„>o>>>‹>©>”>Ÿ>£>Ÿ>›> >¡>£>ˆ>š>?>“> >£>”>œ>¡>U>§>‘>˜>£>¡>¤>T> >‘>ž>Ÿ>¡>•>¢>™>”>›>¡>‡>£>“>œ>–>…>>›>›>‹>¤>œ>”>>¡>k>”>•>–>¥>•>ž>p>¢>”>¤>™> >¡>ˆ>“>›>>™> >™>D>—>> >>ƒ>”>™>¥>£>>œ>˜>¡>œ>>Ÿ>—>‰>™>¤>œ>”>˜>>§>S>>—>P>˜>’>™>›>¤>™>>>—>>¡>>>¥>Ÿ>™>…>Ÿ>Ÿ>‘>™>¡>ƒ>œ>—>‘>¤>˜>˜>¡>¤>P>>‹>§>œ>£>¡>>©>Ÿ>Ÿ>S>›>Œ>”>¡>š>>Ÿ>—>œ>—>¨>˜>˜>—>œ>>£>“>>œ> >”>¡>¡>y>>™>›>/> >™>>>‡>“> >œ>¡>™>•>d>¨>£>W>›>P> >¡>–>œ>Ÿ>Ÿ>˜>“>#>>>‘> >…>™>™>›>£>œ>”>˜>Ÿ>‡>¨>€>>•>¥>Ÿ>—>£>¥>˜>¦>¥>x>œ>¥> > >…>K>_>ž>—>‡>›>¡> >>œ> >œ>…>™>—>>œ>˜>™>>£>¨>¡>‹>£> >>•>‘>ž>>,>£>Ÿ>—>£>`>›>©>œ>œ>¥>¡> > >›>œ>Œ>•>š>£>•>›>>>¢>>Ÿ> >>>a>>£>‡>•>¤>y> >›>£> >‘>Ÿ>”>¡>™>¤>e>§>§>¡>œ>>ž>—>W>›>Ž>¡>˜>Ÿ>¥> >>Œ>‘>8>—>§>œ>“>Ÿ>•>Ÿ>>’>“>“>›>¡>>H>¡>…>”> >Œ>¡>Ÿ>>>©>>œ>>>¡>™>|>˜>0>Ÿ>h>˜>¡>™>™>ž>œ>>c>›>›>Œ> >q>œ> >>£>>>›>¢>¥>œ> >¡>“>•>ž>¡>>“>>„>—>>¤>˜>›>“>£>¡>”>¡>›>£>ž>˜>˜>¡>˜> >>ž>—>>›>‡>˜>Ÿ>“>›>¡>Ÿ>˜>§>Ÿ>›>™> >_>“>¡>¢>>£>“>>š>> >¡>—>œ>‹>4>—>›>˜>Ÿ>ž>¡>œ> >Ÿ>›>Ÿ>”>> >˜>•>¥>˜>¡>Ÿ>›>ž>”>š>§>ž>%>;>›>¡>œ>¤>”>—>•>œ>Ÿ> >—>8>Ÿ>›>`>Œ>ž>—> >‘>—>>¡>§>™> >—>œ>¤>›>˜>9>£>—>—>—>›>“>T>H>˜> >›>‚>>;>¡>œ>¡>£>–>‰>›>¢>¨>¥>> > >˜>—>—>¡> >|>‘>ž>”>Ÿ>‰>¤>Ÿ>>™>œ>¨>> >£>ž>£>>¡>Ÿ>“>›>˜>>Ÿ>—>›>ž> >˜>›>—>™>—> >£>>£>˜>—>£>>‰>˜>P>>§> >£>¢>£>š>™>—>G>1>Ÿ>>œ>—>˜>—>g>˜> >›>ž>H>‰>™>‡>Ÿ>>™>™>“>>>£>E>”>‹>>œ>™>> >“>ƒ>™>œ>Q>‹>•>‰>£> >¥>p>“>¥>›>¡>> >˜>£>”>“>D>”>—>ƒ>Ÿ> >¥>œ>—>“>˜>1>™>”>“>Ÿ>˜>¢> >¥>—>¤>—>™>™>Ÿ>„>¨>œ>“>•>>¬>™>Ÿ>ž>¡>¨>£>›>¥>œ>Ÿ>•>>->¡>˜>“>§>—>œ>”> >|>˜>œ>ž>>˜>•>>Ÿ> >> >œ>¢>›>£>¡>>>š>•>›>™>”>i>œ>˜>Š>œ>>—>™>¨>ž>¨> >o>Ÿ>¡>Ÿ>˜>5>ž>™>¡>¨> >3>›>>Ÿ>”>ƒ>>>¨>“> >˜> >›>…>™>¡>Ÿ>¤>©>¡>›>œ>‘>H>œ>£>¥>—>›>™>™>> >m>M>{>0>U>¡>œ>£>£>™>¥>™> >¢>™>>¥> >¥>˜>¥>œ>£>¤>œ>Ÿ>£> > >”>›>>›>†> >›>>¥>P>•>—>©>>™>—>¡>>“>œ>> >]>)>> >¦>™>£>‚>œ>¡>•>`>ž> >¡>>>k>¨>“>™>—>£>™>‡>£>œ>§>>¡>™> >—>Q>˜>>>x>¡>> >ž>ƒ>œ>§>O>”>œ>›>™>©>•>§>‹>–>›>¥> >¡>¡>™>©> >›>¥>—>‰>œ>Ÿ>˜>œ>…>—>7>¡>£>˜>˜>>–>>›>—>>¡>œ>Ÿ>œ>>ž>G>™>š>œ>¡>˜>M> >Ÿ>>—>™>¥>o>—> >–>Ÿ>>> >§>œ>›>s>£>>¥>‘>Ÿ>—>£>Ÿ>›>£>>˜>™>”>—> >œ>˜>¡>•>‰>•>§>™>˜>¤>£>¥>>™>›>—>¡>>Ÿ>Ÿ>£>>£>>>Ÿ>>—>‡>”>œ>‡>œ>¡>›>˜>“>>›>Ÿ>œ>>•>˜>>¡>¥>€>¥>—>™>>“>Ÿ>£>˜>§>¡>¥>•> >H>˜>>>›>¢>¡>Ÿ>—>ž>“>—>¨> >¢>>—> >>>>˜>ƒ>£>¡>->˜>C·•> >›> >›>¡>o>£>¡>œ>>˜>¡>œ>•>¤>—> >›>€>>£>™>˜> >> > >œ>Š>—>™>˜>•>k>&>–>„>—>“> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/9.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/9.0 new file mode 100644 index 0000000000000000000000000000000000000000..473e420ab0972a38fb0e0e14f9cc5a18881257f0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.layer_norm_weight/9.0 @@ -0,0 +1 @@ +˜>™>™>“>E>¡> >>™>>}>ª>£>•>¡>˜>˜>¡>•>£>”> >¡>t>‘>”>Ÿ>Y>Ÿ>I>¥>œ>>Ÿ> >™>£>>’>œ>i>£>i>‡>>[>˜>ˆ>—>œ>x>¤>T>˜>™>>™>‡>¤>K>¤>—>Ÿ>¡>›> >>>”>¥>“>¡>¡>>ˆ>¥>>¡>>Ÿ>>Œ>E>Ÿ> >¢>¢>S>¡>£>Ÿ>™>™>˜>¡>›>ž>ž>¡>¨>¡>§>H>@>£>Ÿ>œ>¡>Ÿ>Ÿ> >‘>“> >•>>¥>>›>™>>œ>™>œ>Ÿ>›>ž>£>ž>™>¡>«>š>M> >‡>–>¡>¤>>p>›>©>‡>˜>£>w>Š>£>£>ƒ>>“>’> >˜>¡>¡>“>˜>q>“>>‡>>Y>x>Ÿ>e>£>>­>£>™>p>8>>¥>™>>_>>¡>›>—> >™>>Ÿ>©>ƒ> >¥>>S>£> >š>¤>@>>¢>“>¡>>†>¦>¤>¥>“> >>?>³>>œ>•>> >¦>>•>Ÿ>‘>¡>”>s>¡>>›>> > >—>£>£>>Ÿ>>™>£>¡>§>›> >š>”>›>˜>«>ª>>§>¡>m>—>¥>¥>—>¥>˜>Ÿ>¢>•>‘>¥>c>œ>¡>“>™>ž>¢>¡>¢>œ>˜>›>£>¥> >=>Ÿ>¤> >>¡>§>œ>¡>õ=#>¡>¡>‰>>>¥>\>¥>>H>¨>—> >Ÿ>>¢>‡>¤>>¨>‹>§>P>ƒ>•>—>‹> >]> >œ>œ>˜>>œ>Ÿ>‘>>”>¡>›>™> >£>x>©>¦>>>£>£>œ>>£>¤>>”>™>‹>Œ> >™> >‘>£>›>™>—>Ÿ>˜>«>>”>•>ž>y>’>>£>Œ>>L>£> >¥>”>“>Œ>Ÿ>¢>>›>c>“>ƒ>¥>—>k>> >™>Ÿ>Ÿ>”>‘>˜>’>>¤>Ÿ> >§> >—>“>£>§>—>K>‰>š>¥>>™>•>”>¥>ƒ>œ>Ÿ>‚> >Œ>£>ž>Ÿ>“>Ÿ>–>X>˜> >€> >> >>>Ÿ>›>ˆ>Ÿ>L> >œ> >£>>—>>¡>¡>|>¡>‹>™>§>˜> >¥>©>ž>Ÿ>Ÿ>¨>£>˜>¡>S>¡>Ÿ>>¡>¥>˜>Œ>“>œ>Ÿ>¤>A>ƒ> >—>¥>>¡>«>Œ>ˆ>’> >œ>>—>—>>¥>> >>—>£>£> >š>¡>E>—>¡>¡>¥>˜>œ>£>Ÿ>¥>Y>›>œ> >¡>M>>œ>>˜>K> >•>™> >’>H>¡>“>>™>Ž>A>¡>“>›>¤> >›>œ>š>u>š>•>‘> >—>‡>¡>‘>`>£>G>¡>”>“>Ÿ>™>Ÿ>‰>‘>Ÿ>>>¡>> >¥>¢>ž>‰>Ÿ>ˆ>¡>>§> >>—>ž>¡>‰>“>§>—>£> >ˆ>œ>@>‹>‰>>¡>§>”>œ>œ>”>¥> >Ÿ>§>“>‰> >¡>¡>›>¡>y>œ>£>—>‡>˜>™>€>¡>˜>Ÿ>X> >§>œ>€>š>>˜>>>>¨>¡>A>¤>©> >¡>>©>‘>‰>›>Ÿ>¥>¡>š>™>Ž>Ÿ>Ÿ>>˜>S>˜>”>“>u>˜>¨>>Ÿ>>™>˜>˜>›>o>©>>> >c>Ÿ>Ÿ>¡>¢>g>š>@>¥> >™>>>>>›>Ÿ>“>Ÿ>¥>—>•>¨>«>™>›>“>‚>¡> >Ÿ>Ÿ>¡>w>™>¡>£>›>> >“>¡>¤>T>U>¡> >–>> >š>˜>§>¡>¨>›>›>¥>£>L>›>>y>”>™> >¥>—>>©>‰>[>•>>˜>Ÿ>>™>>Á>¥>o>œ>s>L>™>£>Ÿ>>Ÿ>¢>‹>¢>œ>¥>>§> > >}>˜>>¢>€> >>t>“>¡>œ>£>˜>¤>‘>¡> > >›>>ž>Ÿ>Ÿ>©>£>œ>“>§>¡>›>Ž>>”>§>>¢>ž>£>«>›>£>‹>œ>‰>>> >›>§>`>`>£>ž>Ÿ>„>™>¥>›> >œ> >™>˜>Š>˜>Ÿ>…>‰>¢>£> >¥>›>Ÿ>ƒ>¢>œ>ž>œ>˜>œ>•> >¡>›>S>¡>¤>š>‘>¢>˜>c>¡>£>”>—>œ>¦>œ>>u>Ÿ>©>‘> >i> >¡> >U>Ÿ>¡>¨> > >«>“>‹>£>>–>¥>¡>p> >>¤>>š>@>`>œ>Ÿ> >œ>˜>Ÿ>¢>S>œ> >•>•>”>›>¤>>›>>©>§> > >£>‹>£>>>‰>“>o>>—>•>«>˜>“>Ÿ>Ÿ>—>¤>¤>˜>>P>™>¡>š>œ>>Ž>‘> >Ÿ>>•>˜>§>™>‰>y>¨>i>}>Ÿ>—>£>E>¡>¤> >‹>¥>“>“>œ>[>¨>‡>`>™>œ>¡>©>›>š>©>C>Ÿ>`>‡>­>˜>Œ>¨>™>›>Ÿ>¡>¥>¡>{> >>¡>˜>>œ>”>>e>Ÿ>¡>X>¥>“>¡>›>>£>™>“>•>>˜>Ÿ>©>G>Ÿ>˜>«>>£>Ÿ>œ>—>‹>>l>¥> >Ÿ>¡>›>ª>Ÿ>§>M>›>¡>œ>¨>­>•>¡>¥>¡>¤>£>¤>p>˜>”>E>—>¡>u>œ>“>>>˜>—>›>ª>\>¨>˜>>¢>s>>£>›>¥>š>”>©>¢>”>Ÿ>>O>¥>œ>¡>…>E>¡>š>”>•>£>Ÿ>¤>>§> >…>‰>->ƒ>¥>€>Ÿ>e>—>“>£>…>¯>\>>“>™>¥>—>™>¥>«>¡>›>­>¤>œ>©>‰>…>e>•>‘>¥>“>—>§>œ>¤>¢>¡>˜>=>A>—>¡>¢>‹>„>—>§> >Ÿ>ƒ>>Ÿ>›>—>˜>—>‹>¥>•>m>˜> >>¡>¡>y>¡>>>“>¡>w>™>ž>>¦>¡>„>Ž>¡>‹>ž> >‡>>™>]>3>“>¤>…>œ>©>¨>¬>™>¢>¥>£>>Ÿ>Ÿ>Ÿ>œ>œ>d>Ÿ>š>¥>Q>œ>œ>›>•>¥>œ>­>Ÿ>’>•>™>§>˜>˜>>¡>•>>¤>”>> >‹>”>P>>[>¥>x>>¤>ˆ>£>•>“> >>“>•>£>>œ>Ÿ>©>£>™>œ>¡>¡>£>™>¥>•>‹>]>—>>£>›>˜>”>©>3>§>3>x>«>>ˆ>›>§>œ>œ>§>¡>£>“>œ>>¥>y>¨>>¡>Ÿ>>ž>¡>‡>>ž>¥>™>£>“>—>…>Ÿ>˜>“>˜>£> >•>h>˜>”>¡>Ÿ>œ>«>£>Ÿ>•> >™>>¢>¨>˜> >›>Ÿ>>>œ>˜> >¨>«>Ž> >ƒ>œ>’>‰>X>>•>›>‰>“>˜>d>¤>”>¡>>¡>Ÿ>>™>˜>™>Ÿ>™>> >¦>¢>™>>–>¨>P>Ÿ> > > > >—>•>”>Ÿ>‘>˜>>¡>›>>>•> >›>¥>£>>|>œ>c>›>‘>›>•>¡> >¥>}>Ÿ>¡>>œ>š>{>‹> >>Ÿ>§>™>œ>œ>£> >™> > >¥>>›>¤> >Ÿ>¥>>›>£> >u>•>Š>˜>Ž>›>˜>•>s>a>T>‡>> >S> >¡>–>•>“>>£>>‹>¥>>’>£> >•>Q>ž>”>Ÿ>y>œ>™>—>›>w>›>`>¨>¥>¢>c>¥>Ÿ>«>¨>>¡>œ>U>§>˜>> >>—>£>•>œ>§>›>™>›>¡>¢>q>Ÿ>¥>™>> >©>¦>>˜>ª> >œ> >>Ÿ>ž>¦>Ÿ>‡>œ>œ>¢>¦>›>£>£>¥>—>›>>}>ƒ>Ÿ>x>>“>}>>£>œ>™>›>¡>©>>¡>¦> >¡>A>W>> >>>œ>P>—>¥>£> >£>„>Œ>§>¤>•>[>›>ž> >™>“>K>™>£>>¦>¥>>˜>¥>©>£>Ÿ>>œ>™>›>>¨>Ÿ>ˆ>¡>¤>>˜>—>—>¤>‹>¡>œ>X>˜>>œ>{>©> >‰>‡>U>> > > >›>«>ƒ>‰>¥>™>†>i>›>±>‘>E> >¢>¤>§>‡>ˆ>¥>œ>=>¡>>”>ˆ>œ>Ÿ>—>>š>¤>«>¢>¡>¡>£>¡>Q>‹>¡>¥>>œ>›>‹>‡>”>p>¥> >Ÿ>¥>™>’>¡>>¡>¡>>œ>ª>¤>>¢>“>¡>œ>œ>P>„>œ> >™>£>“>…>¤> > >>£>™>p>ž>«>¡>>¥>Ÿ>‡>>ˆ>i>œ>˜>y> >¡> >›>Ÿ>¡>›>£>•>>¥>C> >™>€>m>£>>—>˜>—>Ÿ>™>œ>¤>¥>¥>œ>O>‰>¡>>Ÿ>˜>•>—>˜>>¡>™>¦>œ>ž>¥>£> >—>¨>˜> >œ>œ>Ÿ>>’>‰>£>›>›> >«>œ>›>œ> > >œ>Y>£>§>L>”>> >…>>>›>™>—>Ÿ>>>>›>t>>X>”>­>M>˜>™>™>¥>[>ƒ>Š>>˜>¥>a>’>¤>”>§>>‡>‹>”>‘>K>>>Ÿ> >›>¥>™>‡>‹>™>¡>™>S>Ÿ>Ÿ>œ>˜>œ>•>>£>˜>‘>“>œ>š>“>@>§>¥>>£>>”>‰>™>“>>¡>‡>Ÿ>›>;>”>l>L> >>§>™>[>>˜>Ÿ>¡>¡>©>¤>›>>>¡>£> >¡>š>¤>>> >™>¦>™> >>A>˜>¡>˜>Ÿ>¤>‘>™>£>—>›> >™>™>™>™>£>>£>—>—>›>—>K>‹>›>>¡>¥>˜>•>¡>œ>¤>œ>§>Ÿ>«>¨>ž>™>£>H>¥> >¨>>–>˜> > >¡>§>@>•>•>£>œ>—>˜>¡>w>˜> >˜>›> >¡>P>>ˆ>˜>Ÿ>S>§>˜>Ÿ>‘>U> >¢>œ>>©>“> >ª>¨>—>©>£>‡>—>¤>Ÿ>¥>­>š>™>T>•>›>¡>Œ>£>>™>¢>Y>©> >”>œ>£>™>—>Ÿ> >™>>¡>I>›>“>˜>˜>5>>>¡> >•>•>—>—>œ>¡>0>‘>›>ž>£>£>˜>£>“>—>£>Ÿ>˜>£>>’>>>>a>Ÿ>>>¥>>q>£>Ÿ>š>¨>£> >™> >£>>‹>—>Ÿ>>œ>§>¡>>£>¤>¥>/>¥>Ÿ>©>™>€>—>>’>¥>•>£>¥>¥>œ> >Ÿ>¤>‡>>‹> >Ÿ>Ž>X>¡>“>‘>¥>Ÿ>–> >>>¥>£>¥>>¡>£>™>>›>>…>>¨>œ>™>‘>¡>Ÿ>£>—>¡>™>l>˜>™>“>ž>”>£>>œ>Ÿ>­>g>[>;>ˆ>›>¡>¤>«>›>¢>…>>œ>˜>—>œ>—>™>›>Ÿ>—>§>>ƒ>x>˜>­>ž> >¥>Ÿ>£>•>˜>>™>–>¢>t>>š>¡>£>‹>œ>Ÿ>“>£>‹>œ>™>¡>¡>¥>£> >¬>›>¡>q>¢>…>ƒ>}>—>T>”>­>ˆ>›>K>Ÿ>¤>”> >y>—>Œ>Œ>>ƒ>—>E>¨>¢>¥>£>§>›> >˜>>>Ÿ>¤>©>—>Ÿ>¡>¨>H>…>ƒ>™>£>™>¡>‰>£>Ÿ>¢>£>‰>>š>—>¢>;>™>•>>›>>…>‘>¨> >>a>>©> >¤>˜>£>™>—>¡>}>Ÿ>œ>¨>©>£>™>˜>•>Y>£>“>>A>‘>›>«>•>•> > >˜>¡>¥>¡>S>p>¡>˜>“>”>1>˜>¡>£>Ÿ>¥>§> >Ÿ>¡> >œ>ž> >¬>¢>‘>¡>”>¨>> >•>Ÿ>™>>>‘>”>¨>…>›>™>‘> >>£>A>˜>˜>¡>£> >œ>¡>>•>œ>Ÿ>¢>•> >£>>>Ÿ>Ÿ>>™>›>£>‰>©>Ÿ>£>¥>P>›>˜> >˜>>§>£>‡>Ÿ>¡>œ>¡>>“> >Ž>>œ>¡>™>…>­>y>ƒ>˜>Ÿ>£>—>Ÿ>>£>¡> >ˆ>—>¯>¥>I>>…>”>›>E>>>¥>>ž>œ>>›>£>¥>Ÿ>‡> > >£>œ>>™>“>§>>¥>¢>y>{>«>¢>œ>¥>¥> >s> >¡>š>—>¡>©>¨>¡>>›>>‘>`>—>¥>š>›>x>¡>œ>œ>Ÿ>”>ž>œ>¤>£>œ>£>¥>™>¡>Ÿ>¥>A>›>¥>—>£>>k>•>œ>¥>Ÿ>œ>£>Ÿ>p>›>>£>™>>£> >¤>>ƒ>š>—>>“>Ÿ> >—>I>S>¤>­>¤>˜> >«>œ>›>©>•>–>¡>©>•>—>“>Œ>P>ˆ>L>›>›>£>¡>>¢>u>>œ>¡>•>Ÿ>›>L>™>¤>¥>>¡>>>‘>ž>…>›>œ>“>œ>¨>>¡>«>œ>ƒ>¡>£>T> >£>—>›>>•>Ÿ>Ÿ>£>”>—>¨>¡>¨>œ>¦>€>—>œ>™>i>>Ÿ>—>—>¥>“>w>a>”>£> >£> >>¡>§>¤>¨>œ>>L>›>£>>©>œ>¥>¨>¡>¤>¤>k>ƒ>¡>c>™>Ÿ>¡>œ>˜> >¥>¤>š> >¡>¡>˜>•>Ÿ>£>>E>›>—>k>™>>˜>>©>£>Ÿ>Ÿ> >¤>¢>™>“>¡>>š>£>¡>¡>‡>¢>u>˜> >;>™>˜>Ÿ>–>”>X>d>¦>¢>›>€>¡>•>y>«>£>œ> >˜>˜>§>¨>¬>£>¨>¦>¥>›>>‰>Ÿ>”>>¥>>>¤>L>¡> >›>˜> >X>•>—>§>›>˜>>£>•>œ>…>q> >>> >“>>E>¤>‰>“>Y>˜>—>¥>¡>™>œ>›>£>¤>€>`>‰>¡>‘>š>£>>Ÿ>>›>¡>œ>>—>>•>Y>£> >¡>¡>>Ÿ>”>¥>O>“>G>™>Ÿ>“>>¥>‰>™>˜>š>§>œ>›>œ>£>L>Ÿ>>ˆ>£>—>–>—>…>£>¡>£>ƒ>˜>‡>>”>’>£>Ÿ>˜>Ÿ>¥>¥>¢>¤>£>Ÿ>§>”>¡>£>>>Ÿ>©>q>¡>•>˜>˜>—>œ>>Ÿ>œ>•>£>>H>ˆ>§> >”> >£> > >Ÿ>c>¡>œ>¤>¡>£>>>Ÿ>¥>Ÿ>‘>Ÿ>>¥> >„>˜>>¥>Ÿ>œ>¡>™>¥>¡> >Ÿ>ž> >£>£>‘> >H>™>‹>¨>e>Ÿ>£>©>£> >>=>›>¡>˜>§>—>T>œ>d>›>§>—>œ>>¥>¡>>D>«>”>¥>>£>‘> >>]>l>¤>›>G>•>¦>>=>†>>>¤>”>›>> >¤>Ÿ>—>‰>¨>“>Š>€>€>>>°>”>¤>§>¡>> >¤>¥>‡>œ>[>>£>§>”>¡>£>[>«>>˜>£>¡>§>[>£>‘>>£>£>“>¥>>’>Ÿ>£>…>¨>>œ>—>†>œ>›>œ>Ž>¨>œ>˜>>¥>i>—>—>”>¨>–>›>h>¡>”>¥>Ÿ>¡>Ÿ>‡>“>™>>›> >œ>S>—>¡>¡>>{>˜>™>¨>§>>œ>>¡>Ÿ>“>¡>š>ˆ>>¥>>’>•>Œ>§>W>>>S>˜>•>˜>›>¨>>>—>›>›>Ÿ> >>«>Ÿ>œ>…>£>¥>”>>¦>>>—>”>£>™>™>£>¥>W>£>‰>§>›>¡>£>›>¦>Ÿ>¡>X>œ>>˜>§>>œ>Ÿ>•>œ>™>¦>œ>—>—>œ>>¥>™>}>š>£>˜>£>¥>s>Ÿ>›>œ>C>©>˜>ž>>…>˜>Ÿ>>£>Ÿ>•>q>«>¥>W>œ>M>ž>¥>—>>Ÿ> >“>>=>‹>>Ž>œ>‡>™>˜>™>¢>>”>™>›>…>ª>…>>“>§>œ>˜>¤>§>›>¨> >w>œ>¢>¡>¡>‡>P>a>¨>™>‚>›>§>£> >œ>¡>Ÿ>‡>›>•>>>˜>™>Ÿ>¤>£>¡>‹>£>¡>Ÿ>•>>Ÿ>>H>¥> >™>¨>T>¡>©>›>Ÿ>©>£>¡>¡>›>Ÿ>…>—>˜>§>™>¡>>Ÿ>¢>œ> >£>–> >O>>§>ˆ>•>§>{>£>œ>¥>£>‘>›>‘>¤>›>¡>m>¯>§>£>œ>¡>Ÿ>“>T>œ>>¡>˜>>£> >œ>‹>>C>›>¥>œ>•>œ>˜>Ÿ>>•>”>‘>›>£> >P>£>ˆ>“>¢>‹>£>£>>ƒ>ª>£>˜>¥>>¥>œ>>˜>K>š>e>›>§>œ> >>Ÿ>Ÿ>\>>>>¢>t>Ÿ>œ>¡>¢>˜>>>¤>©>œ> >£>•>˜>Ÿ>¡>Ž>>¡>…>™>>¨>›>›>>©>¡>™>>œ>§>™>™>›>¡>™>¡>¡>>˜>¥>œ>…>˜>Ÿ>•>˜>£>¢>—>£>¡>˜>š> >a>‘>¦>¡>>¤>> >œ>Ÿ>Ÿ>¢>•>œ>ˆ>E>”>œ>>£> >¥>¡>Ÿ>>>œ>”>ž>¡>™>™>«>š>¥>ž>™> >•>œ>©>>=>M>›>£>™>§>“>—>˜>£>Ÿ>¡>™>O> >>e>>Ÿ>˜>Ÿ>‘>™>ž>§>¨>š>¥>˜>œ>¤>™>œ>M>©>—>–>™> >‘>\>@>š>¡>œ>€>Œ>G>¡>>¥>¦>˜>‰>>¥>±>£>œ>¥>§>™>˜>—>£>¡>t>—>Ÿ>—>£>…>¥>¡> >™>›>¨>7>Ÿ>¥>>¤>> > >‘>>—>>¢>˜>œ> > >›>™>”>›>•> >¥>Ÿ>ª>œ>˜>£>‘>Œ>Ÿ>Y>>«>¡>£>§>¥>œ>›>—>L>L> >Ÿ>>—>™>™>i>œ>¥>Ÿ>£>]>ˆ>Ÿ>ˆ>¡>‹>›>›>•>”>‘>¥>M>˜>>“>>™> > >–>>>Ÿ>Y>>”>ˆ>¢>¡>¥>u>‘>¥>™>¤>Ÿ>Ÿ>>¥>”>‘>K>•>™>ƒ>™>¥>§>™>™>˜>›>E>›>“>”> >˜>¤>¡>§>™>£>•>>›>œ>…>«>£>—>•>>±>š> >Ÿ>¡>¬>¡>œ>¦>™>¥>•>>I>¥>—>>©>œ>>>£>s>›>œ> >œ>˜>”>‘>>¡>Ÿ> >Ÿ>£>˜>£>¤>›>€> >—>˜>—>>e>›>™>Œ>>>œ>•>«>>¥>£>l>Ÿ>£>Ÿ>š>C>ž>œ> >«> >C> >}>>‘>> >>¥>•>¡>›>¡>œ>…>—>¤>•>¨>¨>¢>>>”>Q>¡>£>©>“>›>™>œ>Ÿ>¡>s>W>€>G>_> >>¢>¡>œ>¥>›>£>¡>›>Ÿ>§>¡>§>š>£>¡>¡>¥>ž> >¡>¢>¡>>>¡>>‡>¡>œ>“>¥>]>˜>—>¬>™>™>—>Ÿ>>>¡>{>£>Y>E>‹>ž>¥>œ>¤>}>œ>¢>”>e>Ÿ>£>¤>¡>¡>q>¯>”>›>˜>¡>›>>¤>Ÿ>«>>¡>—>£>—>P>”> >¡>u>¥>œ>£>Ÿ>}>œ>©>O>“>œ>œ>œ>¯>‘>¨>Œ>—>›>§>Ÿ>§>Ÿ>›>©>¥>œ>©>—>Š>›> >˜> >…>œ>C>¥>¥> >œ>>—>>›>”>™>£>›>£>œ>>Ÿ>P>¢>˜>Ÿ>¤>™>S>£>> >˜>>©>u>š>¤>˜>§>œ>}>¡>©>>›>p>¡>”>¡>˜>Ÿ>‘>¡>¡>>¤>¡>š>›>”>”>¤>œ>˜>¡>š>Œ>˜>¨>›>˜>£>Ÿ>¥>Ÿ>™> >—>£>> >>§>>§>’>¡>¡>>˜>‰>—>Ÿ>>>¤>˜>š>>>›>Ÿ>›> >“>—>‘>¥>©>}>¥>”>—>ž>“> >£>š>¨>¢>¨>˜>¡>P>™>}> >>¤> >¢>—>Ÿ>•>—>©> >£>8>™> >y> >Ÿ>˜>ƒ> >£>K>˜>I=˜>¡> >£>>£>p>£>¥>¡>œ>˜>¦>>–>¤>˜>£>Ÿ>€>ž>¡>>™> >‘>¡> >Ÿ>‰>•> >š>•>k>=>—>…>Ÿ>‘> \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/.zarray b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..e6874b83f85774045985c961f575e7623cfa812d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/.zarray @@ -0,0 +1,18 @@ +{ + "chunks": [ + 1, + 3584, + 4096 + ], + "compressor": null, + "dtype": "bfloat16", + "fill_value": null, + "filters": null, + "order": "C", + "shape": [ + 32, + 28672, + 4096 + ], + "zarr_format": 2 +} \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..605f15abb3d6fb10c577e22d33cc6dbbe99725cc --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f0f00e6b8ca8032dcaa659c8f44513432f8d46a1c4a0ac50325bd2ce9ef621 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..8a671c1bead026a3cd08a201216c9362d1f24c84 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84eecb21b96310582073cc831fab0441d4296e39fe378d81f4c643cae2967dc2 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..388086f7d9701f74709c12c0871184ffab7e5b55 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631244d602d1446b9e456502a682a36f5591a9be13415b463a1793b5dfa72f0e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d184ba333032ffe60156519ab8c20b0fd81de887 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d9982631998b9005f3c4d305eb4c57db032ebfef1640569c3a1816b094aa17 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..156bfeb8794b51705646d4154df0700df3b49b5a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ee26d1bddaba0fb9a6987d0f825071222881a0bc39903cba752d42cdf617ab1 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..c5aaa1348d5303210de7bf2dd2ca8929dfc8843f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:218378024a2fa5d7681b986068925ab5b1c6609a6683a7cdbc30476213634e21 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..3be03bf35768ffd1b43930593cc5c90b6de2abe5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb390de220f9c6ecdfd4f3ea1ef4560efc0f27549a31e19920ce4b28204bdcb +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..b6078dc72cf58cdeccc74f404639a3bad07eb045 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/0.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f614014a594d23e65ccd3495620780984ea7f97208d3b01ce7190fa7fdd9310 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..bd32bb6a59ca8489e81bc05fe356808d0c0eea47 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c60dcc0cf1c99ce50018351a1c197bd79e7c18046bcbb619dd8d0d2ae4e25c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..cdf8cd610577951edd59faf6c7b4ecca9bf44f79 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50e9b931cd7bb8119f84a9777f98067054c0b7da82b3b7e4bc9f374a8890b7e1 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d07a0c6ba4ff4a59a76b355888f6fab2614c0064 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d6a580d69fbffdb3de183551b5f638a928d9f8c8ba5b02c76a7a9209a2e367 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..d59ac656e595c454b47a46dd377e651f0e34d634 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b00bcf3d0459efc6a36a5fbd513cca7e90a6a48cd0859263237f92e47322196 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..248a779088e5573625787f21a9eed8845a85aadd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d27876321e19b4156880e09072c1d7e6559164e086aa78e6513491444670760 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..beaa4074ebea1e10fd264ce34cf37d5e4ce2dfe7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d73f494d5efe74430efde333695ad4180992773ad60fc1ed3c2b85432e8d2b06 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..3b08d989a98b7eae62059e24e33443c37a17ef66 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f4da6b04f39245e0a01a0688aacc0acb329d53013995f5091084e1d554fc6f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..1e9814d6fed6d42d5f0ce9017d4e66209365dad9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/1.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb5d54cd95260a71e4e42ebf31abb238d2eeaa48d8f78639f16ed75c12310579 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..bc231ef8278650f6e74b4cae35a55788cd8876aa --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f2b7f8b730e37eeb40d5558e142de6feed27a889ab324f5378741d118b85f0f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..625230257ec555052deb87304c2df8055ff150e0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aac5e5840072e2e2db9fee05e5c71106cfa1879cb557090a3d0a5bbe146270f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c0aae7e11eb90bde80ffd34ec9eeb9cccca0bb5d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2a8fb941d31fbd273b742acd15f059d1225a79dd6741fa0130ae4a69537ef97 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..be15447622a648f0bb238f5a7c9d53acf60d6f5f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5adf4446ec710b763d497c3ecb83e63d389e1e430536db849fbacc46aab78de3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..8db5dff0d3daa5ec56702aa4d53ae30529a82b5d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b889ead3692a6980b77850f18f04063f0a70526ba47ca85c21c3a8e8f7550558 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..fd053ccb47cfe17bd07f54e2fbb25385a9e449b9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70126136f46216a7d3b1805a6202a97406799e7fe08f8774af404b66850ba314 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..4d9ce48ccc54392136c3ecb44d7f99d054497904 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fbff5eec97dccfa433c3b29a383792ed0427f52603021bfd0560356096c39fc +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..665a355ce59b2803a7107ad7a3535182b7911fa4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/10.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:720544c46ac543c8e882ad7757dafbe14813efc44cbb04bc8054822581837459 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..368fd8b7fe4fe9ce3655d9856dda6c9bdfba2bdb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d63936200df5f862d5d3625c5fe071ac52258a5f0831322a765ed729cda586 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..758280c681ec70f6721495c64e431c2a0256fd80 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b890a45e91a0ed1ddc4a8155b6805f72c29550c305f8a286b888b16228be3440 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..2387cd8775cbf435de94a531c4273e6ff16cd0c8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2a6e5e88227220646fb7f7fdb277ca72da9dc9409f2b898ec0731ef5a309c77 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6dad40465bfb9e0ea47aa111e082cb1e74e908f8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60324b6e726c4839e0ebba54310c6dfc00a2f86e095535a9eea98cc12960cf9b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..04c2de74a79d5246dd31db9285018db1c33c2438 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d38a79af49bb192fb4a312b1a80696e31fd9702b43c335d9a6ecb11b3121d69 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..2e435bb27cf9994e7640f058079c1be43898ee5c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71574031e43e6f32d93c1b04d355459941d10d1797945359fdbf3048259e6948 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..f5b2ed70e2e00d5482f917754e191f9e6380ab33 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f0abff9b0e014a9f5cf407827254a3034b26a5b739c1581e91af47c06e1e58 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..92fcb2ebb0f712954046644f8483b47a8131c51d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/11.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b8c4dc443794ef5a00df55ca6223c975e7ba022261c096b9c508baab549625d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..609e4d14f3c8e5ddac91580611966ce0ab37fb87 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0feb4e3a1c2036de32d32469d3adb6e7c4efca0510e6af07f7cdc704207f69c2 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..7975b2a68be6dabf9a2d3fe7485bd133f30de3d4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b01341f3d85f9b372c92b6895200d261633e659f714cff7b8c0d6bec37f66f46 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..60313072c9603b5b575fd78d27a84b8ba196f70d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4579324090847be44fd5993d58dff4151f996296629a3d0d25060201caf2610b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..f2ccd7d5fa00dd80819aaac80a5fe9f9e36d4758 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a60b5f1d06e8008cbab50e98f33b3d9eaf5a986a93892cb6352d97cd06c73f99 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..08a917b1ea769b166ceb68639c60338dc6de5c63 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53257c4ccb81e05ff933e3522d7421756358079ebb7ecbdcca0d1fdeb3194d0c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..7d118f03f889ecac18b5d0403412e8b7ab12402b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c4ae5117cf09cfd3f50260775dbfd3ad232dc0eb311b2e5621e42a759fe51e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..dafbf012875b4c9664210836a00d6596d87397e6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27312e1db30399c3446417a189acf8101e09004d79fb051d62c277387d1f518 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..b2f74806a36fe282625ed5458810cb88207cac07 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/12.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55367e1a9a5e74cc5a21aa201dbdbe4b291d70ba5f56d4c63de8d9f84ed9f7be +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c5c4e41f244c6521d258f7b09ae54d12a66959f1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66bfc3521b9d0fbda841a5c6435a398e01bc97e33a4343ff19b0c94b24004121 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b9ef99aeec1e799e8296ee1ccccee3df6e7b7a87 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73144a650a0794524bc734aff015fc9918d1977f238d839b25b2074ee089791a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..08ffad11840226ffbb3ece9d78ba23bd7a58265e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:393a0dbced3c39f423b570d7c4abd3e585961f4f6c36a68777d70b70448985ab +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8614f23893c9de0b1cf7382fe86d247d92594fd5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f96747ec3899af09ba7eb23e82c89d8ac1efb6c1b0cbf4a40b5c71a27d803a46 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..075cf3b4864d9a173dcf0935390f459673da323b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75fc25aefa460dba592c8d1a56fdc975f6bd57be730252dfa4083c9b9d75971b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..2785f04255765126efc6f8e6a7d9106491d8202c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:447452d56db88012370f861ad0cd4e208b68e1d5235168ac7a2cf7e3f680fa11 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..4cba194033a66058c58903e8a316d391c1fc3e17 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39bc36954d9b6133af7d93e98e58e08191721cbd1de077bf7f7fb4d1a388d783 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..33e3637c7fbd2500d36e3c7720270e8900bdb06d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/13.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a74f975d34f46ca72ce8d3f6a095f75f392457c54ecd87f8395ebdd09498e69 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5073790c5bc92a21f2a2e187d3c8b114a4bb8663 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b0095197c589051bcad30ccdaac9366f1d835b615a03db03b9904bd4b1d7c35 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0eb4628f19f846ca0e2ab464e9ddb6a611570118 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a54054a0def084093d15de0adcca77cce7924de76e2e12b12a2858c19f17db63 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..95a9531ab51c298b80bf2e604280b10a35c2b996 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b192bec931e34c4e237304c346ac06ce06495d266b79b4b055ecfd3acf5e27f9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1ae1a402486109532bd4dd88c3e8b00e66133f41 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0393f4bce1792df8a19e6d600e06f84e049ab866463bd9c69b787bf2c14875 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..080bb40a2425cebacaf33b8e354fd3e0b9e1d5da --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0378885a359a54718dedc26fc0078e33207411a571d69521cadc53dcb6ffa7cc +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..4a9290a195bc46856a8f663ba0264124f56aea30 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d95957962f0e389aecfa7af4044fc428ab7c36af7d74b7a14e24bf401c4d0e54 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..37930987bdadbda7e994611a9ec42f7a6ee94e6f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19594a142a4c37b8d4400cfe394229d8b806c47f7540dc750eb2984d72f4f430 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..e21a828e453948425fccd739f82bb31bff415a49 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/14.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b448a799caad0419ed2170629401a41669119d1c035791d29379992768a3b2a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..cc274812abb5ad5d874f3b7ad22df0fb5dc94cb9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c381b0157f3577a18bdf14b24f2aacbe35f1faef5bcdc678fb37786f85070f5f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f673ac204cc91fa242cc13bf960938903ff8ec8a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8065978b0c0cc5ebf02cd9ca00f4d350bd0777e91662b76da930e7e64b38e5fd +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..59370c5c23ef7fc4ded7034b467044d9a15da4c1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d37ef110827237485fc4e8e1a763c399313347e9e4ca65ed37db64c941f97a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9142f9540dcdbab99a1b740b94de219bd9591791 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab3792e22be571a1ecf65522781aa02f8a02453f00b03a9452dc6dcf2b50b614 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..2590f73527b6f408c5b7191418e3adb5b0d012b2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:997931d92a265f0904062fde5ce8bbdfffd580871c9af6726f6a094b267e1250 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..94cca2aa8133c20ad589d232cd14cb528910a9e6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecfbe7b2d42574ae641f585ed6e2eaaa6ef9dcc1014458600caea36785c36ca3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..c12e253a18385f7fef0aaa86f839174dff40c6b5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00c371bb271f40fa05f584ff1a991e70e03ecc152a7810a95520928f01500d7d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..de06898873ad931ef17c16b07f8f2d5dc94c5bcc --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/15.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfb5009dcdca46f8fa09f181c3c3a131caf5370462a8526b456983819a7eef10 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4fef304e43a92d5bc449c9c9ddae90dc9aaa7a2f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04ed486ae142380cb7aaa917f953bb3bd29a97bc3e21c19eb5e62d79cb573ff0 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1f8d82e1ab8a98f0936a76e7f09497d6762d88f9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd2825109b498f4ac4cbcc3460d91936de1a12a6a80bd376b0cf36175d45687c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c0f1e36d198a56e325cab6ff0ec29c7373be607b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96b4733e86f51c15364d0aa5b4f36250bf1c176411a467aca89cc60184ac5b8e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1832e5ecf5ec37d53405014db88c9e08153147d8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:decf53221e793e1280be87f823d8f0f4b2c0e5422884e43fc866092825c945a6 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..a359ea6b3848ed95984c7093f60567b9e0d50b34 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b63e738dee8f8692a9125e131b07a96b0a7f3b8ae5487159339b35678375e1b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..77fa1090c4fb90ad3ee281b019278224110459af --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e79a955058abb38581cfbb918065120e09840261f005ecf0c9c178c682971402 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..5694055e15791528d5d66d75b7d3645b7b314d12 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea90491a0f1fa358362e8f5a47413ea8853709070ad4867f672c29c19b48a4d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..f7f81871d504ba28b15dac08f5552c2666e6c8ff --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/16.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b348a0e10b8bd26bc8b828cbaa1e5787c4b3ff52205ba0ab662ded09b109c14 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..7ee829612293a74f01f7a6156626b06842ee816f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c3dab6f0b42070ec1c5cbfd66253a78beee674c4b1b9d3a3eb4b25a2c93097 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..6f13ca89c4cac817b8d787e2107174691605011e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ba3562479ea28d86a6dd7ebcac07ab6c1b0964f143020a298b0e83e9c7b6aa1 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9b92df8d8babee26cc471797ee0c5462ea75d87c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:935cc8e36e0b248282172efcd87cba9f62ae7e9ede7aa8303db03499eb3b48ec +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..46c82e77b6aaeb71043127322ee3634fea91f1d5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45ce78842670619c41725451c41579e9b2cee7ecbf1a89ddf1f92bfd6da46351 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..cb4eb2ac48817094da1f5a01194b43d65a82ad77 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b0123f3e44348dcbc8f993852f40f3dcb04200b9e744744972f690a90bcaa85 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..4b128dfd861785ffa31bb9f2e4ff92afbe2224d7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10c8480f560d8765c00fae1b44ecf14ca85c05b9c3e6522976b2eec8c42293df +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..ce8bb94f84aa82e21138eadf8fa3586e2ae1e383 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fa3e58a3f20d6d464d0e1fd54c8d0cc057031ed230d2c842f15d0e565c2101f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..c56c2749d3d5a0d23b0901db6cc35e0b51aae760 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/17.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:554a91494631d014fabc8de70c111fcf54dd71726c9d51f3a9910a077d5bc840 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8eb90774c379130b0024ffbb29920aaaf53846ab --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8064a77c415eefea7569793a121136aa3580b36c70c37a61601fd76b9fc14985 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f3a4c1ec891f8a2406fca3733ac08ff636e1cca3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49253f03b2b2922a7fef4130589b3b2db331cb288871fd6b3b0d35f4fec9e27 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..0fb8291a199fce2cd303cc102d09d2f4962399b5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33ad7994ab2a56e962ee087744d1704c25d534330421a4043860aa663853c588 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..f42747d2e69e38a8bf60e8f82416910a9cc5ed02 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc4f987dfbf91e6581a2a7a6d6716b925edacbfaa78077abd6eef9dcf4d66606 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..826fd54b44306fbd5378e713734d914a8390dfa5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08df5b2c2f03142ef478ecddcda91e59f82dc471919235c87245447ff19c9e3b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..519e988323e54c8988c24ed357aa5e37bd550b66 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fcab89b049adf3fdb50cc2d91c172d530bd64879ca205aebe56e2d2bfa9db36 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..3df735e7bc4510e26a67aaf3624fa318283c29bb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d3d43b0a5e94eefae384fdad2414bb9250ca5688284514c6d95e4f18b93068 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..633a5a228fb3b427df3745087a9da32cbe284cd7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/18.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:173b7bffeee0c9e917e84dc49fb5cc6f3d20b5584993c18845329a516db40dde +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8cce60ccc75d53414b40020b072f0d56f93d5319 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80a9950f5fff73c0b878c03595469d69f8f248ac51edd92f69563e804ac8931b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b0c2b688a4a4117244a460187d54302b4c61cc5a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3a990959edb6aee76b24a052c4e4d9caada2ecb70adede688cd1d7acc6a6148 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b935a5efbe68bbdb638094a8b8947e92b02d3c9b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75958fd1a116dff7f48818b702b0e6051abfbbbe8459610ff2e266f6054fe419 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..ac8fc5cb8e55da98254fad4d1a57e7c293611966 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9c72993450b61c6615ea3a9ef8205d0eebd445d7449b82c6e69df9ba6d64770 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..e4fd7b34323ba02f49fb737119f713c45263b891 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da7a7c8a60f76f06cf248298d1c3628b288d816f2350ef8ae49f00dea917ef5 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..d28e503e9fb9091e717aca3fa03a45ba5c0aad6c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ddc94382a350d10a684fdfb5e455b12104474927a9dbac8810447efe53320b3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..55c2c08680999d64e7ec53ab74053811900bdabb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0675f34b0da06e41b2d0b06ec8085e569e6afc0f3c30311a554450b593bfefd +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..3c0f27a8256ce6c8df573fdf87330a83b3d625fd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/19.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050339c2895347248c94e74fc13bb1cf646c53ed9987d88169d636a6b3c5778c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a7c15dfbe3abfb940c4cd54e3cebdf8d271658e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f1585f865e639d6ac6b2e7b459c2de37615bfba529fd2c9f1e16a897acd06e4 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d4cd527c6ba814334d4a31e6d3743228295ae838 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd4f004c872a9535da8ecd347f2c8d3b517b2857eb7ffab2eaa6c3f1b3308c24 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..75db9beaf4d3682e5108e0d3339243c5d789915b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31c5503709634bdc3a301f679c797dc15cd0a02a4bf3c400d43cb6ab9a71b6f3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a378779fceb6df892920afe2c1871731e566ead1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88f1b8e99575976134fbd05bcf19653f23b1856c3736c08f115727e5216b665d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..83021497d45d011e2856d2c69cfaa29ba6c659db --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bc04b38ca613f52e187d9afc483edd12031819b9fb4a46c70b768dfb269cc50 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..296d1cc7afe742314d07f051e90b9fe7de335812 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:201c443f3b57cd08de84229fae2e47fb05a2a58350025b9b37e66949a35c6ebf +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..ed890d577221bcf47f56627d77049036910a687a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0822302dc52ec018bfad8641007404a8a99a244232583370bbb81d3a03c433e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..61003a4277409df414de063f72eb24fcda5f9352 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/2.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6478604b00873feffcb0ad118ac48aa84f8ef03c175e8ba2f2d042fdc44215dd +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..296fd3de277a9116abd0dfc68e524c9c7fbe6bb7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d3ee1126c00a676acb6586b3c8a998fa225aca8e6a5b3f8887f9a0de2701054 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c5f14a070abc259117df7142f55c53a02801d00c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69f19690352366f993147a983497406e580be8d3160125a32d83c08cfe1e07dc +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1c0b4ecccbe350642c81822ef1d165c579d1e19d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7b6d0c203d6b8f56cd14d47ad3e6ddaf41b1b4e6ed627c6f28175fe907a890 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8991d9df3f961af37befad130d5551738bba1dc0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c754b3187edd7715038fb5b4ea2b1278e40bcb75aec6b0f8fe4564f3f96e1482 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..7c052306aefcf18d3191c6d96deee3f267e4773e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af57237707ace7df1ff9c528494799b195dd1441106ea90c51f7b7eeabaea00e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..fc882d88eff016681b91d7fa4886ba8b91b0d07e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11a7f325a44f1034df2f97216f058ba03d5eed6dad92cf6c9c322ff9b2e2894 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..4badfb5d5db58484b65903698a5c2135589dcbc3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9a3e82d2a583692039843c057ea08e7e07c474472879eb4e18d80f3528ae95d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..4f8495289c0c4901dec2212d7d8e0744d4eab15c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/20.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16cc8dab57ff336377551b24473e26f425266d98ac4685dfcdfbc41df3fb5dab +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c151d30549c440ebe3b7772f3cc069cb891026ad --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7287387927fdb1746a90741bbbf679bbead234cf6bfc11f4c66f41efe15d6f7 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a4555a594ad1629fd9b96fcdb676cf1241aa6880 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df709c42f279b011d19e338a3e3619cce34032711b7ecba6ad23d00645c5cb9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d020ac9ef2f119e7bc8b829a6db506217554a32c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d42a1f421830d23f6de32dc9ed4bc61457326fffecfa0994ae9b93b96ddc07 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..95b4500fb4f26230ee186f2c192fb39c7a147517 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:721a66a70325b8732edc5aa398b38954e80a73963dea0bac4cc89b007b2e6652 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..600e4061f7046d895c3b0140159d268f9d83645d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a04117b3e2d6ea896a1aadbca8ff40d1525ca5da4b63607404c2260e51f07738 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..025aacec111ad5ad249bbf7fa3634748da063f37 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3befac0f34871a20e6a114a7ab018e9de0b240073b28faf6e9a8ef43c5792e4a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..e1685f727c631da1ab94fbcd09c7940637f189a2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93392d207d12143ff881f2db4552c6740d0a737c43dc6a6a14974db5d85e301c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..414d3da5d7b3b8db97b37a567b0564bdb8363e33 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/21.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9406d445d75ad3bb3a6a4bd5bc44f792a6527e0b4d48049d94fd9b73eecc051 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..cc89bad0a0af4ceac6490e4d079cbeb9ca6b30d8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1336b532c09bbfb045f3177d0e91ebb140ad644a8cbc72530e94ccefef43d36b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e09eadea2584e02780a9d8961efc17566ebedeef --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44f0c8f59c0f8f705bcf8e98ff4d2a76a3d9ee517e08742441bf47d72e21bf22 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..22264c990fba107038a28e28f69c1cacd217f9a3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d3820e46dcfeddddcc0aa90efe27d8e575391d8464d544d92edd6c02d3a96c8 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..7f0021a91baf151ade34e1636927610ba0affb36 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03ce4bfdbbb51e72f5d7a1107ff3bbc90bf0104cb6715589abd073ce40e2dcf8 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..9cfd8a1278a0e7de0626289d8a671343fa90224f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40ada770c95795050ded4ccc28a9836e71607378cb3dc09e40bf7bcece9b527b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..aebc625af5f7e5c6f35234cdd418a1cca651f110 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4915eced00ae315f05bca31db336486b39e109666b535fa6f6d1de8754db747 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..408df532a1912f2dcb021cfa8e6affa9f8d45749 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8ac06213c00948ab8a3035c6d65ac344bb5713dc77c914b4715b0a478f1693 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..dc1960e2468eef113c12ec0394ce00ccbe6f2423 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/22.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e812e571fb4d0bc0a2722a3f3787dff7bc0c8c95eb797d7ffbb39da3a1d8fab +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..6a6b9285a9c1d0f08641bc4d79dda2e4e34cd86c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc399a70599df31d2ec6c7938a86bdcb22a2a5d218acb3a6a3c64e370a805874 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b754e9d4f5f7f80c5c9b187885735e14457a9768 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5941119bf62f4f2141dbcb86853044a4176847116f345438506b4101d932f711 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..730b0060b8049da7186452ac5f8417eeac81de0f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b03056dd1d4e56a4507f36a792af52174d0cafdb28a0fff3421d7ef5afb1b75b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..3b9bbd78dcd36641635a2d192461b79906e12338 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22a87025de1807dd71fa5b956f3ac3457fad1e3d4a1113964bb678c70c2be8ce +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..efdda4c3145968a12dbd7b2fba786080fdca86a3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:493c755d520ed551caff31dd8141797dc23dc582ac465a8a5f493b8182f397cd +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..764b737ea8014bb5050a17238e9ae563fe6f683f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d12779379712e322595acc17051ae4e1cd758ee07a8703b753bb7e4961a2e29 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..d01344a920b9547d780425babf64e80efbc1de8b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e4d67e8c6dd832d4c8c4d322c6b1d402a12e2cacc16a1624feb5b6c5d16c62c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..13857c8df6c4feb0058c82d4c70e38d3d5914df0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/23.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b54d9900c547108b08bebbb42a1263208a8cee370eac9acfd3670692eb00d44 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..dbd5bec2c3a053452aeb14185d3a575ee9e85228 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9476872b9edcbb4c34e0cbad9788b7dbeebb6f2ea059a8f8c4308627ed63e1ab +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..3470344ffc97594fed3370ee382bb6f731a3da16 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4536778727992d023f25cfbe5fe75b0d73a4b58cbca3468766d89d8f22943d3e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1fe3f483986f31cff73cd338b0ea983cbd67bf95 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5caeeb1fe14b16792b4f7db4a038df30670c8627bb5f88f8b59f94fc51d7544c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..8f47735d80ecf1b9d8cd28c10c5ab0b8d5b94ce3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8b4923ad9f8e37f74220545b88441b00510b8e44b7c75c53c4fea934c1f4203 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..451aeb83bc3f5928339b559b1dcf371e2a230cbd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ea53e264f504dac33d016d917bb7b2b91e31ec62451c388519f8f61352b231 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..f475a960ceb543984d303b8f5765e2903843ae0a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7262dfd79eaeed3b8dc51aa4ddced9210673aaf41f96542a2c7fe3936c2e83c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..2eb69d4787a89a9e4609ebe2b7296e27b141581f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b81c105f44e7ccbbc07500abfa28b97eed768fb5ff6a1f6ef8c31142666d111 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..cc87eebb4a780fdb91e9a16b6b6f816f9b33c8f4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/24.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4f7780046e0f77391ef9dc4474432c4800f66a64dbe5f32cdbb29cf6b1e66e0 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ddd90053206ae01c00c2bc9d37b00a11f287cd21 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b127868db29a3b05aeeaf475c8d94e2b08e9bd0c79347ec809328a16155dc6f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..92c8917c572f578c9d2a46c6b3c1a5ecb11d5c3a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2513a4e5d1ed5de8ada8cd0f0c4684abdd7de39c6b5194dc52b97b3cc48b34b1 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..2db5713328ed2914e27f3d25ca1e92c809005dad --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00c1c825010b2a5cea326f1c4458d1789e65049bc8e085516b251edce39b0a0a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..c1e711c72a52534469eb06d703b3a97c413c0a4a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a97a3379a8b18a73c1d62261d4c6c0db234dcb43783a136b4d583227285c5df +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..d5a441c3acbc16db08c71ffdca8b15a052472bf0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc08d5176c2d652e6ea80e0766f08eb5aa4aec6abac308b7dd5b2b81b42c5c73 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..b4244cfdf8ec7750df3952abac3394a6c1664c39 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfac85b6763905ecd2ee5c221eada53dd0e68e8f4c7d12f63e6d771c37aae3ed +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..3dba53b37755546e7cdb1b9ef92dbeb1c278f2f3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfd7512799ed7bc815060f730f9877ceb7e5b176394f656bcc9a56eec5ee4e7a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..7d9fdebd09e78786eb5c6b97f33b8ecaa0efcc28 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/25.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2536e584b3aacbc988702cc6346e5b387012328f905a2c1b957321cd8afb88d8 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..30a4a44c9c6427874db072bfe597b018cf04d422 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:553d67a1c78d0e6e87343a111e47f183bfeb7557bb999400232b9f99dcece802 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..5c11e5a51482c1b538ecd3f2bba1eecae9c85124 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f91d003de850b47917a8b2d030e0cdde72f05909795e7996af2c3b0a96ef7ad3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..f740c472371104541724f3da35238fa82a458165 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb02c6fdd24c5705e20072aed9fef2517291af613f8f3442598cca46b7734c54 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..735355dd76239a093be84be4be0907295368bf59 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10981cc427fcbe3e97e5ad222863a7796a2a30dbfb0af6bcc47dd53b595d2e29 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..74e39426153138f82914a8c5dbd637254291a818 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7be07ba1a7e896458dcd5eb4c803a3ff68b95921b082f4ccbda4b4443a558d9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..236cacb4cb2a0e61501b10241ae6c381a2166aae --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fd6aa6e031fc10932d86b42886511ce30afa33a35dca1dc04132d4ce4bc0952 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..29eeecbac5916b43324564ecb5b2ba9cb8d09b88 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9424c3eb17eb72509a1a93e02e6ac16be317184a64d037e46b4697d3f8b99f8a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..f46a16540fdf82d4817503097d41bd2ecf26648d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/26.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3560145d83fa1694f2bc7c427bf3358caa7330c3adf04f6a03f28490d1f77043 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a558f2f66f9805a521ba0b62e06a9a980297d42c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b08e8635217387407b814f3c9eb8a2e8efae01e1a73ec8e9a2cdc21a35b881 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..23b92872dedfb9710a7870e4ee811d4044a64d23 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f3fc0649e2bac41bdac7c74ea289d5458365fab15474f2c35da733e92a8f0c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..31d50141693bb78931bd7228ed88f69f907d89bf --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c4adfc7b082ed9f23d889aa3b394bd0213d7d0f4e07b7d82bc8ddcb52039c44 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..cec819ec715cc487441985a63b23e3d3f9272942 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b063511238d7ee71d153f5ee4fcf34238d0f10c94d5c2d0b7f03f3578abf865 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..67f92348fccd3c36c1546ae3777739dc64c7415d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b74c2b18ca5ea1216d5d0692675c80c859c458fb3b7206647225e811c7c189d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..de44e0b97ed3055864b65c8c5481dbe298fc8a67 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb339cc1ee3559c68578cb2378f677569bb04936351604e22bce289dab2e845f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..e25eecc2de2887996a111ef0bdc28487a8ce7593 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d96228d213fef666d2167a3dcd680eb740c5b9a2eb6b9f5627ff5c9f1498e2d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..34f687eb6ee80db40051730215389f572e7e6f84 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/27.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f25359c28e9fe5d0aa33e1c6cfc3dad8de8ffa6c5c3cf595369b73d07bce6c3a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fa4781581cf8a4f64f1fe03856d6ccf2ff13b926 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a33943ce1884cbbc20d212c06f66a3b95e1ab9d1362403d99d6bc8818cd44237 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..8fda5b86f460f53a846650a8d85f24a5af1dcf9e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89e115efae176b8f1508e459f5938c04824e8105d5a265df94a94b0818708f8a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..e8f5c7a7a205b56fb2850ba2c4b868efcad77236 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a12eb733fb287e4032d90199c787dd2483d338fde0d75588fe4f6eb7bb3b7ec +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1bf18490804493043926092a17366e80508a195b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb01502d6e6b8d28161d62423aec3faffc92f6ed9558af43bce1f10f4296e653 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..16d9a590948b85cc85a82730f3be9fa3d628d717 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:059f7f3915cc940214d677d66572508451f80fccc8d3d30384a7fddc5fbd7e51 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..e48702d2326b11c52b02b0f32d36b29d5b1d242d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:756b1db7954d15040c58d40893bc07cb8af4559d11017607e111afe60a8e4303 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..9c3c964f8b73f077c498c2302970314ad3f10d05 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f40eb7628d3ce0cbdaaac12e4689cc3a1fae0558d239ff7babfa921485cd953b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..85390a3ddcadaebec31e125159ed331f23b7e42d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/28.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a5fbb6e932148090890f28621d57870cc61c51654bf45b1e95bcb19532c80ba +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..59a873ea5815715ad4b4b64402cc08c8cc4faed6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a5c06b79a684c0a7e1d0131fa2bdde592152bc33f58a234be5d8df6e45a04d4 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..3806c2acc71448a408fbaf7fe35a46068278c093 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ae2655cec81658543016e027fbdfa360a3aaf4603e685b944dfb0ed3394c42f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..888334b0d68ca00b6beeed6cd19157c464845945 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf4394d23e01d8b1761f6d89fed55414b623f4a8146e97b5e278e8c3e3f8727 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..057d82530a1fcce9b08f74ecbc8ac268339c90ed --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b24662e5808b7925091b68ab511db19f1121b62a80c12050eb96820ff9567f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a5d4161fcb0040a14a50e2611ab207104ecdceb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:048f1e0660abdaccd00c8056fd7c7444c14e9f83f56407f4a40fe933dbf170b9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..e7c89d8f76fb836b8cb873d64b6320a0ccc7b28e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:957b7476b530a81a03f1f0e5f60e72e7778f895b7bea1d982ba117cbcbdda102 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..1522286100e960f0b5a3f200510b4cc297ac0eef --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36e7f8bdfacaf767abe09706fafbbd377f7293226105b38edf5d8cf81b6e87bb +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..85a0d699f908a12c211475ef9bdebf949ebb9bb3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/29.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96ed7c56d855b25cce87f0066125b3145bd26afae6db645cdec71143d3ed1cd8 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2e4de3797d789c459e44bc32fad799ded79cc294 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61418b80726a682c271d88427cb8a0414bf7b66fedbec3c5458136345459b747 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2370dc325fa646495e3b61f2ef526bd3e7954034 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a091c4796b7f9bd6a06e2e74b17b01c65d9cea935791f65b8cbbf85c6a3a0c2d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..833f5de11d6926efc8d56fa733e4bfd62c7aa3ad --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bb2bf656678cc45ff06ac6c69f45dc80cb86e23c0235c678e5147f2ee9fc824 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a87f4a2ebf9f63097d7b76667aa1fd597b1e199e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa8bd2adddf83a6c1f01e37035103864a36703a3ef81b90e0857bf1c63b0bca7 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..e60a49d52bd48304631dc770b8dc64601f94e4fb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a878f363ce8783a9e74876f3715abf92298fdacf1ce96a4c411f75a6f3c84aec +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..e69e5b5b91d597e201f8b0ff2df32b03b4e57fec --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de62dd4e5f1b070a85d033a061a1513048ab18bf286405d3e8f49322e9083573 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..d1db64835f0aab662fb3d966dde69a6ad6ec86b1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf327f519862642ff3443181662b8d0403faa80e1b3da27318c20cd75aa4910f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..cfc234ea7d6ada5c496c5cc24866cad9067966e3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/3.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6901c387bad0fdd4d7ccbe481b5ea6ef4e038064b4f1ba7e23a1e253de0d72f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..461e0f0288bb3e7bed8cc683fd4fc8410679a1a7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ebf95d435c954568f4983c9c2f6bbddd115c69f64aec7d98e7b587247437a3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..5f3003796c58f461efe6095cf805a4bca52d07c3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec0075920a357d897a475a44ed9a6b6732e9e222cd41e64f40c34de82686660a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d699b80f4b718487656d813a9140582d4670aeba --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f09ea516961a6a798004e912f6583d9240c822e3773e8074a15b31540767a4e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..5ce2b3d2f205de87988ed2588bc5972cd9e2b715 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80292024f256eeb4783dff35e086dace09194dfacb6ef5358a113928d014d988 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..d40d17157990d041d4e78cf75092c4702503cd1c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3af98e854ab8b822aaa4ac0403544f208229b8cdb0a27c767fb9fcc14203690a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..ddeabc56bd9056e2af40a90b06e26f704853b0c5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d08a187ecf4266c03b0aea6b45787f50ada7ee2249f9daebaddcb74b527912b3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a9f6cb1b79c1c7d39c10e06b0358d8beec0ab22 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2616d917d428fe44b2c8bd86a976f5c16b3668ab4de529d8526856adbec4f46a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..db43df5557685de189754c7eaf296888f5fc4181 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/30.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dbe598f1f6862e5339703dc89f8e449eac4c15ac57def459f4502ba7612cbad +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c6544b8179e70049eeb2fb0dc0441a24eef9784d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa1f3fc96d237e47cd80e1031fd08a7387555408b1196d1d643679908cf1edf4 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..45feb97a6509ea2340d03179a8e9ae896e1a281b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcbfd51da2768c2c733da45a90d9524519671a7cad73b1807a0eac5730ac0ccb +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8f96af883e2f677a0b403e00c25baa6c905a5986 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1574e6558605bc3d3456c9adba5085977e07bbc58080ff8fa3014cede0a3e8ad +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..2cb77a458b2230f123e2a5f1ada4304e534c2e6b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0528555a93efca8ca654e8411bebf8356cab070744deb9aa7c6a27b1992aac0 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..14c06c5d5d1a875614b3c0c0e217376290a991e2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46feaf71343dc8c6456e7865340a341107bda4f5454483cd5b058a637b490366 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..d87d931823239d338bec07cde3d23ef8bbed4d39 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27722e9fe8e63e83ec0547f4e3e0cc260cbcf68bd9b042a9b1875946b35e01b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..a40274fa94257028678b61c4b3d8ecf6d5d75772 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:132058820195ee18104ef40beee17465a4f7b4d67ac1706791ab2323013fbe11 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..ac53ead461fe87e82e995db7dcc4581b08646c1f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/31.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af1f7006cd3f50f0753bd51cb6bfee58d5817134e1fc7ee726e327cbb16b3ac0 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..870d352eab782f7699323aad8054614ab9456f6e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3f3958617f735bd69ffb92cf01becdfe891f2b328848d1584ae204b495a64cd +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..c467245836b1a0d65a7671051675f2b4a324c1b2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2cfd3588959c9e6a9c21ffc294f7aa8466a80311e91b84d6f69eaa057784781 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..e1afd2c5f277bcd4debe2167f7e8c6403ee99ce2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10ee5a3703e6a6ccde03de5ef8f66815abdf380c69fee84c37f52348b8c6022d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..cf386b01010ec76033584f63be19b227724d558c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3623864bda98b4dc093e9110fb427a4a8dfbee2bc49782e4987a8e2443ffb24 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..0c26f38bc1af9d064e5287182ee012057279164b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f596be52492228dc6fbb9323cad1fd4e4a0af6c94f3af9ad582ca8b38c98a45e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..fbe713244782cf1629c70ea06703120345e33d72 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22ac9f746f6eabc0a7b791a7d8e74ea7cf65f27c1ad68ec0ca5eeae402c02a2b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..0a363d2dc36cc854173e90a458c74a4537f6e2fd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f22dc97373b841ff996192b513ec19b6824f5699d0a3d8edcbc5abdc78659cbf +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..2e681b54410892ebd065329765d5164e71f812b7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/4.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c2fc70a065578e6a5e85ae31ba5101c2112b90064c23005e6e123c32d7a076 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..7d2eb37d9907be358e7a17c354d8d40d503867a6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f7684a6979070464caee95e48e45008852a5e1532c8dbb91f5d22f93c43af73 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..29e2e97af7d111f1ccf227ce56910adc19d77f46 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3846e2b0b8591ee06755f634d27dcfbebc2c126fc44b20ca65b7689bf3a4f9d0 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b4465678533aed98e5788b4d6f52231e163e5c8c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b49cb1fecdba59e4060e9d1f080d27e44e4129d38a0c26d59127be6734db4bf +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..0fc0edb30003d4180a5d435fabe9d8b2a5b1c9f8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbafa46886f1d52df2324266d9ac378171bff2ef998b2d39c1a0ed37d2b69bc9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..c558663aa737eabcbb05cd75682da8e95a59590d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38a47c2eafcc2607fdfc441d9855c95e58beba175a1cb4e10d92b3e0937028fb +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..6cb6299eeed1509516778b9f679aa2584af2e58b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:237e4faa11d6530a15fde024279cb88603cbc09fbef9372761c906ff23158c50 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..393b6894519a1958a28ce4b5370e46a2a93ae1e5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c6cbd34173360b76723050cf6d4f21cbff5429b1cfe56f78960b80b3a58d5ae +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..1857baf4d759604323f25be47e8bda5fb0ce7f98 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/5.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea7f5aa0682bcbeb99f09fae45e06faf2cb92fb1b7b9873d85b17286f837e220 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f89533ae0f8674d289824266c0c59bde34efae56 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e0308211bd832352e2ace151786f40fae7be50611e9caacdd13741e84518cc2 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1c61b042995ff5df32bd926e2d293f1793ede4f7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1ba4b631ae59e551d2aa41b9f68a964a285c2cc700be36a060c5e97d4a51562 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b141cc93aa3810601456a4ef5fd99104885a8f0e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c155c4054d648e7e24e112768eb3fc171b44b79db584cb2735b87e14b1b23a0e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..e0cec2cd594c056ae6499dd332ec09e73ac3634c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c93fca3a8b97fb851cf8545baf57c6e5871163425d4cf475d70ab25d04f4acd +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..f4019d8d270c0e351751b3dc9e3f1a38d79d2ea8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f0b01b8b79fe02ad7fddf149541f0369ab32c77c94ed3252eafea78c8956c9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..f5a0012edba88e981d19379a93f233ad313c54b0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a308a370ff8316427d6e6c49b34b8bb948aba2b39a6923e7ae37e6df55ef4a62 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..fc6be73b6e963c9385854e3a3bd6ad9424dc6735 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b068ff34acbb8d8884065a192bf49c6af27e4d68ba0adec415a111d160ec8b98 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..7fadd1fbe673046576397d3c95051ff8fb294171 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/6.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecec6f3f24a908fea53cd153db91280238524f447bc46a9b2c9316d007b51295 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ecc7918b69c8044f92cafcd421efb7b2bd3518dc --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd51373b8b12d923cb39ef0ba01d825a6e61676bf6b2b1795a5727da598fe1ed +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..a691ed9ec1871ce3cdd54cef0bd1e12dfc77adf2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f300e2a7980328823f9d6c02faf7e5bd99d91f0f274009ea4ca324cbaa46d9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8c944c365231533e4134c51452cb8d98a1cc8ec8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf1da4db445f2e9b1b83f81e85800b17eb21fce2fe5d0e82037479447ca98611 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1e2261fadb57929a59b6d4b79391eb969778368f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a61a1ca6736e61ce813f7da1b6e4405df540e2a3a7a73c153ac813796cad422c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..c1f591bb1ad1d8337b805e5abb867978347e9fe1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb135141e19593d863a154345563ab615cffc70b25264e3af9d4ec4f98e5fd2 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..bc02743632e510c5a49f0058ab48680af60a69f3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67c744e83bdb956a8ef5b4157562514559ab2ea64d3342ec8bf79f73790eeb62 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..a0c3fff279fa6159e3bfd1959b64bab538745dc7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3e3262dc69dc07e517404dc26df3c4c985dad8d70874d9fb2882979ef8610a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..ee626097d999d3eca45b651c5ab64480f2b5f922 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/7.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bdd3ba77185fc4799abca1590797be173c572bc18a3ab7447cdf643b04f4650 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..65c257fb42513f88d2815e96f7625425c81b5dec --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5968e8019c9352cbe0cf09e6d44de94047ab74254875802f987585b668424c51 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..6a0734154629824754588f2140c895124b7f7a81 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a07ada75eb61a2293c26ddddce146227f745026d20fb2af45e431dacfee2f3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..efd9c82d6bafe0ca0333493731a882068414ea6d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76868acf2cd428db76f0fbf502917c48d155f5ebc9a9378fa87bbef094bae183 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..cdbc67d50745797fe5b727033b15ac436e84b10b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:293c009bf7218c1a69a3cfa10ffb26ef883212e2b5583d3977e7d5a66da6bfef +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..127c421cd61118335f8b1ccbc40d087f242c8e07 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c45514d1a85c51372c36fc180606ec14a0c304437e4122bfda7d22ea8c251c4f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..55b3606763294f99648dedb3210ae330fed66d83 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5d567153449467644e3ff8654ccc5b04b2f7cfa8904f3e858010bc8251d6307 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..d7d511d7ba78a17e11124e2e1308b70d6610b112 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda81c11740b91296ab348c42cc56c09c378f4f0a309e38a7881f886c27b6e24 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..c399b87a3c711186c1c96f3535b8bb21fd91f1ec --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/8.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa08a06870d7641305e9b8f110cdb866f5cffc624affebd92b460a752bc6c535 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..65e8a68f62ec52be8d842fc7ff90f6febaceccd7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971be0cdcd7581b4778cf03ae368962b54cdba783253b0259c8e28e006762bb3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.1.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ffd6a121f2fbb5a02d9d8e09c53de925a6f2a1fa --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad1742f8f6d68e92b71d7e36c9a21c334bc592c2621d65bdf2850adda4966ebd +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.2.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..bb674be0cea050a6464856a0fc3b21d7eb0c0183 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:386481b25e9891cae9d3954100e3278674ffe727adc115cbd52df52321c71cd8 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.3.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..002edfaa43a5bc734dd06524ce32dd9f53ba04c0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99a1ae6384be4356f1459519a08df313f81086d03e7249977f46e77455fa0791 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.4.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.4.0 new file mode 100644 index 0000000000000000000000000000000000000000..6b364f3c0d3a66c79d4e5e92fbd8f62fd2bba0c1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.4.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e405698fedb3ea60beabd5c9ebf4ae6b8f3345a7ac30f77b64fe2145adbf71b2 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.5.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.5.0 new file mode 100644 index 0000000000000000000000000000000000000000..d291cd07aae8fa06b2454ce0e391d02052fae2db --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.5.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4738bdf3f421a364a5b11fc9bbae6bf3eab8627f782e3beef687ceb8fb0c7902 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.6.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.6.0 new file mode 100644 index 0000000000000000000000000000000000000000..69193c830842ea72e7f8203aa21ed897726304c8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.6.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a08531bd3219fa8a19258f64bc938add2eafb816ce684281e9a9a00f8a3c24 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.7.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.7.0 new file mode 100644 index 0000000000000000000000000000000000000000..4987584da4e1355f3c976b8c921ee6152c3e8ce9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc1.weight/9.7.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08dee8538f64fc235fc67e1473651d6c0633ce298a0249aca3c03a39fa2df02 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_0_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_0_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..af093bc040b9bfdab9ffd67f2c1c213613e5c62d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_0_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfea882a79f2bdc6691f3abffbf42f72ea90a206a873ced4c23ba225be3a52b9 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_10_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_10_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c2ed0e50688a0cbc824eee6ed07b498871987e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_10_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce2fde5075677bd348eda3e8fec4edeb648738c9160fdf341ea4bd3d502a774 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_11_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_11_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4adb79a3b81eafad2ee0f6891a7bfedf0e64cb0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_11_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7570532fbe5a7308c0eab584375a11ea5447c53c0f37baa45d0151dd0eb3f64c +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_12_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_12_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f8d86274644c9610771ede40197ca9b8eac9f58 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_12_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f25e501e97cff7e8de02864772880ba25c1f94f3df6c49aaa0b4dfec3844b1b +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_13_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_13_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f39fac0eeb29a317efec3a08fad2c0ce215c5f4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_13_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1342c024e8d734dba993c1b2703152ac728b93923959bd96668f521c614ff6f0 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_14_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_14_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ca2e850efa96d6c00c6de5ea14f639fbf9f963a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_14_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87ac81f15e7ccca8037453d164f6b0a311df1c456912d5a5845243aa9a83107 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_15_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_15_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..437ea1fcfa2ab73eee7a898eec0997704e1b4304 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_15_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d6c29a320fc3bb7ca2177396a4d262d5bb686d6ee6695e957a5259707e910fc +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_16_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_16_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e61dfaa23975967270aad806dae065cdfaa7788 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_16_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e033d5985303a093052da5d9f4dea431c518af71c277a87f5a23bf3a6be39ad +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_17_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_17_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7bd56ed532e56a11558207a37763dbc872ce002 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_17_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9495d6607a34a2ee495c8ef1a9ef72a0c5276ada44355618992a56a7404df95 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_18_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_18_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bca5e5897d482f1f14aa7573e116d9e1f552e2d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_18_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8598da7e410942c77870b4e5bde6b7a9d28391ac318438c409c9ad8e6dca52da +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_19_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_19_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f13820fcf76e40258a06b4586e83498b826ad95 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_19_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06faf86285c4b17afd70ad266428a87834326e5cf2911a7a7f75acb12222e7bb +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_1_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_1_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..89ebbac9c03995272e3df2fa62675664d6f57716 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_1_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d595d940b7304a5515a42a13db5243328cf166c05d6b389dc38ba296f895b99c +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_20_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_20_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ea979f8b1e9e7529aacc0181479dc16e1e52a9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_20_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eccd309df2ac0d7db90c90896b13b0f798e8efc5614f96659dece819f797382 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_21_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_21_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6fb7faa6a94cfff6ebdf180a413828c987073e7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_21_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d1063001f00061025ff3b86b9b03e2d4b9890486ac0fd4dd52128a0b613c637 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_22_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_22_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c4c370ddc2282ed7983afa95d8df86c57a47bf5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_22_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dfbd9465298388f8614145b4a10caab9c7f8d0d55abe62ea7b8abfc8c47d2e8 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_23_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_23_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec750c20d7ea754b7060591fc68df51db2bb12d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_23_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc13cb8c15337279cabdcfeefa23321afde337b7b1284f19824c43a0863cf76 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_24_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_24_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ebd92dcb0d34b0bd690efd0bdc2da5180f6df6f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_24_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8f7582bb9b53cf1c5fa153cef9175621b3dad029679c33aaf345766500e4d3 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_25_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_25_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e690f65e8714beb7e4217d01a10ba7cb9bd2b82 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_25_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f4e6361c8a0592b80aa747c8a0fc6d1d51fcebc316a89af4a64697edf2c228 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_26_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_26_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..855bcdfd04112b915222fc86f67f147e9ae74c65 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_26_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35fc5ddb8b6a5e8173eff44a1a258649591b98faefeb4ae37df307cfde547a8a +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_27_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_27_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd33c1ed411dcd0ce6f8c814e30f0f76671b0325 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_27_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e7685fc01ba14be5ea09d5faeb559f569b52461fd2c0cad1c16694f2a250b9 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_28_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_28_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac35976cb5928a8da7e4ccdb5356ae7bb705f31a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_28_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95929b1933ba15aeb06cc40866fb9bc4849d315e5167854256cfbb604ef140f7 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_29_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_29_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..18b725d90b3e3fd1650d0b3f1d82e0fa29091f46 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_29_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19cc67352bf8ce0ded1ad8c89a8a7d1893620b64db012b54d1585e9983c90a8c +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_2_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_2_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eedcf274f79f2090967c28473e46e4a930f08b6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_2_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486d703cc7a816327e1b18018996059a23adf9177172614e860956333dd2eef0 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_30_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_30_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..c65f52a055b7e082e0cd65885d5c0deb922e9a06 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_30_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:182b1e32fa0c27a25cd6525d3fb451cacc43f098039497d197b8af232c17956f +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_31_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_31_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..560bcd57ffc8d169bccd69b8e291d213494f7214 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_31_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a0a2cf37407340f38545d83578fb11ba1cc31dd32ba53cb6c2ef01a94e8cc8 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_3_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_3_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..453a09b5b68dbe4520a1a34bc51220e4967b3ad3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_3_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4320cf77a3d24b17bb878df3147154cec3781c7998cba60a0040af04b5fc791 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_4_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_4_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd55ac98a7bc03e00d0e77cfe691a007e0f00feb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_4_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f48b20cd6ce31054bb776dc121e2d8c860805aba3290e19ae82d80372d0d4b4 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_5_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_5_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa4f904fc32ad2778bb130a79be99caf55f0a168 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_5_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c00d72ef6d697433831669aab19149eb06a9acd1b5dde8d9bddbffc239dd1d +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_6_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_6_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..36ce60eae9a820b281c5469e683029860a30d9f4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_6_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e4978cb21be48bbb69d8455cc10f6e5e076dc85878033e24e2a2602a8bd6ad +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_7_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_7_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a75133c7bf3a3a7788686658ab1f091f3dfad7a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_7_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b4ebcae96a9f703a9dbb76d7e0a9a4a8f1842cd879e739b92a40a11242f5f1 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_8_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_8_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa615aa0df41fd59c2241f1ac26cd10c64b24096 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_8_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c1c7068de4f865aa72c7521437552e1bf92c309441fc1ad65d305302200d5e +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_9_32.pt b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_9_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7061341e4ce159a3311f6dee8ebf866a52101ec --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2._extra_state/shard_9_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e95d1a0f3a9880b886738863ad1d3e2200e21959610023c0382eb3f863b29f +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/.zarray b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..eea4a2f72ff26d983024f3ae98e06bf8f24893ac --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/.zarray @@ -0,0 +1,18 @@ +{ + "chunks": [ + 1, + 4096, + 3584 + ], + "compressor": null, + "dtype": "bfloat16", + "fill_value": null, + "filters": null, + "order": "C", + "shape": [ + 32, + 4096, + 14336 + ], + "zarr_format": 2 +} \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..18f1f5d334234a50eaec0dc21c051b718f2fd620 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e55ce0014e5c9c559e8358470990b2b439a0d2ba66afac955a1e3c375595c11 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..737380fd37b58a4a7bcf8362ab89321b52052a9a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eec8dccbf8e3b0902d6d3554ceaddfd8ef1e301bf28626ee464d1f9d4946ef4 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..3f3e92b60ae9ccd5582c395653b45b1a0566b90d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4afb6fb228e4a1b08f65aeb011a2510005b5606505a3e33858624053eb502db4 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..891acd28246836365292664d5049e3170db5d93e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/0.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb85108a0bca6b546252338caf89b8611d28c4def007931ccf83e43b2dbb1b91 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..55411f4154734d9f9a0f4c07bbf25aa2d40a8e45 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef2d6a870105f7b377c387dc0d02f204763abcc30f11247b82f8cc730adb74e6 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..a5fdc8b1fa6c0c44dda5cc4db838c0fab7b160bd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:525581b1bfcb43344cd60319198e01f2de3f1094a3b3e1ff5633a7b5868ff202 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..7e06dbb31168d665271692f48305558390270e66 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77c6033ce684c90248ed7e882baa3f0f525590e2498aa70f20bf4bbaf8b3a9bc +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..4195506440ae03bf5d03ff900c4f495309c7ee45 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/1.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbd753c395af92a48d85028f9c869b8f5b58725804d294952175763bde772028 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d6269261f829425cbb7e5ba250b40e12c2dceb2e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61130b17d49554987eb48ffe2e33b640a3f382d9653430f070d04a855cfe4c27 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..6a0aa518c06af6cdfb4407763823aedd4c79c6c6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:213c8aa9bc86e8e75c1bb06ce0608fc5548a89194b7faebdc1f926b22a94b1dc +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..205a66d2bb85b82ee813f535154aeb64406d59a7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:030bb62fa4d78eb2ec0165ff8fff0b86f602ff43f281023e0b4819ab416d4df1 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..670ed76126fa3c5993a9c72e664fe03192951242 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/10.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0363f3ee540f5ae5cfeeef9eca20d3f7b63dd4ad5bd6dbfe1e11edee8a6a20fc +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..94ecbf754198bb066b52d102392479e512e7f366 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b9f841b28d4d12118a98fcb5eb7f4b871ff710b29bb0e416234700e7d25314 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..3ade4053d2c11986a3e90ab984dd4f815cda0a53 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a89f45192b2ad324362a8af9c0d3f9dcf9d236fe5d84556afca36279073e63c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..4b5d90312b078efe56795b0a0be0bf47323de2a3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33946774625d204bf9e72f24ea8079e37d9b8da3c5dd10d45ec85a231c12825a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..b41c472a15647e613295b7018d21e6b504911af9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/11.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19d317167e500059fa2b50e005dfaec02df806b38d01f80f4e56ed6dcbe104b2 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b2736b8ac9600d31dd1f2f36a4149dd0d247ce5e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c66dcad86011be495d2e68111b44aee7c955d19e62f7268385be083b797bf1d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..fedf19e73b2f24800d32387fb0fce3e517c6aaee --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6943424c3d9d8b7fcdbb5a90ca772e1516d68b61b0da36d2f3edd186ed323911 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..d12171d9abda73fde72e716e5cce9a8d23a1b1cb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517280e257f32873fabd1fd4ac9fb99096e4f983f7f100a63f52c467c574f249 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..0b60c9b2ca97d6713b5257dc3edad1162ad77f6c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/12.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a51e4d23b6a6948f9f711f6857dc4775028a298be6161120bb81c28289e6ba57 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c7081ed8fc04f2b7632348b7a1c5314719619721 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c56e9488d88771f0837686c169eb4cec54ab017548a29af9756bf6acbfb2861 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..7b1e3b3a985dd404ad89aeb9b95acd9f9c03f2ce --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:895f47943f1337b309b4d5a090d815d9a5fbddf51ee23292c4af1de842662544 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..831de9ebeb5337d1f687ad4d6f7327ce82727fb4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5405628c6e04de95a1721f0d03fbf1c8f325e80d7e3b37612f3d3b69a6f04445 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..8de4fdf3bebf3070bf8a8dfe587a9d272da3c257 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/13.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d193487547b0ad38dc19f4eb0c1fa8b6d69fb924b3471941fffd0ff79327ad77 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..624f0f60410eeceda1eafaf7160768796dced61c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68c26bb44ea86cef7f0d4bdb99e26c5abd872baf7dd9561009c54bb9758683d7 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..b53defbdb2d2d9fb35ecdf6cd6ab7a024678af90 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:942ade4300378aa703756080e78c502589d03228cd4f9bf3ae786c032cafa75f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..0c2b49a0100a571cde46e47a091dfe05ec3c5d30 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8d49abcecf6c8444954e16ec9a01ae4a63a3f95bfab9f8ecf022bf29057c887 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..c650f70424c4a81d43ca52afa4ac355666681940 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/14.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:228eb7f54fcaa1410c8d145cbf4593b7cba1f9e71efaa06d40c68949d40c8103 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2dd19fb39821b2e8177ec1f743828634f32ccdec --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1441d0bd301c4d631ddde49febe4d09b8b73f611e8ff7e9f26856878fbb6071b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..6c199cd2d6420691c30c36b73bc097e91c05282e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c7b1cd6fb8bb2d2207e52fbd3636fb203cdbdc9cf9b9e112881df48c35539d1 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..690ba26f380515d8a7e4c9cb3028f263978b1ac7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbf04a079def292aa597d134810bcaf02789d0ef019b8fdeff05cb73fae37389 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..532cb02e3dd3e339e5fca0066647f9b6f9c55785 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/15.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:840fb7680f7e24330af933970a863ca840160bcd88f08889614c847ceeb6cbb2 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..dbd21c9942282275bc8fe7913c96f17d1bc4d7fa --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43e989db86f1996b47b27e45bf915f396e47e1b044cab8fd0d197afbf8cd3b2a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..6947aa11f976a97b9eca2a793b673e145069efc9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ce594e7607f70b8266e8f21022cb67059f4580ddbfd95ded4843310e523d38 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..65e3cc68b39b106d927c0139dba2baf94e0daf15 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5624e6079f4309f3d402511f5dac8aed39ceb03c3f53e1fa10410a1357c9ae3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..818cd3b1561100efee6c98e1053810c6b1b8853a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/16.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb15153ac4ead92a78d09061eb2e853a4f2ce13a2aadb755c720c2ebfd401168 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c05a080da7c864538e782a298934a0685da1faee --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d732536adb7cacdce80550ebaca90ad250a2b575d1c912a9e4be004ec5b0b81d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..b4fba94f9cb45ee91220ef7e8b60ba5e3629cd55 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1bcafb8f65a55bd3e0ceac8e0546e1aada2823b8b4d5ca7384a8680b6cdaa44 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..d064c90ad006081bad09536028f9ec28f2533ac8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:221652b74d425a6c52b53b09bf6fd53e9bcf431e0ffd1a02ae22c131f7834c51 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..41654baef08fef63ccfa06fe45c94aa42acd2a38 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/17.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e10df7ff052dd4b65dff4c851cb2bbfe9c859b221fe94a18ec66e2db68abc5 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fbe500fe2010095eed183e77cfb5cf8d487388e8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56431734112c10bf2b9c39a1eba7c96ddf57f5df4e4089e9207e4e57156c605d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..c337fba21d1e1d86e32568700c07d37ebc8e3fbe --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:272114d8857552135fdef64e17b0923b5a6bfa6ff1c32d9fa43cf38d42885f17 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..3411b778646e3930449bc1dd9df645182d5e4f51 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2214f1c95d902aa5e68b0287d325da395cb0506da480cfae7ba5ec62b7a1261b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..0e3b416de7cad37ff1abda30a4a482b8dba55512 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/18.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1124459972a274939794194f333c66ab4eadb980bc556961ec1129f6a3f08c83 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..09196aa14ec5ded15e8c496928949fec967ea725 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdae88d0582bdc5f9cef370add96a807d3fd0cd24daef486eb9ab09d88a80597 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..10001bda695fdff0172654b4c0378e6c442f8073 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4abc8f6dbde67a4fbdc10769ddc252cfaef45513739a0058ecdcfabfbfe04d5d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..2bec8988b52d492b0759bc0c8366f9e0cb92a031 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a0dcc60ca1955cfb55fd7999914eba676e0b3dc7f931a0819a99ff65b199088 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..b40bb0f8f6dc167f45d552d35a64f21964a45030 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/19.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f734146a13bc9b014886a6ca788a7cc40402430b96dc1f0157038a1a4e9b65 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9dee7897b607968849fe8a50f2c8b86e826e20c0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b163191dced91d29b737e89baea9f7231c759b8d300e623d691656b5559799b6 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..82de1d03c906132003075b99fd992c5615910787 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35da0dd60c6294a4aea2ca2e75958464cde705fc6a0b854a4bfb66c4ad2324fa +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..d664dc303967b9883b0f80a24f344abd139de611 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0533e095ec1ca696c5f6dd0452cfd714e746a298cf81fba5f040ce201806c64e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..30fc941954a7a0c0a3858ab9472022abed64390e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/2.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f895651519ab568f8dcc5a631be7249b046a1c7cee7104675ddc3cb6954d055b +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ed4310d156a93ffe4ce3be21a608d26f8f0c6c28 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc2e4e077e005f8125ae88da48c7c0854b67a590694fee57b21437a31d8a3d3f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..360048e0563df26e9406261a1e541ee3e1e983bd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af59ea1b30d39b3dd5971c1ac92fd90cc1b75808a9d835bb2e2cc99922980545 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..520ba3d7278d1dce8b58621d042328b79ba5ac0a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c399288527a03d5138fbb74a897645c6183c962e9c2803ca8fc4d56587ed42cf +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..6255dcfad7e21eb5e9f08cca20b95e518e6cdf47 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/20.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e59942382b27e28d90b42d081df5ca836a5f8ad0eb64d829c7e223ba5a6fe27 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..36b429a69928fb8fff5853df2bde529d1aa88b0e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3bc29b64f627fe91340e847395f4c53f143f9d741b23b1f866109b72cf2abef +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..aa16b4c30e9967064ec685a72c4e52c8e1c8ff87 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c76de79f645563b246415fcdeb99b4b8747a5a5afd6eefccfcc9de0f1d6056bd +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..2a381eeecb695d4dc0c3f64bf997cb7fa5bcb7ce --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdad750d6895474ca9e06f03d8f7fcc4ea65e87899da7a277ed05370bf574f99 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..24be0601e10a9e21a46ade626bd44ed81d9f4034 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/21.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ff639c9baf6ff13dfb9100867013f01792328dd6a3dd825c8aa50182717d13c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e95b1a20618897b3a7eee1f7c57b5fc1b586ae90 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1913da52138cb404aa611c1ec9532ace5f1e5f8cfa935ce7d1d32de31e4706a9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..dad4671666a756476a4367b7b7a1f81bcbbe9cf4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce1214c3f23b70053ed7e32fabd1548fef8e5caa42394325059e56cd4c3aba22 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..1716a41c1f0991634bd1759d0ef53d613e850f72 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a5d6faa3abb316f4e0f4e1cb7fd78cee6d3a79233eb14973bf517ac67798fda +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..00ff2c13282bbe8e8dffdf21a40e819fc7b9a3ad --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/22.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a726c3e7f20900d06600cfe1bb92f4aae8d55855eb043a3d0e6e82254c240d5 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..df0cd1a8351b558845fa0de1484762edd3fffe2c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21bbac8ffc0af7f73cf5fee280105416590b3bacfc17887155eece4e5a19e110 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..e95c7c4863db2f5f6a06a8aeff8b667bbfc5fc3f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb52ab67a0f388baae51543ca5456e0af6a4177edc86a62e6b0b6080b0512b37 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..181a85cdc11102e882ff0d15be1a09ad90b3f99c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c02422cefa06ad746c8593d5a8cf814e650c66b664beb30fe87555f2e68bab +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..07020ac8b53bc94d47d39cffbeac1c9f177b78df --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/23.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7732fb38e84b6847dfa6910e55c55964f373ecbbc59db0a854137e16ffc1484e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c14e5c8a5e841fe73f66c0571c0371cb924f15c9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73a9252a0815c2127137096b92c46387c4ad744a1cf86e9ddffbce8ec3163b6 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..181a7e72d8349364dc2554571ddac6c680fd1daf --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93fb3f1712c2554b57d3e4bd1cc729841ebd012c7bab1fb5062c8719efb2f7ef +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..60fde95ecfdee4d3b4860321107a4afb92c32758 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7dfd975f84e0d691615b91fa407eab4ee28b68af54e99f19eea77bfa5e6889a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..b44d6c6f283d3568be139481dbf60991c2fefe19 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/24.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d629a4ac81cde40d07761a711846262bebed2a1b4beb83b9bf5efaf715fc8c6a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c79a71a94a18d22a88fcdc1b10f600f4bbeb23ea --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7fc4e1716034305e77912cd8c67477621bf0943d7d440782315555d0620ce7e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..4e4b10ce4a4c860a24f51a58a76171fec0205871 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a10e9aeb9d98fada9be6f8ef1facb5a2b63b32b21c914195ba8f13bcfc0224e2 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..e151c70262b70b9838e0244c86f53c18ea13d980 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49ba7c322000ec6585cbc835882f47266c4d578d18db72fdb0a3f0ea01187b2d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..fbc73360e26ea3e35cf9e1b265db12332b833032 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/25.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e321fbffc1d5f87c8e068b00e88691ec6b070e35b2b8c624ae1e1890daf8344d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..75e8d1e79f28dd16540f865ed0d04e0eddfaaa1c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c14727f15f2b141ff3300fdbfd443eaa26785e04c03e1c6ebf607128155e7e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..fa6e8e2263bf3a10af8354f519f824139d2746e7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a69b35aefabe174edfaa63359b6519937dc02e3273250d3556c51f2b14151437 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..b2941bb038286ffe00609f0cd47cd8383ad0cd83 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8625617a6ec6bbd6573f562c50b5cabe4e376f0973f3ebe85dc6fa0416640bdc +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..e15bbf09742f26875a36a56ad694fc831ab3e74b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/26.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b2200b1bc3ca15e0bb24154b94945bde6f6aad9825ef17d96c9e2e432467291 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..0ab673375910dc99dfff37606793c0a2bed50e21 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d47628871e15a3800295c65d3d563b39ea15000f5eda5c7e2ec485d0c2d00cab +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..054bbc1b1fe7004f5ee364afa5f8a54bdb88d385 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91cdae796764dcb4bafd1adc679ec952855f002ad1a5075534baee74178f4d41 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..dc2b92b0904cf52e03801d960fccd92208ad8ae9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:889574bcddd2fe56546e2daa6060b8b045870056c8065d7fba2abe5f25b57630 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..3315ab333b392de4412e42d4d1ae258d9f320f61 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/27.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b57c855fe4970c81ad875bec53037a4910c1c1d5a0c24cd18c85f76e26f77df +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3f4229cbc22e33a91a5da9660639e48544a9dff0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5320f076b26bd90eced70f54a3f7d1ba7a639f2be60dae92b62e6b50cefc9fc5 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..6f502f92a7e7367da03ca6d8be10f3a509052896 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55450d2d2c381e33f8d97c993c8e8dee19233b6735b973a33f9f199b611156d6 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..b94dda54ca92484224933c7565bab02be4f94ec7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9b093dc9233dbed6797906dafa6cc22880e27c387e0dc9ffd3b06722eb7d69 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..50dea0019b6b4add79850fcc722e9707f82afa07 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/28.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5452e20841a7d3748d446a800ebcda41771aa052dd82af450fef4bc843d647b8 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5c54e61a6b8ee26befa3dbaf5e6ea9bfad8d427b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67dc8dbead851e9ae651cb75f9900e40e5c98ed78dc2084730c4dcd994a19508 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..3b347a776872b833aaa2d96f36f985d22c168849 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30229adf0439b6ba44cfba3152c04246f3d35742f6ebaffcb197a7dfe9bc1350 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..d253bad7d9be2a4e862bfdc7be2f39ebb3104b6c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6826134c785f98453a51b67ce564458069e8ee5ce19e2b7f2a1135e1058a0067 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..57c0911fa63c3bbd17828508d0be3f196a4d352e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/29.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d87959046fd68aff7263b297e982aa688a0a2b251963cdbd78b88d7366e9e5c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8d55c194448de5e2621fad0dbbe739eaf6d1b1cd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409d44c9485a08d6f6617f09a9683d8d4daedcf7831f28f54bbd67c2fba136a9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..466845526f7c62d210a0b2158a307d85ba7aeb66 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21bac4395c7968ef4d3e0e3b6847d8fa58d7c1b5c86019078d20af8266eb630 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..50176fc5ad794ca213d6b3e1803ea3a249c83cb2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2584311f51bfdecb8f03dfaab52dadc5d042e1cdf542535b72d531c69f34f572 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..e29142ef57716d6e1712e71eb5d6ca728556be84 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/3.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:329f9ef1796b93aaba38d7ba627498824866a62d07d33002f174033ce50d8937 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b087d9069bb1e6a38410dcc63835b945d486fac6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3d760ccab499e97f89f3fb900d4c1e487c1d3fcad5ece2f24383098a5fd7d3f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..37055745e2a494616e3cecda6844e963f968acde --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:750598d4fe1187498a41e731c682d9ae641bc5a9fda1c4a952bdce5d1c841424 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..ba22faed3a8f1b363bbb41067a0cf86e55a16d97 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:466f3ea893ee1692c4e36c98f1874e18130c852b640602bbcf50727ab1cbd8f1 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..0388b8d61f6650d7655b31bd1e81dc3c1bcf3175 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/30.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c47767c6d0d200e75ef26c4294edcc63d6ae4c8eea15a17a07901af59af62e9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..5135f568d27671e8c8cbbfe30cef2d721fa56dcc --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:810eb63e26c0a7a8937be1f099ab575ef15b553b20cc139458ca8b1c75de583c +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..1f33b45859eb454c0c2ce26314cad4703888c6f5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec97a3171f60d9cbf662da82672b11897abd9636a313d6a559cbd0b08c4ce433 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..d6a4bbf50824bc4d6b3af8ad15fc95f1696774ec --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6331133ced12328004c2b195a097b8161f5bcf750c3834b3c94baf9cc389393 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..9090926160456ac414e264b062a02b49cb7d7d0c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/31.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1276b89c1b12f533901baf86ebff2aefe76702ac6972c3e0fc6993b97fa19de9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e2205148ab86bf023ca868c6306a92c6b9e83db9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe0763e0806cd1e0f5b9b598d1fea5d7eabb6ec04d62445672081e2906b4c19 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..523d806e679c418bf5fb867e9e6c5bb0c3965d66 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adca548d913efd00697043d7ba2e85d5b9c967515d34eafb2b7c7e36b05b6347 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..8ae4680d24fe5ec4c995f13cb69dcc4b9f7177a4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:298f446473c140fa74563c4b40c29e51190f44ddad6904f8f460f4a2905b6235 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..1678f6ee4b67994aeeb9f3617a0c4a42ac7b6014 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/4.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ae6bbd5d8e4c39fb45d6d980484f20014f48aa0bc55ed3c7d0a08ecd5569b7a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f1d52f3defa346a4e52140f17f1796cf1efaf4e1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:579655d06538a3830fb97f5fe9aa5e5a4b0c7ff7fe272bbeb987a01378f49bff +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..5442d34111dd886f2743676b3fb7b25867a89462 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:267e1e5c0f14afeda78a8ea8f241bb599295daa37740ab5bdf375aa7bf64d5cf +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..d90331a8fca1ee5afb284a7c528f128acda11769 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac49b5af34b761bfcc6c1aac5a7a98d1e8414995fc8777670e7acdafbe7ddf1a +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..67443a59f6d2d2e1813f9698f0174e036ee39f4f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/5.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e20aae4fc0a1a1c1f40d8c7a44057c9c344d85cc0434a2159eda46d2ec2dccc +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ab2c014647eee6d095283f879863b7c5e3289bbb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccee68d65a2885f0790d8429c90afed8623194ba7da5fc9ea067f3292de81490 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..0af74f14e1d548baf38fadef6c22e8b04a7114f0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6095fea0588da5f45be1423992aab759a79353ac741d807220ff8362eaa5ee30 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..6256de0ece7d62840d872d6ec08536c6b6c863a3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05a83e8b498a3153158a17f68531d57d3c974310ee564be29d530344e8e56b66 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..a00a1429f2b3c05b5e6a3bdbd8ecd0f9f9be67b0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/6.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8748c3cc1e5d30055b804c18ab5672f56eef722f1e5abbe6ed03ea3388cc608 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c5f4f7c3e713ecad709e177accddde43ad764efe --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a49065855008b7cb1873e68cffd13cebe52e62f8f542a1c3e9643e4446d10bfd +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..8fc2df66db0fc8fe357167876f31b61c5e1808b1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e649d2a360ba068d9fb0be220ca8943fe6f3ec3d45b471725b8191b8ce21c429 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..f531a8e0bd0f7a43b45468ba41965173e36c68c6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a0f3ae187b18404f68bf237d9c437475e97b6f4f7a1f9f9bc8547ca05bedf9 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..c03a6ff08775e1c4e63a1067a8ad88305d87edd2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/7.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d711958d49c6f29042476ead347be914d88b4d31fc523da054def4ae8c7ca39 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..36f4d759870f3cfb68eb49f4b0330527a1354efe --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff49c7ad7b6f1d9a2eddb890c2225ae814f70f208fea5b777a19e2739b4f9c3 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..2e47f9c413af93433960a896a86e42921b16dacd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe9024f4b8ab01ef1ab26c74349e3b6d94ca47056963c1e0403746fabbc0092d +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..b3579a131089547953773f4fd19c2c8a07f2847d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:174692a87aec82a84c63cf676ef0e25b389ae96f4e0e8a912f91b172deef075f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..9a0e1c0139c0af51ca433cbd06e0ca4e0037207a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/8.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a483d30bfc066d818bec0f780f15628efa1baa2cad18a8c0b553f343fd5a8a24 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.0 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..1333e5c7015ac7a314f6023ed347d491236aee17 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76b34ef74c4482d076ca0ee334924bd63c63622a09e77d6c23605e1b375c916e +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.1 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..ed236412bf7b0c07735b02bfd45da2716111219c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7326a652ad0582c134df1f0d9969af343197e0856d35fc9932e99d7ae19dafeb +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.2 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..2a953a1d6122f1f6003f02d292a4dcfb321843a3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6056f9a3bdf99ca953dfddbc67a87eb14513a5f8919a49654eb186341a5d7f3f +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.3 b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2cb627376e1992401faf9f6d6d4a5d923832de15 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.mlp.linear_fc2.weight/9.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0db88d1cc3f6c73e8e6f64826224f3d0071e3853a9311c460a684cd69d66532 +size 29360128 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_0_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_0_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..af093bc040b9bfdab9ffd67f2c1c213613e5c62d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_0_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfea882a79f2bdc6691f3abffbf42f72ea90a206a873ced4c23ba225be3a52b9 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_10_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_10_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c2ed0e50688a0cbc824eee6ed07b498871987e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_10_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce2fde5075677bd348eda3e8fec4edeb648738c9160fdf341ea4bd3d502a774 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_11_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_11_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4adb79a3b81eafad2ee0f6891a7bfedf0e64cb0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_11_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7570532fbe5a7308c0eab584375a11ea5447c53c0f37baa45d0151dd0eb3f64c +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_12_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_12_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f8d86274644c9610771ede40197ca9b8eac9f58 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_12_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f25e501e97cff7e8de02864772880ba25c1f94f3df6c49aaa0b4dfec3844b1b +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_13_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_13_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f39fac0eeb29a317efec3a08fad2c0ce215c5f4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_13_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1342c024e8d734dba993c1b2703152ac728b93923959bd96668f521c614ff6f0 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_14_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_14_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ca2e850efa96d6c00c6de5ea14f639fbf9f963a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_14_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87ac81f15e7ccca8037453d164f6b0a311df1c456912d5a5845243aa9a83107 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_15_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_15_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..437ea1fcfa2ab73eee7a898eec0997704e1b4304 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_15_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d6c29a320fc3bb7ca2177396a4d262d5bb686d6ee6695e957a5259707e910fc +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_16_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_16_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e61dfaa23975967270aad806dae065cdfaa7788 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_16_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e033d5985303a093052da5d9f4dea431c518af71c277a87f5a23bf3a6be39ad +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_17_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_17_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7bd56ed532e56a11558207a37763dbc872ce002 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_17_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9495d6607a34a2ee495c8ef1a9ef72a0c5276ada44355618992a56a7404df95 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_18_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_18_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bca5e5897d482f1f14aa7573e116d9e1f552e2d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_18_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8598da7e410942c77870b4e5bde6b7a9d28391ac318438c409c9ad8e6dca52da +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_19_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_19_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f13820fcf76e40258a06b4586e83498b826ad95 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_19_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06faf86285c4b17afd70ad266428a87834326e5cf2911a7a7f75acb12222e7bb +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_1_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_1_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..89ebbac9c03995272e3df2fa62675664d6f57716 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_1_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d595d940b7304a5515a42a13db5243328cf166c05d6b389dc38ba296f895b99c +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_20_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_20_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ea979f8b1e9e7529aacc0181479dc16e1e52a9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_20_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eccd309df2ac0d7db90c90896b13b0f798e8efc5614f96659dece819f797382 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_21_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_21_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6fb7faa6a94cfff6ebdf180a413828c987073e7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_21_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d1063001f00061025ff3b86b9b03e2d4b9890486ac0fd4dd52128a0b613c637 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_22_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_22_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c4c370ddc2282ed7983afa95d8df86c57a47bf5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_22_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dfbd9465298388f8614145b4a10caab9c7f8d0d55abe62ea7b8abfc8c47d2e8 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_23_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_23_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec750c20d7ea754b7060591fc68df51db2bb12d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_23_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc13cb8c15337279cabdcfeefa23321afde337b7b1284f19824c43a0863cf76 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_24_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_24_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ebd92dcb0d34b0bd690efd0bdc2da5180f6df6f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_24_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8f7582bb9b53cf1c5fa153cef9175621b3dad029679c33aaf345766500e4d3 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_25_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_25_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e690f65e8714beb7e4217d01a10ba7cb9bd2b82 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_25_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f4e6361c8a0592b80aa747c8a0fc6d1d51fcebc316a89af4a64697edf2c228 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_26_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_26_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..855bcdfd04112b915222fc86f67f147e9ae74c65 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_26_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35fc5ddb8b6a5e8173eff44a1a258649591b98faefeb4ae37df307cfde547a8a +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_27_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_27_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd33c1ed411dcd0ce6f8c814e30f0f76671b0325 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_27_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e7685fc01ba14be5ea09d5faeb559f569b52461fd2c0cad1c16694f2a250b9 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_28_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_28_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac35976cb5928a8da7e4ccdb5356ae7bb705f31a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_28_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95929b1933ba15aeb06cc40866fb9bc4849d315e5167854256cfbb604ef140f7 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_29_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_29_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..18b725d90b3e3fd1650d0b3f1d82e0fa29091f46 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_29_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19cc67352bf8ce0ded1ad8c89a8a7d1893620b64db012b54d1585e9983c90a8c +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_2_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_2_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eedcf274f79f2090967c28473e46e4a930f08b6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_2_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486d703cc7a816327e1b18018996059a23adf9177172614e860956333dd2eef0 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_30_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_30_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..c65f52a055b7e082e0cd65885d5c0deb922e9a06 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_30_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:182b1e32fa0c27a25cd6525d3fb451cacc43f098039497d197b8af232c17956f +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_31_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_31_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..560bcd57ffc8d169bccd69b8e291d213494f7214 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_31_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a0a2cf37407340f38545d83578fb11ba1cc31dd32ba53cb6c2ef01a94e8cc8 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_3_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_3_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..453a09b5b68dbe4520a1a34bc51220e4967b3ad3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_3_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4320cf77a3d24b17bb878df3147154cec3781c7998cba60a0040af04b5fc791 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_4_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_4_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd55ac98a7bc03e00d0e77cfe691a007e0f00feb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_4_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f48b20cd6ce31054bb776dc121e2d8c860805aba3290e19ae82d80372d0d4b4 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_5_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_5_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa4f904fc32ad2778bb130a79be99caf55f0a168 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_5_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c00d72ef6d697433831669aab19149eb06a9acd1b5dde8d9bddbffc239dd1d +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_6_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_6_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..36ce60eae9a820b281c5469e683029860a30d9f4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_6_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e4978cb21be48bbb69d8455cc10f6e5e076dc85878033e24e2a2602a8bd6ad +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_7_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_7_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a75133c7bf3a3a7788686658ab1f091f3dfad7a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_7_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b4ebcae96a9f703a9dbb76d7e0a9a4a8f1842cd879e739b92a40a11242f5f1 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_8_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_8_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa615aa0df41fd59c2241f1ac26cd10c64b24096 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_8_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c1c7068de4f865aa72c7521437552e1bf92c309441fc1ad65d305302200d5e +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_9_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_9_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7061341e4ce159a3311f6dee8ebf866a52101ec --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj._extra_state/shard_9_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e95d1a0f3a9880b886738863ad1d3e2200e21959610023c0382eb3f863b29f +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/.zarray b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..43a2fbd274c2dc4170b524c89e43af08d45cd00d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/.zarray @@ -0,0 +1,18 @@ +{ + "chunks": [ + 1, + 4096, + 1024 + ], + "compressor": null, + "dtype": "bfloat16", + "fill_value": null, + "filters": null, + "order": "C", + "shape": [ + 32, + 4096, + 4096 + ], + "zarr_format": 2 +} \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3e497d387511176eb8b0f6ea4a3d0905217fc58a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81010899951de8b04ff3fbf6a1b2b9a96eccb6a3ec97bddc0a78f1b5c1c4c2b3 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..dd89955d0320cdb649f33be100fb5e2b99c746a1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c07fb243b9d46852881a943b7e3e4bb853c6ff68a482440066781f394718553 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..4930e2e5f5c3031a21026e44f59d282c1b3d75c3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7a7c8a13acebaf50624964036ba625bc480c475c5835353ea2bd70c11fd9e45 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..236d55065c08be6e271743fefbd19362825d4f34 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/0.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a743747bda5064d8e36da09d99f1c0ca380391339c78c52aa984ae9af9c3df15 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..7dee5241fe607a2b9df659e40c7793e397e70521 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a447aa1fc4a6048ca9510f465379021c35e509f65a74ab28fb66ee4bdd17cb65 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..4e54a6a849e9554e9949bdeeeb642a7193dce50a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de6b036ce5c68798620c3ba77c93a7c2ed4c4062739be1cebd119b0a34db2126 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..23892d8bf586e58e82ae3aed660c8830f716477d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e629aebaed4fcb9bc47b1c138aed252917acfdec3c51ef1efec0b2968b186663 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..04858a5f5ef51dbb7cfaabfe0e45422e0f67bd8b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/1.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dec3b5c9a6984831a89514f270968869adad39f71677ba6a0b3bcffb2821ffa6 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..7123d3a3191ae19bfc5fecb48c5f961caf6034cd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2be6b1195a4bc2f2eebb6e0dd7c431b70ab1bb21b84ec732826f82e0fddd5788 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..d5552d13d7c9bdf025cfc1525d092ae7185f1c79 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e5b963d9dbec5491784f3611bf124287e9576246995026965ecfbf6cce0cc0b +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..859651ed2d0e8501374da9ed277821b6a968949a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67b24cb111b6bfbbe88ee237c5fbb53e1c724b5f3f8be7e0e0fa1e2f80526321 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..7cb39ed8d37f058a7001b6547e3e554643cc03ab --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/10.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7a7a06e21ac29d3aceb80ee72811f8b84b6a6c2699bdac385cf64475ce5dfd6 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..70d505fea84bf59856e66a18beae8ffe36508b24 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a347bce9a8cb998d56ec8c71615537827288c353bd2584df42ade601b5c02a47 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..da30899f5462c4f8e2ddc733925fb228c63b95f8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85b782c3c13d2acae14c9ba86d87cb1fd2514880ebc355a651c4198cff2e7b6f +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..61f6127c42c3fdac26bf39e5f2794c640fbe3d11 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3824739ce0c3fefca28c8654598b58bb426b24e1670c0351757fb0eb680691e1 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..24c08b38d527d71d25d3b8acf11adc2cb572dc8c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/11.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1838fdee8f8a91362576065266541f5ab0e62359faeee04ba81e580a68b9815f +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..483cfd32b68bb7edcfe8cabd013f01c03348dea9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a4a3703edd44ae742fc7b68fcf4742bc3e2285af9546a961af1a54375a5f00d +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..a165121a3464cfc0f5118ea51910d54e13167c99 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27c99b79e00ac8d63b7c0efa42d3fc77c7d9d3ae456cd87449cdb6f4bd67ce8c +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..0a9f97f9bd09288625ba53443e77041330eb0ea1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aefbfa1823682ec398b8dccbc4bdaadcbbdd285bc21c653a6ab1a5aa999e4530 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..c826d8aeeb0aa3f9fab399b2c2faeaaf8692b49c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/12.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:730d61d014338724739823b78eca64a279e9d91cd3328c3278c8b17979fed304 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..99fd0c1e2665d730cbc7d5621401e65f4dc273e6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da3bd85263635ac4bc19c28fd24c2f2dd5e8293f7f0cc9b238c4d696be1f7bc3 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..86d963dd1c5754db53bce871662b4675c0bd81a5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1e3a6087aa05dbb0d95ca0987d392df2551de8aead560f879c1b278874ac9da +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..707e31e2e076a6179899ba5fd08b507c0dcd8aed --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfb3791c1736754d3567a64c83795ff89e381a2b4a1026ba067363046232a13a +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2fd88cc19731e89ad7cffeba02e46afa38549c82 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/13.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2860aff367fac31cc7cbfba03ce10cad5f63b65e0c9a46c1e164cbc68cc3c173 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4786119862bc8ecfa44aadf850d4d51ac3b8ad58 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fbdbc56cf21fb4bc7eff55727ac0f111cc266a4a7fc4e171527d15cc803e112 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..fdbc611a5d240707ec283b518ff7f75cc0ada98a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb92bf7d6b221b6f60edf31535eb3dc4df06fc4c493520966a095e9f1cd097a6 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..b1c6c6f2ad9364e669cdd319c88fcc57b13c0258 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffb76cf86247d31b44febad40cd18e16353a4e6d959fbf33b8ad7d16fac97406 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..343b886627b089df37f762e363036438a7f1efa0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/14.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc90ba3cc7d166dcc832c6d9b959f8ca8fa5c8b527a5b6c8d477e023ef58baa +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8d7d11a2fccf11413301cbe1e08e368ef948433b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b73bb802d5679e3217504a86bb6ca26bf53e35ba672fb9b9e3253fbf23349135 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..dcbedaaf9017e7aa94209586a937c0617461152f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b58573135228c21bfa3298e5e69ab7fd7100b52a45b48d797c4312937c82d47d +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..f73582b04a846ad4ecf0fc36424e98365068dbb7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef36904a27186e51c679c4a582fe241e23c08aba3402a586b1e66db486692f25 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..00f7cc46c2346cf33476d43f31f66ecf926d7285 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/15.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c55215556344146b760c50b9b14887c56d37b25636c42988e9e040a20418862 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ac057f84d9ddb99054e2195e2b6aa3ff2320fe31 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c1312a08a4d9785ac85d278cc085af87dccec08dc0727313e04b41daf6e6cef +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..ae5ef4ac9af62f5c7adede156a607fa19b6eefe2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad25df928eefcc9e49a0aac38f19a530df3d73cac1aaa1b83aa9fefd89f7a2e2 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..088d297147f76d84491afc688cfadd87594e3b67 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e60205da09015c3c4e0d3a474a7264b23d746c83aeb6df7135f82fa660b6748 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2e6f59f9796113a46a3fefb78b94369a2afc19e9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/16.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e5433f17825a0861b071a404785f65b36a38c99aca5ecf234cad626798a9b40 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f79f667ae705e78fe24e1a143eef7505092f2ed3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecec5d0c132e5be1727d6390f42fc3a3c17843381f4e7c50056dabe6b89343de +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..1e8d77119d5bdf0fbfa1c0fbee4197066530c4e2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1deefa39bcd8bc929e6ee198ad257d6cd2d69141bd0b33a665ef795c28b1aaee +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..6cd0342699b39d17ad309c4c3a0bad0089d456ea --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d782edbcc6a88aec74fe5a568b35f522cd530738d2bf2b98dcf7a6bd86e294d +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..1f576208fd987cb87fab20d581b7314749279239 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/17.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec49b467539952a7637b18709812f05b9790ed835560f825208e267051e50395 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3c1b0bb33c26444473f215101f05237be0ac8c2a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10c66380eba39e4bb0e907496c275a87684988a064c7675a5783faec4c139b5a +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..cdde591af2d7812991c38e4a9a6e7ba1c393bb46 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd4cfda8ea4ec5eba734d8a7ad93cb6ebf83a1acb39fb7868d570ef6540dd424 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..fc1ee38e6f22b7908301bf5fb24450dcabab8dd5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6215b57d824903bad48db8cffc0a3ff7b6fbf8800aba517b69c58f1299386c4 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..c89f0c47e8be9fad23c23c2f17991a8d5ccfd3f6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/18.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:957495937bf3db6ad52e25d933a58303565999fbd91c9d88af6fea775585e2f6 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..69addc8e887876a627122c9238869c67dabed73c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e558472375d232a4972e16a806689f562c180382f11eb732a006e0b96c639ae7 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..b2b29778b9630f7311c6269e242832c7c15c6267 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f7ab94a8ae72506f50c5c412205dbe1068bf40a62f6363d1ad7503503f28de8 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..9e4bf71c6304254aa643d2e8be403030facaef7b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95fdd87c08448a52c25f8980fb1cb5f46207a3db788d18369117e4692f72ea1a +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..09bbf66d5c25c8b15ec95806cadcaca0a20ac110 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/19.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23ad3bd34296af9482a107654bd175317165d66959e7c93763f6dcb6b2ccb9c7 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f87bbe3d480e44369a01e85e242718f4b50ee412 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c6be28ebc83034f1e398aec7221f48a95348dccd7750f74348074bf5a455cbb +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..aacad5164560caa891a02b29901169e2156d5563 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bfb27ba7541f785ba446db852e430f16c29ef5cb74454ca82bd01729c1c4127 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..245381cb15912da4d85e02f04416544ac762c226 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14d85faa204373a782de3af1934f63d9db2f73e99e5d2f51378f1c0783ecafdd +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..838ab8ea8d4a22b6a03e6abcf89e3f3377e5e9c4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/2.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dae579dc0f5f6eb6cc7e4b6518682109d0aca0d7f17f9da8ad3f3710c00a4d20 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c30e3c9d9039f5ca5347c2a6d9f88bbd586ddea8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f736d2b3cfb786ff5274f2fcedeb45e97863c5581579c62940b09e830f13f5 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..5931b47bd86e90f5440746c3a23b040de27d338c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1f91630fbb5b533e45cd5958392c5303fbaab278318e7b13a0c5c47cdac3761 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..fe18741a359c8f7aaa0c6544f17b4cf3af94a57b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d2b8d5fdf1f1cf328d8c25ac0b078042749a60a00ab060e99c9363a33825a0 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..0ff479ca7ed70cb495c6df1f983939b97bfd8215 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/20.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:975ca2741a5e53b1628a135983a466ae2a0cfd00170c86708e7b166488b78bff +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8e60d978cdf0523a01de02d90cd446a32e7e854e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57d91dfc19f4395a5cbf5e03c509d97e90199d9850ca07a6ffbe649ad71d367 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..df5f150bef439617026b86ac483f6669904f16fe --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d484975e51ada107da356b6436f07e18bd5b712f4a6d03011c842d7c05cbb0c +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..758ad3a2602389877d695e5daa28e4b006626b8c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f3e1cf126aa72233539f31d7c4d2bfe4c8147ef763a2d8bc9ccba50dc40c97 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..61a5a5e270eac24a57af818b921d52718ac70eca --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/21.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bcb015147182df83d79206908fca4ec36b64ee1c3e07f273e5699f1447d287a +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..0a19d18ff41fc1b4830614d94bfec93979c7a57e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfe887af256050c037f08cf14e4081f075f7f709ef2948057e6e8e585cac4272 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..b5738154ced09ac73f3f1a98cbdba5f4a42749ef --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:316496fd6142272bdb43fb91bb9afb62594dffde8b00bbce3c31c8f209b88049 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..5263a1b5f17d0966a8fc5e60a820bb6c044e42e6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b3f6dd13e9d22a554a76994b9aa5a0898e7eab755750a15b8e82805618367e +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..4ed91d22a7b302d8a2f5bc8ad17fbfbf74e4083a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/22.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00827078d7335cc71e49b092b89a84d1715b044d0de423ee85f109f3a1e57927 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a7c8bee721d45385373550fc51816dcad54ccfb9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd548675dbb3e6520134819ef50e88974cd0a73fb985737291eecab7353164f0 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..08b88d514c323f192ff3489eff0b3013d8e2c12b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:007a0311f8a5fd8daeea37eea9e9364dea35ff3a0c256f138440bbc73bf49719 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..0ccff7913570f69d030669ddfd4e622f968e1b5d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16541fa0b685e6b5e03ce56cbc7694e1d2b82c3e4ace1ce9afad0b3a3bfc2161 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..14b62d9495f95974318861e8194640cc8dbfe6a0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/23.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:504164544f54833dc523224945a27cd73d3ebccc760e0bcfe4f81ec87182687d +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3b45388cfe8f1a60c463a77b9e65baca9f23d367 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4fe48d75ef57bf8f05e1fa4f366a530837de57eac3e7c6deabc8580ec4e4d65 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..244be875fc0e4603b3c4b372eb56d7b2e4c319b1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce71bfe285dc58d0ec19a8e35402f3bf155fce42d937b51891401170f158122 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..c87f72b0c4edce300bbf9ccb6c25eef67d495100 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd5703081acb73188dffead966bd21b598b085a8d46bfd602b49ad1a88ffe51 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..ef986063c88f533085ee3d1733d7d1d61111d03a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/24.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1829f52a75adc41f998a13ee1b917bfab22089f7b2e1e3447e8e679343fc259 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e2810fe3785bca018555f784f845c58d5d79cb08 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36e2ea9f3a5485cd657a6d9ce55f87852376544df2145064afe256f83f4cb43e +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..ac6ef5e08a974f7fd2f912696172fa266c31637c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cbe0f78e985106a4180757f1be08197dc3536ddc53821269fa71dfdaa541d2a +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..86a03baec51542d7dee76d88cb6d5cf97e408b68 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c58d993cdc27f818837702bfb38e4bd46b554c2c92c2d20364cc1149f593ff +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..17b3b5e3f7314fe425cbcf8f721b9239a0bb7892 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/25.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec2450af9f824790e9e55eb34dff96ebb57cc72ba62499a0f580e654893f8241 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fd83ec238aca87236a2075571cd479444deb3bde --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1adac964c0e7f832a76c110d31572b4e5e233e4e7ee10acf45319827135329c +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..700ab386fcb92f754966538e45deb4ceb35d3265 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f322a1e1c46de13e4e5cc66b1de0d764be9e1b3ff16c5875a64a29992d8f022 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..037b4034876f3c29db9a3819b976778f3d04d33e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7843e588db0b7e61ece6048feaed69492934c4b1cdd28f8baae1336562cbcc3c +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..7d1a948a3ee8e858931ab055fff8ae3f50345223 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/26.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6385f51d475f97d27741022962237d81abbf004a7ad6b26bf5828d8e1754b3c6 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ef70816869678fff447ac0571fb010e60093ccf4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0cfb70252aeb574af3f3c20d1bbf164de549f3aed28a672ac67dbd993914394 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..1a3c2e9c4027fb4bb34775442c9f4926aea3765e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c03ae95b8a61644134784b988aba1e312c193c0d03405153c3d790d92db2f578 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..7b22c68891cec88cce4f0b712effcfd3e1681e05 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8da3c1e4c7936f0af590837a097c59f27983bb007df6ea39478cb2ed5f675bf2 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..f0da3663e694b3f1668a7ee95e74720d041a9650 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/27.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bc29a1686e3d7ee7a1721b7c0583749f5ff299590ccd068ee8541c5170aa420 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..54c97d841a04561d7fc7a4889ede531ae364c1f5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39df256df7fa648e1deb9c6fa682f20f5697ab5ed34246034bdf5ed38d4472fa +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..547d14f8eab86a8a44959622ae347bdaeffbb097 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebfab07cc059e505168abed546abbc14883e8303d2d341fdc77fbf9952180ad4 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..99ee5b608ab3320d163031fea1a86fa9977837e1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f3b719c98d111f71f33069770ebc6f95986d7aa06fb516fd27e052bcaa64fd +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..7f3ea5e7b9418626baa835292031afa5ea9ac261 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/28.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccfec1f6283056f77a1639d847224ac2f21d8a260c78710636036aa97d89a548 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..18dbef34ad4f91246bfae43828546433df51d7b5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:221fe0316bcf89290de452f4eabed5d3a9c48a73a72c354d278d46abf76fa4d6 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..921b5c035b29714d99ba6fe433a78b3acf17764a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f818ec3bbad39e2c743cd77e405a7cc2f4232c891b56b9ac2093213d2b9ae9 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..48768e53863e42d05bce2d31eed9858a8e7842b9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3bdc2a46ff58223e1e71cb9a1e4f82011c9fa21f6fb4b129ed0a7ba90ca4827 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..ad8f5d628d7635297972d84d179522194cd22f44 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/29.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d099c9ead84161e5db3023bd4af2f083fe6427d169caac46fb7400b27f31add +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e069b27a9d6a6de040bcdde791116e68e84a43ba --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc523f16b04f40d0709c5c54e77245004b158a488b55d7720467842e6aa2a573 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..b6dc851cb19166791b29a0176c13a2f2619a3948 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c829f5249c5764fb54da4fa7650ce69d72b57d616eeb232fab0692a4e99a6b9 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..bf64274a43fff53b6132b1d6f0324548d8ed6d61 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb4a94fd5a7cb79e8ddf5704ce194d320abdb706943f11d5bf7ca2011c4eb5b +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..8d30ef6a9fda132a90d9db04bd8cb124726d6cb4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/3.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:618a47621d3e7add4d2d55915be6d61dbd96ee49704ea0f9150e0df43e090b05 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..4190d2e66b2ecba5b8e016cccd3b5d75f03cbbe4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1954db83c2f1f093d6fa2cb8ed32dfaae423d5cfe4cf6e2dc1c8d105103d20da +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..1a6fc4b50438b1484a8cec78acecf7fded52016e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:501974f9324b2b069ad0851e8b92e9d3fa8bf539ef834c5adada2eadcabb32db +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..ee598a32d670cc5af6576c74c2e5930cab0ec1d4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb8a37b4ad4f00dd8b8bec9efba1929aa4acee864d922cf423f6973b83b14413 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..1f9c7e897267062783d8d5b3a9999ff00eba867b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/30.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e3b925ce5e70d18e4d78609bf2a3af2b0111243eb5d7e956292227e1e3a5ab +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c9fef31f874f901ebd2a8fee8b74c3f4b5ff3223 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b6a4abe2279e5358231c46b1e199e869efd0085655837c69aae69f6c93f8143 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..449c7252bb0adf274f37066f06d9a2d03de6cad3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e476b2d6fc1bd61092c9c0acc81b254b49c63ee270f892bfce05513bc8bd2a0b +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..cdc1ec72977808585ef69af1f2067ef50c15149e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63df6091b6d8a72d7995efb128f987b6d9060a04c85874938a135d7355d27b8b +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..7ef5964a6c202309652728130aa51b6f4cb87eda --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/31.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8687a30076cf24bbc62bf762d4a1badb7a45f78643f6f4b312fedb1cf7b509ab +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..38e4b0ce36119856c795e00fd2b0b3b0e7c74491 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c66090ac37e5ea65fc7f26b74f8b2baf2356e7af9c5ad22ffb64503b5be7136 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..c828a089461158747907f842dbbb57223cec770c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3206d01acad06e05e504a91993844cdcfb8102a82e035398df79f15ba55f17a +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..4bdb2f40a114e0fc653d9d2a28de29cefefd8029 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7cf2bc274c462db97ff97738656cb867e322c837831c929fe8adb1c61a2a545 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..bde0841f29b87b39809d393af14ddb02ec45a908 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/4.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d54603038c513b58a6270f623dc5e49974855cf3d275132a112f9cd98337078 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..1bb9ceaa04972abd75116be3efbbca2474c287d1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b1f7073432774fd29dc9dacc1f00f9414cb39497328f219d90f6c5b6fd09370 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..e80e0cc2e2589ae89c2c17fcc282aa8db9287b7b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2028f6abbbae022c7284f9a85d6029dfd4ded86caad62b2be3da45b3f0e18e77 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..516f9771a96b9dbf2cbc324f820698d723407651 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f918575898773fcef949cb4854541d6f09f07e6129bd909b211ed0b1c0166be1 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2d337ea991b3ed8776c2a0a7ef89c16afd0523c6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/5.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f75aa99bd3165cd16afbe3c46bbb8ccd59456ffcb055e26962eb720988881cc4 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..bb9c3e9d58af0f039f3988f84aa9bb5971657391 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:276e4dc21ef230884f1a76e93f2344a19df3d26882ca124ae2545e1b0676a3e3 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..b81984e6f1bf7641839a2e0c44aef12dac8b030e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92fbcbd6081e64dd2b7c613fc486003b8c7ec9ff25015bca2fb8ce4f8de809aa +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..99fef197d6a65fafb3247bf314e84c9df3ccfd38 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d20875e825e686e20d3243f09807b113e4c08c3ea42f51bd9ef7d71facb0523 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..2f365c5fafe8fa3700e0dd68b6f2bc66920b0c7c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/6.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6a3684abdafa0b7fd255fac8e0e48c686fa72b486257b4f77c53b3d1b1b7ef6 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9ae232ec49ab5821e83ebe84eac7e1e8c76126b3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:682bb76f70a0b55114adb6f2a638c6534c74f41a1a0019ea3e3af809b8183cb5 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..bd849abfe87220457832ed32f7597b1eb6c05b2b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a2fcf69a1966e3791cba9cc81c2d04742f1f7b928599cc35090c778037a4aaa +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..5c3d6440efafa66399c584919182f86febbd5ed4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d2ee418ed6be5258e2dca217ae2628be7a42fd5aaadd0ac6a394e77c86b6b0 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..3f83842823527d0ffdc88d9580d68cbbafa68d38 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/7.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b71281b26baf04465398670b208ca3b7080367cdf13d5bd0121795f685d0750 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..55f7e5411a87775f94dbfa024c4dd5e9fc9c4a4a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b45d782bfdbaf94d34fa129d62ddeb4b6f593bc09b10a0d828cae9fb486d2a +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..65ae13aa72ed435260c06428138b5747a4a94d24 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7ea28a634507253cdcb3c0da13e60d8d7234e22cc3a470e9e5d789ec9bf968 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..1459e5716597ee50a73d4a2241e635470622b795 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8855581956afb0a1b67ec5cef11d45202d1d4e8d6bf5f1f5ba2d932e888d544 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..fa9efc269c3f4d77331de59561c4b7db61bb2c25 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/8.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:036f9be1bbaac014bd18479f996dc6794ebafb0277f84bf17931716151d33bd9 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b66a14d409de3c854ebf850bf6874142d2ad2891 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf3b48172e47b98f033c9aa65d7f4355473579fe116e85348ff2d4d78a3e1bab +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.1 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.1 new file mode 100644 index 0000000000000000000000000000000000000000..617e316c9abb022f4cce354265b1227f6b95c4b6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84581959f41d285e7af0b90f9f486142a93db6d20e91d8e52e6a35fde0bcb65c +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.2 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.2 new file mode 100644 index 0000000000000000000000000000000000000000..c48b61b54816a2b17dc89da28d8b028b57a211ff --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cff699d6f83785700fab8414a2b8c88b4b7cc1df9e52408d9a9899cba361bf9f +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.3 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.3 new file mode 100644 index 0000000000000000000000000000000000000000..90144df16d256f95e5526b3adcca354b6d835d9f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_proj.weight/9.0.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7da4348808e6d35484618796b3574da70c0bb1b5e1ed598829a10a28b52222a6 +size 8388608 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_0_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_0_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..af093bc040b9bfdab9ffd67f2c1c213613e5c62d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_0_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfea882a79f2bdc6691f3abffbf42f72ea90a206a873ced4c23ba225be3a52b9 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_10_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_10_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c2ed0e50688a0cbc824eee6ed07b498871987e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_10_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce2fde5075677bd348eda3e8fec4edeb648738c9160fdf341ea4bd3d502a774 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_11_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_11_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4adb79a3b81eafad2ee0f6891a7bfedf0e64cb0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_11_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7570532fbe5a7308c0eab584375a11ea5447c53c0f37baa45d0151dd0eb3f64c +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_12_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_12_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f8d86274644c9610771ede40197ca9b8eac9f58 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_12_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f25e501e97cff7e8de02864772880ba25c1f94f3df6c49aaa0b4dfec3844b1b +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_13_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_13_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f39fac0eeb29a317efec3a08fad2c0ce215c5f4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_13_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1342c024e8d734dba993c1b2703152ac728b93923959bd96668f521c614ff6f0 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_14_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_14_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ca2e850efa96d6c00c6de5ea14f639fbf9f963a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_14_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87ac81f15e7ccca8037453d164f6b0a311df1c456912d5a5845243aa9a83107 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_15_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_15_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..437ea1fcfa2ab73eee7a898eec0997704e1b4304 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_15_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d6c29a320fc3bb7ca2177396a4d262d5bb686d6ee6695e957a5259707e910fc +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_16_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_16_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e61dfaa23975967270aad806dae065cdfaa7788 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_16_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e033d5985303a093052da5d9f4dea431c518af71c277a87f5a23bf3a6be39ad +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_17_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_17_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7bd56ed532e56a11558207a37763dbc872ce002 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_17_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9495d6607a34a2ee495c8ef1a9ef72a0c5276ada44355618992a56a7404df95 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_18_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_18_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bca5e5897d482f1f14aa7573e116d9e1f552e2d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_18_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8598da7e410942c77870b4e5bde6b7a9d28391ac318438c409c9ad8e6dca52da +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_19_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_19_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f13820fcf76e40258a06b4586e83498b826ad95 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_19_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06faf86285c4b17afd70ad266428a87834326e5cf2911a7a7f75acb12222e7bb +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_1_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_1_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..89ebbac9c03995272e3df2fa62675664d6f57716 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_1_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d595d940b7304a5515a42a13db5243328cf166c05d6b389dc38ba296f895b99c +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_20_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_20_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ea979f8b1e9e7529aacc0181479dc16e1e52a9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_20_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eccd309df2ac0d7db90c90896b13b0f798e8efc5614f96659dece819f797382 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_21_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_21_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6fb7faa6a94cfff6ebdf180a413828c987073e7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_21_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d1063001f00061025ff3b86b9b03e2d4b9890486ac0fd4dd52128a0b613c637 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_22_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_22_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c4c370ddc2282ed7983afa95d8df86c57a47bf5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_22_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dfbd9465298388f8614145b4a10caab9c7f8d0d55abe62ea7b8abfc8c47d2e8 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_23_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_23_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec750c20d7ea754b7060591fc68df51db2bb12d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_23_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc13cb8c15337279cabdcfeefa23321afde337b7b1284f19824c43a0863cf76 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_24_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_24_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ebd92dcb0d34b0bd690efd0bdc2da5180f6df6f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_24_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8f7582bb9b53cf1c5fa153cef9175621b3dad029679c33aaf345766500e4d3 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_25_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_25_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e690f65e8714beb7e4217d01a10ba7cb9bd2b82 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_25_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f4e6361c8a0592b80aa747c8a0fc6d1d51fcebc316a89af4a64697edf2c228 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_26_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_26_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..855bcdfd04112b915222fc86f67f147e9ae74c65 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_26_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35fc5ddb8b6a5e8173eff44a1a258649591b98faefeb4ae37df307cfde547a8a +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_27_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_27_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd33c1ed411dcd0ce6f8c814e30f0f76671b0325 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_27_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e7685fc01ba14be5ea09d5faeb559f569b52461fd2c0cad1c16694f2a250b9 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_28_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_28_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac35976cb5928a8da7e4ccdb5356ae7bb705f31a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_28_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95929b1933ba15aeb06cc40866fb9bc4849d315e5167854256cfbb604ef140f7 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_29_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_29_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..18b725d90b3e3fd1650d0b3f1d82e0fa29091f46 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_29_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19cc67352bf8ce0ded1ad8c89a8a7d1893620b64db012b54d1585e9983c90a8c +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_2_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_2_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eedcf274f79f2090967c28473e46e4a930f08b6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_2_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486d703cc7a816327e1b18018996059a23adf9177172614e860956333dd2eef0 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_30_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_30_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..c65f52a055b7e082e0cd65885d5c0deb922e9a06 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_30_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:182b1e32fa0c27a25cd6525d3fb451cacc43f098039497d197b8af232c17956f +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_31_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_31_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..560bcd57ffc8d169bccd69b8e291d213494f7214 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_31_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a0a2cf37407340f38545d83578fb11ba1cc31dd32ba53cb6c2ef01a94e8cc8 +size 1840 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_3_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_3_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..453a09b5b68dbe4520a1a34bc51220e4967b3ad3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_3_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4320cf77a3d24b17bb878df3147154cec3781c7998cba60a0040af04b5fc791 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_4_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_4_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd55ac98a7bc03e00d0e77cfe691a007e0f00feb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_4_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f48b20cd6ce31054bb776dc121e2d8c860805aba3290e19ae82d80372d0d4b4 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_5_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_5_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa4f904fc32ad2778bb130a79be99caf55f0a168 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_5_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c00d72ef6d697433831669aab19149eb06a9acd1b5dde8d9bddbffc239dd1d +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_6_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_6_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..36ce60eae9a820b281c5469e683029860a30d9f4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_6_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e4978cb21be48bbb69d8455cc10f6e5e076dc85878033e24e2a2602a8bd6ad +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_7_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_7_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a75133c7bf3a3a7788686658ab1f091f3dfad7a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_7_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b4ebcae96a9f703a9dbb76d7e0a9a4a8f1842cd879e739b92a40a11242f5f1 +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_8_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_8_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa615aa0df41fd59c2241f1ac26cd10c64b24096 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_8_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c1c7068de4f865aa72c7521437552e1bf92c309441fc1ad65d305302200d5e +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_9_32.pt b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_9_32.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7061341e4ce159a3311f6dee8ebf866a52101ec --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv._extra_state/shard_9_32.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e95d1a0f3a9880b886738863ad1d3e2200e21959610023c0382eb3f863b29f +size 1836 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/.zarray b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..9e424fcff6340323a44182d5f408a4370e2438c3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/.zarray @@ -0,0 +1,16 @@ +{ + "chunks": [ + 1, + 4096 + ], + "compressor": null, + "dtype": "bfloat16", + "fill_value": null, + "filters": null, + "order": "C", + "shape": [ + 32, + 4096 + ], + "zarr_format": 2 +} \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..fadc19b73cf31d0ad537d57454889ef5ba4c36d4 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/0.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f0f84d8070a55f07db10b0260a7bc59211ddb6dc Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/1.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/10.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/10.0 new file mode 100644 index 0000000000000000000000000000000000000000..2cb782c6792c236531d3c6dbbb6ca972628bb4fc Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/10.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/11.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/11.0 new file mode 100644 index 0000000000000000000000000000000000000000..c4f472be5773744e88c62c6158ad39d8fb93ce8a Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/11.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/12.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/12.0 new file mode 100644 index 0000000000000000000000000000000000000000..20bd5c3598eb6706e2788e69c44940d0917351cf Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/12.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/13.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/13.0 new file mode 100644 index 0000000000000000000000000000000000000000..36cfaad509e806fd3d313f4f8108e782bb9eb78d Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/13.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/14.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/14.0 new file mode 100644 index 0000000000000000000000000000000000000000..0306457277c245c4e0c7d7deac7f263b891f7b83 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/14.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/15.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/15.0 new file mode 100644 index 0000000000000000000000000000000000000000..27c2208883c694699ab384cb27b76c62d97da132 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/15.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/16.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/16.0 new file mode 100644 index 0000000000000000000000000000000000000000..e614a00b67b2658fcf4c070fd65b7ddb1f1a8c29 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/16.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/17.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/17.0 new file mode 100644 index 0000000000000000000000000000000000000000..65624e8fc47d83e8deb9b76917d5cd47c9001cff Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/17.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/18.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/18.0 new file mode 100644 index 0000000000000000000000000000000000000000..ed5e0ac0b70ac8ca7fb521bee8bc4d277428b0b7 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/18.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/19.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/19.0 new file mode 100644 index 0000000000000000000000000000000000000000..4d20cc8a5925a19fff28ce7ff44ef48e7738919e Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/19.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..f80ebcda8d6358d23dbbe7c6599ee9fce521b3d4 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/2.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/20.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/20.0 new file mode 100644 index 0000000000000000000000000000000000000000..f3955006abafb1c92225f14e70551f3d9371956f Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/20.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/21.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/21.0 new file mode 100644 index 0000000000000000000000000000000000000000..f51eaa65e82e88717f53c220b5a2a31fa13e99e0 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/21.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/22.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/22.0 new file mode 100644 index 0000000000000000000000000000000000000000..6f689dc4452dc3e2ce445b51eb0ee0aa9464a98b Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/22.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/23.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/23.0 new file mode 100644 index 0000000000000000000000000000000000000000..6a2460a408e470be29cd278e4dbb7d4c69fbdbdf Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/23.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/24.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/24.0 new file mode 100644 index 0000000000000000000000000000000000000000..2c986d821c0650a68e2bd9e73b62a8d1d0af4dd0 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/24.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/25.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/25.0 new file mode 100644 index 0000000000000000000000000000000000000000..aa09d144fe86b14a1ad1afb0ad8f2949b3d4a621 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/25.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/26.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/26.0 new file mode 100644 index 0000000000000000000000000000000000000000..4284ea674e5ad6a49a3ddd383afaeebc53da0ece Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/26.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/27.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/27.0 new file mode 100644 index 0000000000000000000000000000000000000000..863e637f1a7d47404c992fe21ccacdd8bd71168c Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/27.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/28.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/28.0 new file mode 100644 index 0000000000000000000000000000000000000000..9ffcb1cdce0b20c232f70fe7c3afa6b6d030ebe4 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/28.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/29.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/29.0 new file mode 100644 index 0000000000000000000000000000000000000000..3b246460907e5676be53671834e26c4086d58c6d Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/29.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..73b50f6e7183d591d8c970f0c26737dd3c5bcff5 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/3.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/30.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/30.0 new file mode 100644 index 0000000000000000000000000000000000000000..6c60e3af3c26063cca493d18021f590fce572d64 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/30.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/31.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/31.0 new file mode 100644 index 0000000000000000000000000000000000000000..6afca1a0d12fd24f4830443097dff8f7280c21f1 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/31.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/4.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/4.0 new file mode 100644 index 0000000000000000000000000000000000000000..8184a3b5f65c7090c74695ae61c058034456f8cb Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/4.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/5.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/5.0 new file mode 100644 index 0000000000000000000000000000000000000000..d6afb32866c8d83ab619c67d7ebb90b7f821b308 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/5.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/6.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/6.0 new file mode 100644 index 0000000000000000000000000000000000000000..e8777516fa81e2813d082199b542de3a7cfac19b Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/6.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/7.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/7.0 new file mode 100644 index 0000000000000000000000000000000000000000..83a6ce65bc7eaeb01b05025efab9e47042d21908 Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/7.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/8.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/8.0 new file mode 100644 index 0000000000000000000000000000000000000000..5ea4b6572d1b7fb58a384e2b37db9ef782a8038e Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/8.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/9.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/9.0 new file mode 100644 index 0000000000000000000000000000000000000000..b8f49b0bd6559332321f6501946e56061e4595eb Binary files /dev/null and b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.layer_norm_weight/9.0 differ diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/.zarray b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..4555a9826f0b44a0bf4dec462b3003565459e589 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/.zarray @@ -0,0 +1,18 @@ +{ + "chunks": [ + 1, + 1536, + 4096 + ], + "compressor": null, + "dtype": "bfloat16", + "fill_value": null, + "filters": null, + "order": "C", + "shape": [ + 32, + 6144, + 4096 + ], + "zarr_format": 2 +} \ No newline at end of file diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..53e48fae3a78619c8adf00b8b4229409653eebe9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0403679a205f94b5c330b5870d713d74cb9e22d137f21b0433879f3ff1beab9 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..7fab562876d25e783ef7322bce10a790b7304abc --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24b639ff47e95fe57cde8a29057f926a1a165417af6dacff3937847426c97182 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..4c79cff9664b078ab3a999a5916f5376477fa706 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd7aebcffb96c15f14afb53accb55d1c6359d8b1b853fc3617ead65bc5f1e5d8 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..53a581c24eda3b63470f1479989d57ab2dc5a7c9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/0.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae65f73e624daab1ff9908dba31657928400d6fbeedd296da1e933e7f95562da +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..7949ed263bb37f972ac5deccb109c0af50980d0a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e3a12f7a325423c9874d22b0fe3e9b92d8cb63fdb51ea9cbbd41ff86ceeb99f +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..424a915def6c868daa1c9b51657c42c17fcf503e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d88b1653169ee74408892186bd0fdec42d8445a7bf3b54bc72b5c832be4b65a0 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..4f67371e6ade295186c5a6203d078de7a2e02b0b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82be6a6753b3d19aa606c3042cf0542798a58c7d2ec86b0e9d5eb2dd1f2f9ec5 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..e144f208f5c2ac826be7ef9dba47eca88413a080 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/1.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5b94f224d2095c2413a8951409c290e1210e5919ee4b5d168d303cd3314ead2 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..baeec481204f1447a0b4ac4aa0512f0c5b16cc40 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0264cb55fa1d652d08eab8d02a5a9b31164985bcc0ba401c710c5fe8edad863c +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f90ff14b3d9810d60aee58b20790cfbeb760a7bb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4526ab13fcbab7fbb62ad74416bf66f006b4890fe6dffab27c44ec8a931a74f4 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ef9877a72f9c17f305bb5d3b498613a19c95068b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e796739c5a23893abf277167fd9b895a29c039a01b84ca7aa64ebc8f1e88f7e9 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..54b048d7d6b47487da1d7474785bd41161af89a6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/10.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c855038447de2c4719b37d4c0186b4852341584bc2d125d12d6d9759d146c1d0 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..61bf5081bb52ff79c6b40a5e33c0418b2165a2c8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7959aba2dbb7b9af254d5c9c80e4fd4b5ee4c935b07a0dddeee8caa53573c4fc +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b4a5130b5c3d652a6c5a21a1c75cacef4013e292 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d847020c95b8bc5d96e9634d4a9bd1d0fc27a2d2a2f221354fc92b407aacf0 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..aefcc17734cc9729a8f28490f8e8de5eb0b32c74 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d50a9e079c5632f70c9dd17d62d4b1f3374ada849e6d1d9c52e5770e44b1c551 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..588da74f8013826f05d5d001ab02087fc856ca53 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/11.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:306aa9d56310676ce19cecb33c9fb858dd47b57e587a8bccb14bc0d4cdee203f +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ec89533dc88ef6c9391cb8c8ea3c535f87a35d50 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7cc52e205291c90078abbbf27e99068eb1ae196def4d4bb55b83a2c92bc47d7 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..2e45c9b6c0ed7398bdef998ba09ac3ad0525599b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ada52edf45143afd90746b9c9e4e114239e9a03b99a1bd191d36315b0d80367 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..051101654a4306d7cb4ce0b8b0eb2b6325b1f2a3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:040f036cacd3addb590db63cb6f57d32f5173f75fb29d9c457f868a7151f44ad +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..f4dd39792ca660bde976cac404fb9897fe88a82c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/12.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7546a742e29e9158e016cdea515d2ba43307287b30f9e44452cefdcd5dcd434 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c31f9e3ea18c584b4044b1961bf034b5dcf5f72b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae87d55f3c315561ce63469269b3aeea6365664235dddb1d05d7e0e3a43b6070 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..478706e6c7f0b1206321a1dab5f7bf838cbf91f1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ec623acac4fcbfa235a4cb54dec0df66c032c368ab60bb833cf34bbabaa976b +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1eecc729a4475ce228c118feafe8f9ad7d6e57c0 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d2fcd269e5f4579b5ce271d37f3e33e1a3028f9cd4a26d6ba4386968eb8e61 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6531a3addf21f023c1a1b4d65b3f4d814149a14a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/13.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32263d79a410e967e0ff0cfadb1ae1e68d634bd2781faa5dcd7ad9ceb2a274c2 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a18591f9fc8e62574e3825a454e06adc4d9c63fa --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a95a4351a56eddb341186cff38b80f06bb79b01584b60bee5b022c1dd2674120 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ba3a65462a09d3ac8f4a8be0f52e442a4f77c77d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1850f73f18e8e85968b20bdb1eeb212c4a6f619e5f564fd9ce99e34a5c65b40 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..a6976ff7ce35152f23b297fa5d8a9cffce9a434a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f9ae0654dad5a6405755e8db5d341177a9f3996ecec66712b4c7d112588f37 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a2ca56da1c3621fd54c97afe89d7e12e8822c8d6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/14.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c848f58592a04d1ac6d48650a53f57e220ed6da56ae42cc4edc3f680e9c14fd5 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a44f45929a115bfa215fccc4cab1a87af5ad3243 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5128983007a5c408fb94324588707db3cf7a83de6d4f965f6b04a6622635ea8 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..0a368a1d6bb5df04834cbf74bd56cc2d2ccaba5f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f06dc0c8957893fd849f356a67c8505b9bab614776f07559e390edfa3ddfd69 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..018e78bffb5c8757c5384550c09161b1252fe088 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb54fab75e683ead5169e448ee663ad4b93d007fe654a8e65e08d094f90baf8e +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..af5ed48809484aeadfe9bebcc93ffbb7055dfba7 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/15.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10c5978f6121fdfc1eb415297b37f91fe6e261eca5c98408d4262074af4840ba +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..3dce6c97b47c75f21106774aec4037cbbbf5940f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29833a5cb9def74f66803aa22e5cf154390b099464dcef220268d0f74b50d17e +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e94321dee6f2d948454ac6ea4939f4d22676af82 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea3933d912caef472466618e98f3af79b64f7ad3089681342cd60dd9fa65152e +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..3e39c542ad0a92e8c8771274df2cbff464077686 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b8d416f39d8055f8fd098ca1dfe6f590f2eb7404bbd409e3f19699ce6942793 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1eede2f4d4df3acdb0eb7fc1c4441ab0dd613c12 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/16.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47eb826248ba35ac13470785ddc6a8e94a2c9f57d378928fe557bf32eea1b9e8 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..0403a4284895b8bf2b0c6e32d3ecbc6a2228266e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:911bfab28b5369fc84178a62855b15989b11718363b6ba73752cfda674a5108f +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..8649beac153dc5e1fe7437a949f31cefe6cd92de --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cffa070a845d4a116abd3f9855b2319ac00b5a70acecdf7d326ed53b28fe62f +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..3e058f95e8860e51cfebaed373beffb7e40ee54a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be8d1c1078c63f71869cf153f463e2c235500a201feef4b968648b70524ab3ff +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..5b5008fe19cf6492919caf8c7e484f15e839bdba --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/17.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f5cbd25b8e5296919d5e586efa8dc5b08f94bb7ce43dc7584d295c0bfcca50 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..bdeaab0c37ed6efe8b438b1e6a0b563f01ee120e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b805626a44b5c67e8df05ca505bc254ca3035ce066c50cd546a680f27c57623 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..6323745144ab09f708b1af2fba768efb1a1b2a0c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c96228795bdb84f2051ea7e526247667b099582cd9bd163d2a8dd3f7edb959b1 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..062c1f0295862b536f4bed7a6a1ed9b4d76aa26a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a5866e7e2822d582eeb2bef387e5feef907e3d558d79982192cc775a5276fdf +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..433ef07699ab2ed56534e6eecd2d4c0cc28acfbc --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/18.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb29f80cc7adccdc501d8e48cbef67d66616528ecc3ab7e23ca9fa50d826bfe4 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..f63c75ace51775bb840ae713baf47c7583bcc9fd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26040972a2919d0025aaf3708bb2ce4c35e4af42412edfa12787e9ae5f75b4c8 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..9fe13143176bf371f06cac74f80eb9d0f5c95914 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec3df232939473fe42d44a1f9816f4eb80d314211bc078ebe23d5563d0cbcee2 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..90fd98d74d1c2fc77e3c7cb08ffb31d29daa6a52 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b5b63ee080aa19f7a993acb17a8baf36a55a2b3b2dc39f9dbb399bac08dfb92 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..fb06f322a470a8a392e0c8a91bdba15b053a6d3c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/19.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa59df2904bbd595a065b9f681b990f7ac021e32ffff046cb1331c2f850c092 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9d64595f10cbf149dc99a5a3b11a551c3c5719ef --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:facce626d18f72ac896b9c87a233e9fd9b0a25a61706eab8a1b16b1483baef95 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..201568496523da44b7335718f67368762c44e391 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7786d703a6a9fd424ed8ce5624594baf8f1e279a152c74bb69c6cc8007a58e5 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a3de6333fea6fb1b15ed511c0fbfd68c98d7672 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9de14e701c95d30cca9a9fd4ac8beba4a69dd1e08ad04852ce28153a101a63a4 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..fc74b61be22844ed029466269582f32b25537e6c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/2.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1507b4dcfbcbc2361a1de2210d1938b31e1bf18b4d07bbe99e0f0f80dafc485b +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d94192bab9347845a0ca2461dad2d8f43a5e1f22 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:313e48fd8beac1171e01e0116c05b7e8cc6d66d7b07d4a8f53d8061466442df7 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..580f26814da410c32be014642269b125cbd6c015 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85730d08acfc25dcdb1d34a604632294e2a30f301a6d2180499fb1b1e19dba3 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..4ba51317b4c98c0b1c0ab5a96a34494a88909e4a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a83e86d1fb86680abdf98f179664869d1501ccd0f22737109efc1807b276e527 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6d938bd1c486ebe3b61940bef4f70b5b78f24572 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/20.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47c97a715b295b1432d2a68aba9e4deff4944789e1478c1e4d6e7b1bc1c201a +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..40b0f67638d325501ffef10002db15feed6276f3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a0cc399eae67ad9429aa35e4eb6c94a4f023aaf2a2672151ea8241ada324e2e +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..ed0f863ff9e6341a8c5cedf05d750fa61cd86184 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:038460bc864e219f54597bd6e5e46a7ec983da8bd7eee7d61b99a463681bce24 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b489bdbecbff0bf0fb8d5e30d7a04d4763f358ec --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf1f9dbe5e8ea86e5f36e1f9f2b6feccf97c9096326306289bcb1ff21f655bea +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..1ae9267bd8e34f375d409166f12a6ec46964a042 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/21.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32571698125e33a1a03554db5284cf10962ae8001954f51e9d42e64dce66cf41 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..c37c863c16748489b3b968d6eae0c0ad81ee387a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3cd7b08fdf83d59fa4dfdbb097053a6db636d24e8bab388efbdef4c667c0aac +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..608b1652ae2938a03ad60116647bb72ec5606013 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90402bea7299c30a9c180fee5328b9ee23368e93e35fe4fa0d37f0b099b5fb49 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..cc7e2f904762c4f572d11864db095c62bfc6005d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b4c26c38dc5cbae23449f25487ef2951e6cca61ccf489856e9321fa3ab1caf9 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..b04d49ef52360d85182584b8317857cbc8095766 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/22.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:198904d2e03bb7e521882209a404f7f6bbf1654f459875ba7bad7a24c5866e00 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..a64feecccd704f7fb6c1ba0cc8d55cfbba4ef244 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df5cec1b82bbec7c5cf577a07aefef98bbbddab880c005287a59aa76074051fe +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..157a63843a4960083283011f1fef076e1396fb78 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fe139f964f3f4d96bc83020581055ae7e0940b8a70e583f03086c24161d0b20 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..6010c995faad9b39ca5c83925e5154ac6ade08e8 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77eec1b3b02627f0b7f66669420e2b9bdbc88f4e11af51821f87f159d7c3ada7 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..09c17264b1c5c1726faa6808891306370ff2c7c1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/23.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f0872da0747bd8131c0034da4928514c30fa1f33ded8b79bba813b42918ad64 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..e0d1a7ee3d8a9e10f4664941c97e903a90d51faa --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:389bf015a3d45293614dee2ba417542ef542374ff844b2321e53cdcc1d99c2a9 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b1a92f26cba8c7bbcf4336dc7d4787ca6671d1ee --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d683f5872d57fcd8d74ae415c5847b12b2c539bd13849b58ca732fe773ad1c8 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..9a11fa84baa1f78edcee9143c030465c520259db --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e75fd09fe91725b334499d9553b1ed9b33e27508bbe5ae928bc059dc1ab08c9 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..3cda95d5c4f1b5ee7068c9c96576d5bd240de9dc --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/24.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:336e8c46e37805116f16e8596334bd01c020f7a28a2039931dd1f68bd6012c92 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..8355d56b45bb2fb271eafde2de1e62bb33be1995 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8e168bc30f3a57d8586f2bc435a6acc90ef9e32608236cbb691233c293deb04 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..59eebf82441d45240925e22719f27d5d142c66fc --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66fa0ace975df095b569b3a90a0379195c13c75a64c79911b978167f113244b5 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..92b9ed9158665abed03e987771910678bb0df0cf --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe04301ed9d5c47ec10841b95e921c5e0c86b646a2acbf035ead5877f258cd50 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..15cb2dcb2d4381b8e35e39564be877832bf39e90 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/25.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:166f7835abcc72792634bc6d67715ddd133567a1d239514c186066a42e23f469 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..26edc7068a1cd16629ee8b2f4cb06ff58a7a69d6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545d2c2a29354577a884889799bb3a04a59e14da7a77d07dfb5525f2b348a7f1 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..58a0b816cb41e1c773a66ae36bf2512aea90d165 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67f1b246b156925ef01612f4c1286f2cb9da626dc81a11b1645cc1d11f7a73d3 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..eec530d40973fb6ea5e6d95cbfbe11e6798a215e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9788bbb904d6f9953a158ff1a1af725809438b7257e57484918039bf8373256f +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..b754d24d4f51f8ac945f9f268e8cfd58d8038169 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/26.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19ad28b74cf0a40446db11158238b7657842b884fe45ac0ee4ef32406f4631cb +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..41305482a1da76f820aeb960161653b9f99f444c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fec881ed3461d8f61504868f71237b4a4bad3175f19d8ea001460abd46d1bc60 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..63fe28dcc1f944c3dea1b83f755982883005b410 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:279139ec4e2d6de06d2b66e32a6d8fd46fddad3a690f5b5e41e816d49c83369d +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..a82f074cd53f24969b8c4f624ec32561d0a3b976 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d06d87b99b3ac042bb6318a71b432d70fc1f42ab6803caf24f072c3bfac1548a +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6c7dbdde093ea494736ae7a33cfb9e7f87213799 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/27.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55b12a62c788b03290e03d80c873ad55c5fdca9f8b7a3811ad945bbd281a4b41 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..b2a6dcc1ef9c25250c7be4ea866382d2fa18e7b5 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f7e41f619aca259f0fc584c085b2396b70be9a2d769a380f1453bd9dbdd7b9a +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..de17ddbd28b1a32f934dd02761529410e7333032 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef3dd424b9898cfc73fb0045a264d831adedbb903d3767f09de338179cb211db +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..b012ac8b00a4f3ae1807edb5de4cc2212277b685 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45094f9b0b752d5188b48ad34c15993da63d47782b542cc3a00de48af14f9a55 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..7e6f09a701daabd2d2579bfe0417caac09d311a2 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/28.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9849b010ec8ff5edde8b70986c8a286e402f6114601d65dbf65cbece92d45ec8 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..ee4ae5c235199814c4b7685846c8c99c5e8c7605 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aee734a0daf383fabd041ad4133e4b32f24c75b334429b0b7e02194d7152e78 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..d544a1a11f29c84c0a014d8f1ae9d7d7b88845cc --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f63fd63cc19f6578fc8a8c90cb3689370ecec0298d642a5e7e2d7736026b48 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..bde3cd3119fa8b25f7a97f31fe4405d80d3c0892 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49a3752e5e274bd22638a203dd5e52a98b22356299e667a466bbd380249590a4 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6b31085042dad92449f2c9af5fa7a13df508a32a --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/29.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2574a419ecf8ed713df9cb98243881e8de2e5ea8229821b66c15bcf8169b011 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9c7b95496fe6c51aa838aae74a38d5b93be5caca --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad6e5646960068712a30cb342afc556fa05db9ff8075d68f15338d4c610d69b8 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e6ef54a0d0facefffd0f6c85f9b45854f4ac4c62 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d5ed950ca0f0ad8bc22ac65906ef8a0ad4fd056849f69c13336fb941a3d4bdf +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..17d76d8d3fd07653fc1f5811ed89689859d2bd07 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97201b7bae48c350e142170e36680668d16c38458bd9e4166524ff6802e7a00b +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..acb92be5eab20f261005f11ba86c78b5413f6f1c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/3.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82cb58891bca761f8d22fbbcf60e656d39e71084f904427be48f9c31310d844c +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..68cd1d27c3fad45c393335ceb1c1f1ace733c2e9 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64cf3492b877b0784f9d9f1afcf27e019f529e2e3f346dcf397955858b993fa1 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..5503fc4b6ef68df15d926bda15a20616513d8965 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dffcd3b538e59e2c4665054929ad2564afdd591c963f639bf0c7f834ea73259b +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..d1b7f231ca1955948507bde9fe296a1a43486f17 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07082104a7ec3b219fce054023072d71b76b7e4b318d6d67e450f6eff4aab412 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..3e78098663bf76e20174f62e098cf3d974992cdb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/30.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca767d99b4223412e1d93dee03e3a6e2b2ce96ec6f16eaf5dad2a9903589f0f9 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..db74251810145efdfbd9b21d630b4d6f5dbc0c6b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9aa221de1370c581a9d86e37598fbca45dbf8520656c73512f2f3862e1e7c70 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..f3020ae5ed2cdaa8f04a79c8c2b648e791e1de03 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1181474300a12a7f62e38fa76def5bf37a905d9b0635d071de90575166f16469 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c203f353b9447b33bff56341eb09c22cbbceed9f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31ba3b9202da0e1511264be209eae00db58d64db8400f61578f55aa5510f4155 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..bf1c572a5357512f129e6f167057333b3fac8529 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/31.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f44f24572d58591f63e2452859eada38f0c214b55cfd12036076c346b33818fa +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..2cd25559a18ba0decbd4dd1b057583d63e32798b --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f8776dd34b56a3ac978a855b9c9342b9776e11b70f13cbddb237bedb83a4c0 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..789816dbf51b48dc9c61033307c564907f5f8f19 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c193d6f2bc1b364a850606cbea0f8a88e6bed7956b12adab4c8fb055c98d9ee +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c2e110a345f5e2f510a9b8a6600904543233c9a1 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90fc280f13e87e3e8afb535be4992a63153587964759150a8a4040daae24e7e0 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..9839c54864d6da2bda98237f83616db96f078558 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/4.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2570bcf11a10fb8ed76fc12c8cdab9551338e93c99bf19522b64fe759dff1e2a +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..dd3109e42d9907eb1b68bc07a86d6ee64e589a8e --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77bc983c86c66d22d4f473c9205808b67e08e9005666c4bacece44200c51e869 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..3b730e03941098e22314780765870dff8ceb14c4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8640f74156f6d0e0ebde2d6712123c6b601a0f5ed98c9df90c75bb7a021f422 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..6eaa9974ffb46838a56f400f2fb57b143b45c4cd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a4cb7aa9dbfbdd5d6ac6fff5985117fe095e1965ad7d2349b7ef576c47bca2f +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..603445d652866c3b3ba1d4d9e1047ec985f44a89 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/5.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:736e8639767fc032c352fc060c0003c83d6ef4fcdeb8ee41b92ab10dcd188565 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..d65bf70e733a16449f7c6c197ad3761a7eaace7d --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f49c48903b78c84b4dd335bc2f21e64f68a795a8d4e0dd3c18ebb595fea44ad +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..b5cf2da2a779d3f06c45012b268fc78bce8d85f3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9490edf8482e6ce7b3faab426a1313d8412e9ada26113335f155fb9e33416d73 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8d621d5077ce8d2e993bb7379def7c3f3be455fd --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b6ccb4b69167b7560a5dbc6efa17b44e11e05ae3b02ebecebcaba04a46e4e4a +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..a9179a35272830e2336ceee587403d9a4cbc1efb --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/6.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23b08f33ac946b09b4372f349ae909bf5f2f176b8cf5c826478c51d8d0268bab +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..efbf394ef32cb739bee5ec6ec0aaa8e77bc64ec3 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb4411662a75632bff3862dff5aa0e3dc07a9f8a21d129327e886c5ea2586575 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..5efce91c8112fd31c6cc9a509a9a07c6104b226c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2930d1247a165aa1072227637fe0d31ab53a34ecc41268641ba5fb20a0fb4683 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..c4d392dff5fdbe1c45f1154e5ee2dd5e0f148c9c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75d3472adb573be7196836b63e17d7e693b1b72b89707b73bee6371cf062421 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..45399e205a26b4475e5e32ed102bbf3cdd94742f --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/7.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d23828adcf6467a3a5981f7afa82d67fa45c7e6af47ab7fad920e24c27f6dae +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..26bbecae97b6c75cb7a0eecfbb2116512d79d782 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aa765687737be4e604f944f4a4eebc5198200ed097d580004b8c956e4c043ab +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..339817f9f7c69c7bed73b052ee2edf8a636fea31 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:477e1ad5785a8c18c6aa8460cfb36b4e0bd5edc1d955c10c395526fcb4928dd0 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..1acd9c3649bafdd025a7b7181701ed29127f8628 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45eaad46a42f74cfe8eca206b536dc974494260c0a164b5ecf57544a5ceaf9f1 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..4482476dacdac2d564cc18a31ffd9d515924949c --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/8.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8becafcdc5b63c8d20454707258f5d629973df29651ee47188eaa9e1ad5110f8 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.0.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.0.0 new file mode 100644 index 0000000000000000000000000000000000000000..9e96497ff87230b1e0bdbabca99e9299700d9b39 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b4cef85f143bc86622c9b23db105380c59a41fb3eae35c29812778841800b73 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.1.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.1.0 new file mode 100644 index 0000000000000000000000000000000000000000..e03374cf4dcc9f611558460ecc7467005ba17d08 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f42134790bbd23643bd8104db9e06412d48ac84200716f49814630e1bb4c282 +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.2.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.2.0 new file mode 100644 index 0000000000000000000000000000000000000000..ffef3fc684a81b8418c749ec4fc614955ad097b6 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1a4fceb141ed99365416911338d5898846316b68ccd76b41c5d144e4790b00b +size 12582912 diff --git a/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.3.0 b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.3.0 new file mode 100644 index 0000000000000000000000000000000000000000..490526caed2a2f9f00cc6310795854ae5ec375d4 --- /dev/null +++ b/nemo_model/model_weights/model.decoder.layers.self_attention.linear_qkv.weight/9.3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3748207381013268c9b9c0d2eb3cd74ce90519b9a28f0c5aa382493615066222 +size 12582912 diff --git a/nemo_model/model_weights/model.embedding.word_embeddings.weight/.zarray b/nemo_model/model_weights/model.embedding.word_embeddings.weight/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..eefcdc18190119aafafcac41296120db1ee09506 --- /dev/null +++ b/nemo_model/model_weights/model.embedding.word_embeddings.weight/.zarray @@ -0,0 +1,16 @@ +{ + "chunks": [ + 32128, + 4096 + ], + "compressor": null, + "dtype": "bfloat16", + "fill_value": null, + "filters": null, + "order": "C", + "shape": [ + 128512, + 4096 + ], + "zarr_format": 2 +} \ No newline at end of file diff --git a/nemo_model/model_weights/model.embedding.word_embeddings.weight/0.0 b/nemo_model/model_weights/model.embedding.word_embeddings.weight/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..da552f450f215f3ca25a191f54e63ea0b78acff5 --- /dev/null +++ b/nemo_model/model_weights/model.embedding.word_embeddings.weight/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aba446389a75e27792c5b092956596c2ea8a2265d742bbc555256b89e971f428 +size 263192576 diff --git a/nemo_model/model_weights/model.embedding.word_embeddings.weight/1.0 b/nemo_model/model_weights/model.embedding.word_embeddings.weight/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..1d679ec117bdc3cbc45ce66af066e2075827777d --- /dev/null +++ b/nemo_model/model_weights/model.embedding.word_embeddings.weight/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a29daad0e1f6f6388ac4ae6810ed949168e5621449a9b9754c979a0135da78 +size 263192576 diff --git a/nemo_model/model_weights/model.embedding.word_embeddings.weight/2.0 b/nemo_model/model_weights/model.embedding.word_embeddings.weight/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..8afc8b848871997e0986a092428857b063c23bec --- /dev/null +++ b/nemo_model/model_weights/model.embedding.word_embeddings.weight/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd093e5beedb85fc693446c2b3692870cdbafde4ac7b99ad7d533234ce5e125d +size 263192576 diff --git a/nemo_model/model_weights/model.embedding.word_embeddings.weight/3.0 b/nemo_model/model_weights/model.embedding.word_embeddings.weight/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..de14c19e96bc837e8800714592189a60890325ff --- /dev/null +++ b/nemo_model/model_weights/model.embedding.word_embeddings.weight/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5b001cc8ac7f3bf0a20a6128192b92c6f1048430be41b3f7822adf35934e8ad +size 263192576 diff --git a/nemo_model/model_weights/model.output_layer.weight/.zarray b/nemo_model/model_weights/model.output_layer.weight/.zarray new file mode 100644 index 0000000000000000000000000000000000000000..eefcdc18190119aafafcac41296120db1ee09506 --- /dev/null +++ b/nemo_model/model_weights/model.output_layer.weight/.zarray @@ -0,0 +1,16 @@ +{ + "chunks": [ + 32128, + 4096 + ], + "compressor": null, + "dtype": "bfloat16", + "fill_value": null, + "filters": null, + "order": "C", + "shape": [ + 128512, + 4096 + ], + "zarr_format": 2 +} \ No newline at end of file diff --git a/nemo_model/model_weights/model.output_layer.weight/0.0 b/nemo_model/model_weights/model.output_layer.weight/0.0 new file mode 100644 index 0000000000000000000000000000000000000000..1e5ebe2da26a9d8962d812347634b4dfaad1f51f --- /dev/null +++ b/nemo_model/model_weights/model.output_layer.weight/0.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6490dfde5d968745b4023e6098e9ba131def36aa065bb17bca3c8a18a87e7541 +size 263192576 diff --git a/nemo_model/model_weights/model.output_layer.weight/1.0 b/nemo_model/model_weights/model.output_layer.weight/1.0 new file mode 100644 index 0000000000000000000000000000000000000000..bb1e4b5adef8cc37250c90116ccdb07aa709511a --- /dev/null +++ b/nemo_model/model_weights/model.output_layer.weight/1.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed07660d481b4eb9da593c91317f415412e9d883d94a446895592534f10e7828 +size 263192576 diff --git a/nemo_model/model_weights/model.output_layer.weight/2.0 b/nemo_model/model_weights/model.output_layer.weight/2.0 new file mode 100644 index 0000000000000000000000000000000000000000..54e2bbcfd87c4fd0d20149d0277eabab4f8c386e --- /dev/null +++ b/nemo_model/model_weights/model.output_layer.weight/2.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df847a3a57ae30c460c71139531d15ff33735102dac9740234ee1c52fbc2d082 +size 263192576 diff --git a/nemo_model/model_weights/model.output_layer.weight/3.0 b/nemo_model/model_weights/model.output_layer.weight/3.0 new file mode 100644 index 0000000000000000000000000000000000000000..6da2945d4b4d6d6a7a2a142ce320b15d09c3a162 --- /dev/null +++ b/nemo_model/model_weights/model.output_layer.weight/3.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a02da3babff570b841e7f48fbf3cc0b4209ef5f38c596e9eb93e8b76b96262e +size 263192576