diff --git a/.gitattributes b/.gitattributes index a6344aa..6c6b3b8 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +model.safetensors filter=lfs diff=lfs merge=lfs -text diff --git a/config.json b/config.json index 1de5c7a..7fb5cc8 100644 --- a/config.json +++ b/config.json @@ -17,10 +17,10 @@ "num_key_value_heads": 2, "rms_norm_eps": 1e-06, "rope_theta": 1000000.0, - "sliding_window": 131072, + "sliding_window": 32768, "tie_word_embeddings": true, "torch_dtype": "bfloat16", - "transformers_version": "4.44.0", + "transformers_version": "4.43.1", "use_cache": true, "use_sliding_window": false, "vocab_size": 151936 diff --git a/generation_config.json b/generation_config.json index c5c3810..dfc1107 100644 --- a/generation_config.json +++ b/generation_config.json @@ -11,4 +11,4 @@ "top_p": 0.8, "top_k": 20, "transformers_version": "4.37.0" -} \ No newline at end of file +} diff --git a/model.safetensors b/model.safetensors index f374d9a..8c1667f 100644 --- a/model.safetensors +++ b/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c1b9b30e907950516ba3c646bdf570d8084c25a6410a0cdca80cf04b11bc13a8 +oid sha256:c37182df9abfc69755c8e6e17c37357cc4919d5f636795dbcf428e4945ac81f3 size 3087467144