Upload folder using huggingface_hub

Files changed (5) hide show

config.json ADDED Viewed

+{
+  "model_type": "sam1",
+  "architectures": [
+    "SAM1ForCausalLM"
+  ],
+  "vocab_size": 50261,
+  "max_position_embeddings": 1024,
+  "hidden_size": 768,
+  "num_hidden_layers": 16,
+  "num_attention_heads": 12,
+  "intermediate_size": 5376,
+  "hidden_act": "silu",
+  "rope_theta": 10000,
+  "rms_norm_eps": 1e-05,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "pad_token_id": 50256,
+  "custom_tokens": [
+    "<|im_start|>",
+    "<|im_end|>",
+    "<think>",
+    "<think/>"
+  ]
+}

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a31500d64f87cf2e35d743c96692b98b3ea78d4b5c42679a3bca4b8245787f67
+size 1252639768

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

+{
+  "tokenizer_class": "GPT2Tokenizer",
+  "model_max_length": 1024,
+  "pad_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "bos_token": "<|endoftext|>",
+  "unk_token": "<|endoftext|>",
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>",
+    "<think>",
+    "<think/>"
+  ]
+}

training_history.csv ADDED Viewed

+accuracy,loss,val_accuracy,val_loss
+0.8683860898017883,0.8338250517845154,0.9013352394104004,0.4916256070137024
+0.9069636464118958,0.4496036469936371,0.9123231768608093,0.4182259440422058
+0.9167993068695068,0.3842655122280121,0.9181107878684998,0.3843038082122803
+0.9244006872177124,0.33804553747177124,0.9216646552085876,0.365914523601532
+0.9301119446754456,0.30558690428733826,0.9232332110404968,0.3598633408546448