Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- {
- "base_model_name": "MaziyarPanahi_NeuralHermes-2.5-Mistral-7B-Mistral-7B-Instruct-v0.2-slerp",
- "base_model_class": "MistralForCausalLM",
- "base_loaded_in_4bit": true,
- "base_loaded_in_8bit": false,
- "projections": "gate, down, up, q, k, v, o",
- "loss": 0.1514,
- "grad_norm": 2.5066869258880615,
- "learning_rate": 0.0,
- "epoch": 1.0,
- "current_steps": 251,
- "current_steps_adjusted": 251,
- "epoch_adjusted": 1.0,
- "train_runtime": 1726.5746,
- "train_samples_per_second": 1.166,
- "train_steps_per_second": 0.146,
- "total_flos": 4.814574168362189e+16,
- "train_loss": 0.33752105723593445,
- "eval_loss": 0.10965719074010849,
- "eval_runtime": 67.4495,
- "eval_samples_per_second": 7.457,
- "eval_steps_per_second": 0.934
- }
Advertisement
Add Comment
Please, Sign In to add comment