Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- llm_load_print_meta: n_merges = 151387
- llm_load_print_meta: vocab_only = 0
- llm_load_print_meta: n_ctx_train = 131072
- llm_load_print_meta: n_embd = 5120
- llm_load_print_meta: n_layer = 48
- llm_load_print_meta: n_head = 40
- llm_load_print_meta: n_head_kv = 8
- llm_load_print_meta: n_rot = 128
- llm_load_print_meta: n_swa = 0
- llm_load_print_meta: n_embd_head_k = 128
- llm_load_print_meta: n_embd_head_v = 128
- llm_load_print_meta: n_gqa = 5
- llm_load_print_meta: n_embd_k_gqa = 1024
- llm_load_print_meta: n_embd_v_gqa = 1024
- llm_load_print_meta: f_norm_eps = 0.0e+00
- llm_load_print_meta: f_norm_rms_eps = 1.0e-05
- llm_load_print_meta: f_clamp_kqv = 0.0e+00
- llm_load_print_meta: f_max_alibi_bias = 0.0e+00
- llm_load_print_meta: f_logit_scale = 0.0e+00
- llm_load_print_meta: n_ff = 13824
- llm_load_print_meta: n_expert = 0
- llm_load_print_meta: n_expert_used = 0
- llm_load_print_meta: causal attn = 1
- llm_load_print_meta: pooling type = 0
- llm_load_print_meta: rope type = 2
- llm_load_print_meta: rope scaling = linear
- llm_load_print_meta: freq_base_train = 1000000.0
- llm_load_print_meta: freq_scale_train = 1
- llm_load_print_meta: n_ctx_orig_yarn = 131072
- llm_load_print_meta: rope_finetuned = unknown
- llm_load_print_meta: ssm_d_conv = 0
- llm_load_print_meta: ssm_d_inner = 0
- llm_load_print_meta: ssm_d_state = 0
- llm_load_print_meta: ssm_dt_rank = 0
- llm_load_print_meta: ssm_dt_b_c_rms = 0
- llm_load_print_meta: model type = 14B
- llm_load_print_meta: model ftype = Q4_K - Medium
- llm_load_print_meta: model params = 14.77 B
- llm_load_print_meta: model size = 8.37 GiB (4.87 BPW)
- llm_load_print_meta: general.name = DeepSeek R1 Distill Qwen 14B
- llm_load_print_meta: BOS token = 151646 '<|begin▁of▁sentence|>'
- llm_load_print_meta: EOS token = 151643 '<|end▁of▁sentence|>'
- llm_load_print_meta: EOT token = 151643 '<|end▁of▁sentence|>'
- llm_load_print_meta: PAD token = 151643 '<|end▁of▁sentence|>'
- llm_load_print_meta: LF token = 148848 'ÄĬ'
- llm_load_print_meta: FIM PRE token = 151659 '<|fim_prefix|>'
- llm_load_print_meta: FIM SUF token = 151661 '<|fim_suffix|>'
- llm_load_print_meta: FIM MID token = 151660 '<|fim_middle|>'
- llm_load_print_meta: FIM PAD token = 151662 '<|fim_pad|>'
- llm_load_print_meta: FIM REP token = 151663 '<|repo_name|>'
- llm_load_print_meta: FIM SEP token = 151664 '<|file_sep|>'
- llm_load_print_meta: EOG token = 151643 '<|end▁of▁sentence|>'
- llm_load_print_meta: EOG token = 151662 '<|fim_pad|>'
- llm_load_print_meta: EOG token = 151663 '<|repo_name|>'
- llm_load_print_meta: EOG token = 151664 '<|file_sep|>'
- llm_load_print_meta: max token length = 256
- llm_load_tensors: CPU model buffer size = 8566.04 MiB
- llama_new_context_with_model: n_seq_max = 4
- llama_new_context_with_model: n_ctx = 8192
- llama_new_context_with_model: n_ctx_per_seq = 2048
- llama_new_context_with_model: n_batch = 2048
- llama_new_context_with_model: n_ubatch = 512
- llama_new_context_with_model: flash_attn = 0
- llama_new_context_with_model: freq_base = 1000000.0
- llama_new_context_with_model: freq_scale = 1
- llama_new_context_with_model: n_ctx_per_seq (2048) < n_ctx_train (131072) -- the full capacity of the model will not be utilized
- llama_kv_cache_init: kv_size = 8192, offload = 1, type_k = 'f16', type_v = 'f16', n_layer = 48, can_shift = 1
- llama_kv_cache_init: CPU KV buffer size = 1536.00 MiB
- llama_new_context_with_model: KV self size = 1536.00 MiB, K (f16): 768.00 MiB, V (f16): 768.00 MiB
- llama_new_context_with_model: CPU output buffer size = 2.40 MiB
- llama_new_context_with_model: CPU compute buffer size = 696.01 MiB
- llama_new_context_with_model: graph nodes = 1686
- llama_new_context_with_model: graph splits = 1
- time=2025-02-03T09:26:55.929Z level=INFO source=server.go:594 msg="llama runner started in 21.09 seconds"
- [GIN] 2025/02/03 - 09:28:36 | 200 | 2m1s | 172.16.48.1 | POST "/api/chat"
- [GIN] 2025/02/03 - 09:28:46 | 200 | 10.542817507s | 172.16.48.1 | POST "/api/chat"
- [GIN] 2025/02/03 - 09:29:03 | 200 | 16.598067666s | 172.16.48.1 | POST "/api/chat"
- [GIN] 2025/02/03 - 12:13:07 | 200 | 1.634404ms | 172.16.48.1 | GET "/api/tags"
- [GIN] 2025/02/03 - 12:13:08 | 200 | 38.901µs | 172.16.48.1 | GET "/api/version"
- [GIN] 2025/02/03 - 12:13:16 | 200 | 477.079µs | 172.16.48.1 | GET "/api/tags"
- [GIN] 2025/02/03 - 12:20:05 | 404 | 9.009µs | 192.168.88.231 | GET "/apple-touch-icon-precomposed.png"
- [GIN] 2025/02/03 - 12:20:05 | 404 | 16.343µs | 192.168.88.231 | GET "/apple-touch-icon.png"
- [GIN] 2025/02/03 - 12:20:05 | 404 | 10.756µs | 192.168.88.231 | GET "/favicon.ico"
- [GIN] 2025/02/03 - 12:20:06 | 200 | 32.406µs | 192.168.88.231 | GET "/"
- [GIN] 2025/02/03 - 12:23:53 | 404 | 10.057µs | 192.168.88.231 | GET "/apple-touch-icon-precomposed.png"
- [GIN] 2025/02/03 - 12:23:53 | 404 | 10.266µs | 192.168.88.231 | GET "/apple-touch-icon.png"
- [GIN] 2025/02/03 - 12:23:53 | 404 | 10.337µs | 192.168.88.231 | GET "/favicon.ico"
- [GIN] 2025/02/03 - 12:23:53 | 200 | 49.657µs | 192.168.88.231 | GET "/"
- [GIN] 2025/02/03 - 12:24:29 | 404 | 7.473µs | 192.168.88.231 | GET "/apple-touch-icon-precomposed.png"
- [GIN] 2025/02/03 - 12:24:29 | 404 | 8.591µs | 192.168.88.231 | GET "/apple-touch-icon.png"
- [GIN] 2025/02/03 - 12:24:29 | 404 | 9.149µs | 192.168.88.231 | GET "/favicon.ico"
- [GIN] 2025/02/03 - 12:24:29 | 200 | 46.653µs | 192.168.88.231 | GET "/"
- [GIN] 2025/02/03 - 12:24:30 | 404 | 7.683µs | 192.168.88.231 | GET "/apple-touch-icon-precomposed.png"
- [GIN] 2025/02/03 - 12:24:30 | 404 | 11.942µs | 192.168.88.231 | GET "/apple-touch-icon.png"
- [GIN] 2025/02/03 - 12:24:30 | 404 | 10.965µs | 192.168.88.231 | GET "/favicon.ico"
- [GIN] 2025/02/03 - 12:24:30 | 200 | 46.583µs | 192.168.88.231 | GET "/"
- [GIN] 2025/02/03 - 12:24:32 | 404 | 8.451µs | 192.168.88.231 | GET "/apple-touch-icon-precomposed.png"
- [GIN] 2025/02/03 - 12:24:32 | 404 | 8.52µs | 192.168.88.231 | GET "/apple-touch-icon.png"
- [GIN] 2025/02/03 - 12:24:32 | 404 | 11.244µs | 192.168.88.231 | GET "/favicon.ico"
- [GIN] 2025/02/03 - 12:24:32 | 200 | 43.999µs | 192.168.88.231 | GET "/"
Advertisement
Add Comment
Please, Sign In to add comment