Guest User

Untitled

a guest
Feb 3rd, 2025
21
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 6.59 KB | None | 0 0
  1. llm_load_print_meta: n_merges = 151387
  2. llm_load_print_meta: vocab_only = 0
  3. llm_load_print_meta: n_ctx_train = 131072
  4. llm_load_print_meta: n_embd = 5120
  5. llm_load_print_meta: n_layer = 48
  6. llm_load_print_meta: n_head = 40
  7. llm_load_print_meta: n_head_kv = 8
  8. llm_load_print_meta: n_rot = 128
  9. llm_load_print_meta: n_swa = 0
  10. llm_load_print_meta: n_embd_head_k = 128
  11. llm_load_print_meta: n_embd_head_v = 128
  12. llm_load_print_meta: n_gqa = 5
  13. llm_load_print_meta: n_embd_k_gqa = 1024
  14. llm_load_print_meta: n_embd_v_gqa = 1024
  15. llm_load_print_meta: f_norm_eps = 0.0e+00
  16. llm_load_print_meta: f_norm_rms_eps = 1.0e-05
  17. llm_load_print_meta: f_clamp_kqv = 0.0e+00
  18. llm_load_print_meta: f_max_alibi_bias = 0.0e+00
  19. llm_load_print_meta: f_logit_scale = 0.0e+00
  20. llm_load_print_meta: n_ff = 13824
  21. llm_load_print_meta: n_expert = 0
  22. llm_load_print_meta: n_expert_used = 0
  23. llm_load_print_meta: causal attn = 1
  24. llm_load_print_meta: pooling type = 0
  25. llm_load_print_meta: rope type = 2
  26. llm_load_print_meta: rope scaling = linear
  27. llm_load_print_meta: freq_base_train = 1000000.0
  28. llm_load_print_meta: freq_scale_train = 1
  29. llm_load_print_meta: n_ctx_orig_yarn = 131072
  30. llm_load_print_meta: rope_finetuned = unknown
  31. llm_load_print_meta: ssm_d_conv = 0
  32. llm_load_print_meta: ssm_d_inner = 0
  33. llm_load_print_meta: ssm_d_state = 0
  34. llm_load_print_meta: ssm_dt_rank = 0
  35. llm_load_print_meta: ssm_dt_b_c_rms = 0
  36. llm_load_print_meta: model type = 14B
  37. llm_load_print_meta: model ftype = Q4_K - Medium
  38. llm_load_print_meta: model params = 14.77 B
  39. llm_load_print_meta: model size = 8.37 GiB (4.87 BPW)
  40. llm_load_print_meta: general.name = DeepSeek R1 Distill Qwen 14B
  41. llm_load_print_meta: BOS token = 151646 '<|begin▁of▁sentence|>'
  42. llm_load_print_meta: EOS token = 151643 '<|end▁of▁sentence|>'
  43. llm_load_print_meta: EOT token = 151643 '<|end▁of▁sentence|>'
  44. llm_load_print_meta: PAD token = 151643 '<|end▁of▁sentence|>'
  45. llm_load_print_meta: LF token = 148848 'ÄĬ'
  46. llm_load_print_meta: FIM PRE token = 151659 '<|fim_prefix|>'
  47. llm_load_print_meta: FIM SUF token = 151661 '<|fim_suffix|>'
  48. llm_load_print_meta: FIM MID token = 151660 '<|fim_middle|>'
  49. llm_load_print_meta: FIM PAD token = 151662 '<|fim_pad|>'
  50. llm_load_print_meta: FIM REP token = 151663 '<|repo_name|>'
  51. llm_load_print_meta: FIM SEP token = 151664 '<|file_sep|>'
  52. llm_load_print_meta: EOG token = 151643 '<|end▁of▁sentence|>'
  53. llm_load_print_meta: EOG token = 151662 '<|fim_pad|>'
  54. llm_load_print_meta: EOG token = 151663 '<|repo_name|>'
  55. llm_load_print_meta: EOG token = 151664 '<|file_sep|>'
  56. llm_load_print_meta: max token length = 256
  57. llm_load_tensors: CPU model buffer size = 8566.04 MiB
  58. llama_new_context_with_model: n_seq_max = 4
  59. llama_new_context_with_model: n_ctx = 8192
  60. llama_new_context_with_model: n_ctx_per_seq = 2048
  61. llama_new_context_with_model: n_batch = 2048
  62. llama_new_context_with_model: n_ubatch = 512
  63. llama_new_context_with_model: flash_attn = 0
  64. llama_new_context_with_model: freq_base = 1000000.0
  65. llama_new_context_with_model: freq_scale = 1
  66. llama_new_context_with_model: n_ctx_per_seq (2048) < n_ctx_train (131072) -- the full capacity of the model will not be utilized
  67. llama_kv_cache_init: kv_size = 8192, offload = 1, type_k = 'f16', type_v = 'f16', n_layer = 48, can_shift = 1
  68. llama_kv_cache_init: CPU KV buffer size = 1536.00 MiB
  69. llama_new_context_with_model: KV self size = 1536.00 MiB, K (f16): 768.00 MiB, V (f16): 768.00 MiB
  70. llama_new_context_with_model: CPU output buffer size = 2.40 MiB
  71. llama_new_context_with_model: CPU compute buffer size = 696.01 MiB
  72. llama_new_context_with_model: graph nodes = 1686
  73. llama_new_context_with_model: graph splits = 1
  74. time=2025-02-03T09:26:55.929Z level=INFO source=server.go:594 msg="llama runner started in 21.09 seconds"
  75. [GIN] 2025/02/03 - 09:28:36 | 200 | 2m1s | 172.16.48.1 | POST "/api/chat"
  76. [GIN] 2025/02/03 - 09:28:46 | 200 | 10.542817507s | 172.16.48.1 | POST "/api/chat"
  77. [GIN] 2025/02/03 - 09:29:03 | 200 | 16.598067666s | 172.16.48.1 | POST "/api/chat"
  78. [GIN] 2025/02/03 - 12:13:07 | 200 | 1.634404ms | 172.16.48.1 | GET "/api/tags"
  79. [GIN] 2025/02/03 - 12:13:08 | 200 | 38.901µs | 172.16.48.1 | GET "/api/version"
  80. [GIN] 2025/02/03 - 12:13:16 | 200 | 477.079µs | 172.16.48.1 | GET "/api/tags"
  81. [GIN] 2025/02/03 - 12:20:05 | 404 | 9.009µs | 192.168.88.231 | GET "/apple-touch-icon-precomposed.png"
  82. [GIN] 2025/02/03 - 12:20:05 | 404 | 16.343µs | 192.168.88.231 | GET "/apple-touch-icon.png"
  83. [GIN] 2025/02/03 - 12:20:05 | 404 | 10.756µs | 192.168.88.231 | GET "/favicon.ico"
  84. [GIN] 2025/02/03 - 12:20:06 | 200 | 32.406µs | 192.168.88.231 | GET "/"
  85. [GIN] 2025/02/03 - 12:23:53 | 404 | 10.057µs | 192.168.88.231 | GET "/apple-touch-icon-precomposed.png"
  86. [GIN] 2025/02/03 - 12:23:53 | 404 | 10.266µs | 192.168.88.231 | GET "/apple-touch-icon.png"
  87. [GIN] 2025/02/03 - 12:23:53 | 404 | 10.337µs | 192.168.88.231 | GET "/favicon.ico"
  88. [GIN] 2025/02/03 - 12:23:53 | 200 | 49.657µs | 192.168.88.231 | GET "/"
  89. [GIN] 2025/02/03 - 12:24:29 | 404 | 7.473µs | 192.168.88.231 | GET "/apple-touch-icon-precomposed.png"
  90. [GIN] 2025/02/03 - 12:24:29 | 404 | 8.591µs | 192.168.88.231 | GET "/apple-touch-icon.png"
  91. [GIN] 2025/02/03 - 12:24:29 | 404 | 9.149µs | 192.168.88.231 | GET "/favicon.ico"
  92. [GIN] 2025/02/03 - 12:24:29 | 200 | 46.653µs | 192.168.88.231 | GET "/"
  93. [GIN] 2025/02/03 - 12:24:30 | 404 | 7.683µs | 192.168.88.231 | GET "/apple-touch-icon-precomposed.png"
  94. [GIN] 2025/02/03 - 12:24:30 | 404 | 11.942µs | 192.168.88.231 | GET "/apple-touch-icon.png"
  95. [GIN] 2025/02/03 - 12:24:30 | 404 | 10.965µs | 192.168.88.231 | GET "/favicon.ico"
  96. [GIN] 2025/02/03 - 12:24:30 | 200 | 46.583µs | 192.168.88.231 | GET "/"
  97. [GIN] 2025/02/03 - 12:24:32 | 404 | 8.451µs | 192.168.88.231 | GET "/apple-touch-icon-precomposed.png"
  98. [GIN] 2025/02/03 - 12:24:32 | 404 | 8.52µs | 192.168.88.231 | GET "/apple-touch-icon.png"
  99. [GIN] 2025/02/03 - 12:24:32 | 404 | 11.244µs | 192.168.88.231 | GET "/favicon.ico"
  100. [GIN] 2025/02/03 - 12:24:32 | 200 | 43.999µs | 192.168.88.231 | GET "/"
  101.  
Advertisement
Add Comment
Please, Sign In to add comment