{"id":24040,"date":"2023-06-14T11:46:55","date_gmt":"2023-06-14T02:46:55","guid":{"rendered":"http:\/\/nori.company\/?p=24040"},"modified":"2023-06-14T11:46:55","modified_gmt":"2023-06-14T02:46:55","slug":"llama-cpp-%ec%97%90-%ec%a0%84%ec%b2%b4-cuda-gpu-%ea%b0%80%ec%86%8d-%ec%b6%94%ea%b0%80","status":"publish","type":"post","link":"https:\/\/nori.company\/?p=24040","title":{"rendered":"llama.cpp \uc5d0 \uc804\uccb4 CUDA GPU \uac00\uc18d \ucd94\uac00"},"content":{"rendered":"<ul>\n<li>\ubaa8\ub4e0 \ub0a8\uc740 ggml \ud150\uc11c\ub4e4\uc5d0 GPU \uac00\uc18d\uc744 \ucd94\uac00\ud558\ub294 PR<\/li>\n<li>RTX 3090\uc5d0\uc11c \ud504\ub86c\ud504\ud2b8 \ucc98\ub9ac\ub294 2\ubc30, \ud1a0\ud070 \uc0dd\uc131\uc740 1.3~1.8\ubc30\uae4c\uc9c0 \uac00\uc18d<\/li>\n<li>4090+i9\uc5d0\uc11c 7B q4 \ubaa8\ub378\uc758 \uacbd\uc6b0 \ucd08\ub2f9 109\ud1a0\ud070 \uc0dd\uc131<\/li>\n<\/ul>\n<p>&#8230;<\/p>\n<p>\ucd9c\ucc98 : <a href=\"https:\/\/news.hada.io\/topic?id=9390\" target=\"_blank\" rel=\"noopener\">GeekNews &#8211; \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4 <\/a><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\ubaa8\ub4e0 \ub0a8\uc740 ggml \ud150\uc11c\ub4e4\uc5d0 GPU \uac00\uc18d\uc744 \ucd94\uac00\ud558\ub294 PR RTX 3090\uc5d0\uc11c \ud504\ub86c\ud504\ud2b8 \ucc98\ub9ac\ub294 2\ubc30, \ud1a0\ud070 \uc0dd\uc131\uc740 1.3~1.8\ubc30\uae4c\uc9c0 \uac00\uc18d 4090+i9\uc5d0\uc11c 7B q4&hellip;<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"jetpack_post_was_ever_published":false,"_jetpack_newsletter_access":"","_jetpack_dont_email_post_to_subs":false,"_jetpack_newsletter_tier_id":0,"_jetpack_memberships_contains_paywalled_content":false,"_jetpack_memberships_contains_paid_content":false,"footnotes":"","jetpack_publicize_message":"","jetpack_publicize_feature_enabled":true,"jetpack_social_post_already_shared":true,"jetpack_social_options":{"image_generator_settings":{"template":"highway","default_image_id":0,"font":"","enabled":false},"version":2}},"categories":[138],"tags":[163],"class_list":["post-24040","post","type-post","status-publish","format-standard","hentry","category-it","tag-geeknews-----"],"jetpack_publicize_connections":[],"jetpack_featured_media_url":"","jetpack_sharing_enabled":true,"jetpack_shortlink":"https:\/\/wp.me\/pa3PO4-6fK","jetpack-related-posts":[{"id":23708,"url":"https:\/\/nori.company\/?p=23708","url_meta":{"origin":24040,"position":0},"title":"NVIDIA DGX GH200: \ucd5c\ucd08\uc758 100 \ud14c\ub77c\ubc14\uc774\ud2b8 GPU \uba54\ubaa8\ub9ac \uc2dc\uc2a4\ud15c","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 6\uc6d4 1\uc77c","format":false,"excerpt":"COMPUTEX 2023\uc5d0\uc11c NVIDIA\uac00 \ubc1c\ud45c\ud55c GPU\uac00\uc18d \ucef4\ud4e8\ud305\uc758 \uc2e0\uae30\uc6d0 Grace Hopper Superchip \uacfc NVLink \uc2a4\uc704\uce58 \uc2dc\uc2a4\ud15c\uc744 \uacb0\ud569\ud558\uc5ec \ucd5c\ub300 256\uac1c\uc758 GPU\ub97c \ud1b5\ud569 144\ud14c\ub77c\ubc14\uc774\ud2b8\uc758 \uba54\ubaa8\ub9ac\ub97c \uace0\uc18d\uc73c\ub85c \uc811\uadfc \uac00\ub2a5. \ucd5c\ucd08\ub85c 100\ud14c\ub77c \uc7a5\ubcbd\uc744 \ud5c8\ubb3c\uc740 \ucd5c\ucd08\uc758 \uc288\ud37c\ucef4\ud4e8\ud130 1\uac1c\uc758 A100 320GB \uc2dc\uc2a4\ud15c\uacfc \ube44\uad50... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":23248,"url":"https:\/\/nori.company\/?p=23248","url_meta":{"origin":24040,"position":1},"title":"Brex\uc758 \ud504\ub86c\ud504\ud2b8 \uc5d4\uc9c0\ub2c8\uc5b4\ub9c1 \uac00\uc774\ub4dc","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 5\uc6d4 16\uc77c","format":false,"excerpt":"\ubbf8\uad6d\uc758 \ud540\ud14c\ud06c \ud68c\uc0ac\uc778 Brex\uac00 \ub0b4\ubd80 \uc9c1\uc6d0\ub4e4\uc744 \uc704\ud574 \uc791\uc131\ud55c Prompt Engineering \uac00\uc774\ub4dc \ubaa9\ucc28 LLM \uc774\ub780 \ubb34\uc5c7\uc778\uac00 \ud504\ub86c\ud504\ud2b8\ub780 ? : \ud788\ub4e0 \ud504\ub86c\ud504\ud2b8, \ud1a0\ud070, \ud1a0\ud070 \ub9ac\ubc0b, \ud504\ub86c\ud504\ud2b8 \ud574\ud0b9 \uc65c \ud504\ub86c\ud504\ud2b8 \uc5d4\uc9c0\ub2c8\uc5b4\ub9c1\uc774 \ud544\uc694\ud55c\uac00? : Bot\uc5d0\uc11c \ubb3c\uace0\uae30 \uc8fc\uae30, \ubb3c\uace0\uae30 \uc7a1\ub294 \ubc95 \uac00\ub974... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":24079,"url":"https:\/\/nori.company\/?p=24079","url_meta":{"origin":24040,"position":2},"title":"LocalAI &#8211; \uc140\ud504\ud638\uc2a4\ud2b8 \uac00\ub2a5\ud55c OpenAI \ud638\ud658 API","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 6\uc6d4 15\uc77c","format":false,"excerpt":"OpenAI\uc640 \ud638\ud658\ub418\ub294 REST API\ub85c \ub2e4\uc591\ud55c LLM\ub4e4\uc744 \uc774\uc6a9 \uac00\ub2a5 GPU \uc5c6\uc774\ub3c4 \uac00\ub2a5. llama.cpp \ud638\ud658 LLM\uc5d0\uc11c\ub294 GPU \uac00\uc18d \uc9c0\uc6d0 \ub2e4\uc911 \ubaa8\ub378\uc744 \uc9c0\uc6d0\ud558\uba70, \uc624\ub514\uc624 \ud2b8\ub79c\uc2a4\ud06c\ub9bd\uc158, \ud14d\uc2a4\ud2b8 \uc0dd\uc131, \uc774\ubbf8\uc9c0 \uc0dd\uc131(Stable Diffusion) \uc9c0\uc6d0 \ud55c\ubc88 \ub85c\ub529\ub418\uba74 \ubaa8\ub378\uc744 \uba54\ubaa8\ub9ac\uc5d0 \uc800\uc7a5\ud574\ub450\uace0 \ube60\ub978 \ucd94\ub860 \uc9c0\uc6d0... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":24147,"url":"https:\/\/nori.company\/?p=24147","url_meta":{"origin":24040,"position":3},"title":"roop &#8211; \uc6d0\ud074\ub9ad \ub525\ud398\uc774\ud06c(\uc5bc\uad74 \uad50\uccb4)","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 6\uc6d4 17\uc77c","format":false,"excerpt":"CPU \ubc0f GPU \uac00\uc18d \uc9c0\uc6d0(AMD, NVIDIA, Apple Silicon, Intel) \ubc14\uafc0 \uc5bc\uad74 \uc774\ubbf8\uc9c0\uc640 \ud0c0\uac9f \uc774\ubbf8\uc9c0\/\ub3d9\uc601\uc0c1 \ub9cc \ub123\uace0 \ud074\ub9ad\ud558\uba74 \ubc14\ub85c \uc0dd\uc131 \uc624\uc6a9 \ubc29\uc9c0\ub97c \uc704\ud574 \ubd80\uc801\uc808\ud55c \ubbf8\ub514\uc5b4\uc5d0\uc11c \uc791\ub3d9\ud558\ub294 \uac83\uc744 \ubc29\uc9c0\ud558\ub294 \uae30\ub2a5 \ub0b4\uc7a5 ... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":22449,"url":"https:\/\/nori.company\/?p=22449","url_meta":{"origin":24040,"position":4},"title":"Web LLM &#8211; WebGPU\ub85c \ube0c\ub77c\uc6b0\uc800\uc5d0\uc11c LLM \uac00\uc18d\ud558\uc5ec \uc2e4\ud589\ud558\uae30","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 4\uc6d4 18\uc77c","format":false,"excerpt":"\uc11c\ubc84 \uc5c6\uc774 \ube0c\ub77c\uc6b0\uc800\uc5d0\uc11c LLaMA, Vicuna \uac19\uc740 LLM\uc744 WASM\uc744 \uc774\uc6a9\ud558\uc5ec \uad6c\ub3d9 WebGPU\ub85c \uac00\uc18d \ud558\uc9c0\ub9cc, \ubcc4\ub3c4\ub85c Apache TVM\uc774 \uc9c0\uc6d0\ud558\ub294 GPU \ubc31\uc5d4\ub4dc\ub4e4(CUDA, OpenCL, Vulkan)\ub3c4 \uc9c0\uc6d0 MLC(Machine Learning Compilation) \uae30\uc220\uc744 \uc0ac\uc6a9 ... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":29948,"url":"https:\/\/nori.company\/?p=29948","url_meta":{"origin":24040,"position":5},"title":"Contour &#8211; C++\ub85c \uc791\uc131\ub41c \ud604\ub300\uc801\uc774\uace0 \ube60\ub978 \ud130\ubbf8\ub110 \uc5d0\ubbac\ub808\uc774\ud130","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 11\uc6d4 11\uc77c","format":false,"excerpt":"\ub9ac\ub205\uc2a4, OS\/X, FreeBSD, \uc708\ub3c4\uc6b0 \uc9c0\uc6d0 GPU \uac00\uc18d \ub80c\ub354\ub9c1, High-DPI, 256 \ubc0f \ud2b8\ub8e8\uceec\ub7ec \uc9c0\uc6d0 \ud3f0\ud2b8 Ligatures, \uc720\ub2c8\ucf54\ub4dc Emoji \ubc0f Grapheme, \ubcfc\ub4dc\/\uc774\ud0e4\ub9ad \ud3f0\ud2b8, Sixel \uc778\ub77c\uc778 \uc774\ubbf8\uc9c0 \ub7f0\ud0c0\uc784\uc5d0 Configuration \ub9ac\ub85c\ub4dc \uac00\ub2a5 \ud074\ub9ad\uac00\ub2a5\ud55c \ud558\uc774\ud37c \ub9c1\ud06c, \ud14d\uc2a4\ud2b8 Reflow \ub4f1 ... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]}],"_links":{"self":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/24040","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=24040"}],"version-history":[{"count":1,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/24040\/revisions"}],"predecessor-version":[{"id":24041,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/24040\/revisions\/24041"}],"wp:attachment":[{"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=24040"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=24040"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=24040"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}