{"id":22449,"date":"2023-04-18T10:48:34","date_gmt":"2023-04-18T01:48:34","guid":{"rendered":"http:\/\/nori.company\/?p=22449"},"modified":"2023-04-18T10:48:34","modified_gmt":"2023-04-18T01:48:34","slug":"web-llm-webgpu%eb%a1%9c-%eb%b8%8c%eb%9d%bc%ec%9a%b0%ec%a0%80%ec%97%90%ec%84%9c-llm-%ea%b0%80%ec%86%8d%ed%95%98%ec%97%ac-%ec%8b%a4%ed%96%89%ed%95%98%ea%b8%b0","status":"publish","type":"post","link":"https:\/\/nori.company\/?p=22449","title":{"rendered":"Web LLM &#8211; WebGPU\ub85c \ube0c\ub77c\uc6b0\uc800\uc5d0\uc11c LLM \uac00\uc18d\ud558\uc5ec \uc2e4\ud589\ud558\uae30"},"content":{"rendered":"<ul>\n<li>\uc11c\ubc84 \uc5c6\uc774 \ube0c\ub77c\uc6b0\uc800\uc5d0\uc11c LLaMA, Vicuna \uac19\uc740 LLM\uc744 WASM\uc744 \uc774\uc6a9\ud558\uc5ec \uad6c\ub3d9<\/li>\n<li>WebGPU\ub85c \uac00\uc18d \ud558\uc9c0\ub9cc, \ubcc4\ub3c4\ub85c Apache TVM\uc774 \uc9c0\uc6d0\ud558\ub294 GPU \ubc31\uc5d4\ub4dc\ub4e4(CUDA, OpenCL, Vulkan)\ub3c4 \uc9c0\uc6d0<\/li>\n<li>MLC(Machine Learning Compilation) \uae30\uc220\uc744 \uc0ac\uc6a9<\/li>\n<\/ul>\n<p>&#8230;<\/p>\n<p>\ucd9c\ucc98 : <a href=\"https:\/\/news.hada.io\/topic?id=8977\" target=\"_blank\" rel=\"noopener\">GeekNews &#8211; \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4 <\/a><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\uc11c\ubc84 \uc5c6\uc774 \ube0c\ub77c\uc6b0\uc800\uc5d0\uc11c LLaMA, Vicuna \uac19\uc740 LLM\uc744 WASM\uc744 \uc774\uc6a9\ud558\uc5ec \uad6c\ub3d9 WebGPU\ub85c \uac00\uc18d \ud558\uc9c0\ub9cc, \ubcc4\ub3c4\ub85c Apache TVM\uc774 \uc9c0\uc6d0\ud558\ub294 GPU \ubc31\uc5d4\ub4dc\ub4e4(CUDA, OpenCL,&hellip;<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"jetpack_post_was_ever_published":false,"_jetpack_newsletter_access":"","_jetpack_dont_email_post_to_subs":false,"_jetpack_newsletter_tier_id":0,"_jetpack_memberships_contains_paywalled_content":false,"_jetpack_memberships_contains_paid_content":false,"footnotes":"","jetpack_publicize_message":"","jetpack_publicize_feature_enabled":true,"jetpack_social_post_already_shared":true,"jetpack_social_options":{"image_generator_settings":{"template":"highway","default_image_id":0,"font":"","enabled":false},"version":2}},"categories":[138],"tags":[163],"class_list":["post-22449","post","type-post","status-publish","format-standard","hentry","category-it","tag-geeknews-----"],"jetpack_publicize_connections":[],"jetpack_featured_media_url":"","jetpack_sharing_enabled":true,"jetpack_shortlink":"https:\/\/wp.me\/pa3PO4-5Q5","jetpack-related-posts":[{"id":26861,"url":"https:\/\/nori.company\/?p=26861","url_meta":{"origin":22449,"position":0},"title":"Web LLM &#8211; Llama2 7B\/13B \uc9c0\uc6d0 \uc2dc\uc791","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 8\uc6d4 30\uc77c","format":false,"excerpt":"\uc11c\ubc84 \uc5c6\uc774 \ube0c\ub77c\uc6b0\uc800\uc5d0\uc11c Llama, RedPajama, Vicuna \uac19\uc740 LLM\uc744 WASM\uc73c\ub85c \uad6c\ub3d9\ud558\ub294 \uc11c\ube44\uc2a4 Llama 2 7B\/13B \uc9c0\uc6d0 \uc2dc\uc791 Llama 2 70B\ub3c4 \uc9c0\uc6d0\ud558\uc9c0\ub9cc, \uc560\ud50c \uc2e4\ub9ac\ucf58 \ub9e5 + 64GB \ub7a8 \uc774\uc0c1\uc5d0\uc11c\ub9cc \uc0ac\uc6a9 \uac00\ub2a5 WebGPU\ub85c \uac00\uc18d ... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":24292,"url":"https:\/\/nori.company\/?p=24292","url_meta":{"origin":22449,"position":1},"title":"OpenLLM &#8211; LLM\uc744 \ud504\ub85c\ub355\uc158\uc5d0\uc11c \uc6b4\uc601\ud558\uae30 \uc704\ud55c \uc624\ud508 \ud50c\ub7ab\ud3fc","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 6\uc6d4 22\uc77c","format":false,"excerpt":"\ub2e4\uc591\ud55c \uc885\ub958\uc758 LLM\uc744 \uc9c0\uc6d0\ud558\uc5ec \ucd94\ub860, \ubc30\ud3ec \uac00\ub2a5 StableLM, Falcon, DOlly, Flan-T5, ChatGLM, StarCoder,.. \ud558\ub098\uc758 \uba85\ub839\uc73c\ub85c LLM\uc744 RESTful API \ub610\ub294 gRPC\ub85c \uc11c\ube59 WebUI, CLI, Python\/Javascript Client \ub610\ub294 \ubaa8\ub4e0 HTTP Client\uc5d0\uc11c \ud638\ucd9c LangChai... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":30219,"url":"https:\/\/nori.company\/?p=30219","url_meta":{"origin":22449,"position":2},"title":"Tarsier &#8211; \uc6f9 \uc778\ud130\ub799\uc158 \uc5d0\uc774\uc804\ud2b8\ub97c \uc704\ud55c \ube44\uc83c \uc720\ud2f8\ub9ac\ud2f0","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 11\uc6d4 16\uc77c","format":false,"excerpt":"GPT-4(V)\ub85c \uc6f9 \uc778\ud130\ub799\uc158\uc744 \uc790\ub3d9\ud654\ud560 \ub54c \uc0dd\uae30\ub294 \uc9c8\ubb38\ub4e4 LLM\uc758 \uc751\ub2f5\uc744 \uc5b4\ub5bb\uac8c \uc6f9 \uc5d8\ub9ac\uba3c\ud2b8\ub85c \ub9e4\ud551\ud560\uae4c? LLM\uc758 \uc791\uc5c5 \uacf5\uac04\uc744 \ub354 \uc798 \uc774\ud574\ud558\uae30 \uc704\ud574 \ud398\uc774\uc9c0\ub97c \ub9c8\ud06c\uc5c5\ud558\ub824\uba74 \uc5b4\ub5bb\uac8c \ud574\uc57c \ud560\uae4c? \ud14d\uc2a4\ud2b8 \uc804\uc6a9 LLM\uc5d0 '\uc2a4\ud06c\ub9b0\uc0f7'\uc744 \uc81c\uacf5\ud558\ub824\uba74 \uc5b4\ub5bb\uac8c \ud574\uc57c \ud558\ub098? Tarsier... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":27098,"url":"https:\/\/nori.company\/?p=27098","url_meta":{"origin":22449,"position":3},"title":"LangFuse &#8211; LLM\uc571\uc744 \uc704\ud55c \uc624\ud508\uc18c\uc2a4 Observability &#038; Analytics \uc194\ub8e8\uc158","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 9\uc6d4 5\uc77c","format":false,"excerpt":"LLM\uc744 \uc774\uc6a9\ud558\uc5ec \ub9cc\ub4e4\uc5b4\uc9c4 \uc571\ub4e4\uc744 \uc704\ud55c \ub3c4\uad6c Observability \ubcf5\uc7a1\ud55c \ub85c\uadf8\uc640 \ud2b8\ub808\uc774\uc2a4\ub97c \ube44\uc96c\uc5bc UI\ub85c \ud0d0\uc0c9 \ubc0f \ub514\ubc84\uadf8 \uc0ac\uc6a9\uc790 \ud53c\ub4dc\ubc31\uc5d0 \ub530\ub77c \uc2e4\ud589 \ud2b8\ub808\uc774\uc2a4\ub97c \uc138\uadf8\uba3c\ud2b8\ud654 Analytics: \ube44\uc6a9, \uc9c0\uc5f0\uc2dc\uac04 \ubc0f \uc751\ub2f5 \ud488\uc9c8\uc744 \uce21\uc815 & \uac1c\uc120 \ubaa8\ub378\ubcc4 \ud1a0\uadfc \uc0ac\uc6a9\ub7c9,... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":27116,"url":"https:\/\/nori.company\/?p=27116","url_meta":{"origin":22449,"position":4},"title":"LangFuse &#8211; LLM\uc571\uc744 \uc704\ud55c \uc624\ud508\uc18c\uc2a4 Observability &#038; Analytics \uc194\ub8e8\uc158","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 9\uc6d4 5\uc77c","format":false,"excerpt":"LLM\uc744 \uc774\uc6a9\ud558\uc5ec \ub9cc\ub4e4\uc5b4\uc9c4 \uc571\ub4e4\uc744 \uc704\ud55c \ub3c4\uad6c Observability \ubcf5\uc7a1\ud55c \ub85c\uadf8\uc640 \ud2b8\ub808\uc774\uc2a4\ub97c \ube44\uc96c\uc5bc UI\ub85c \ud0d0\uc0c9 \ubc0f \ub514\ubc84\uadf8 \uc0ac\uc6a9\uc790 \ud53c\ub4dc\ubc31\uc5d0 \ub530\ub77c \uc2e4\ud589 \ud2b8\ub808\uc774\uc2a4\ub97c \uc138\uadf8\uba3c\ud2b8\ud654 Analytics: \ube44\uc6a9, \uc9c0\uc5f0\uc2dc\uac04 \ubc0f \uc751\ub2f5 \ud488\uc9c8\uc744 \uce21\uc815 & \uac1c\uc120 \ubaa8\ub378\ubcc4 \ud1a0\uadfc \uc0ac\uc6a9\ub7c9,... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":27928,"url":"https:\/\/nori.company\/?p=27928","url_meta":{"origin":22449,"position":5},"title":"WhatsApp-Llama &#8211; \uc790\uc2e0\uc758 \uc653\uce20\uc571 \ub300\ud654\ub85c LLM \ud30c\uc778\ud29c\ub2dd \ud558\uae30","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 9\uc6d4 23\uc77c","format":false,"excerpt":"Llama 7B \ub97c \uc790\uc2e0\uc758 \uc653\uce20\uc571 \ub300\ud654\ub85c \ud30c\uc778\ud29c\ub2dd\ud558\uc5ec, \uc790\uc2e0\ucc98\ub7fc \ub9d0\ud558\uac8c \ub9cc\ub4e4\uae30 QLoRA \uc640 int4 \uc591\uc790\ud654\ub85c \uc2f1\uae00 GPU(P100 + 16GB)\ub85c \ud30c\uc778\ud29c\ub2dd \uac00\ub2a5 3\uac00\uc9c0 \uc9c8\ubb38\uc5d0 \ub300\ud55c 2\uac00\uc9c0 \ub2f5(LLM or \ubcf8\uc778)\uc744 \ud3c9\uac00\ud558\ub294 \uc2e4\ud5d8\uacb0\uacfc \uc57d 10%\uc758 \uce5c\uad6c\ub4e4(20\uba85\uc911 2\uba85)\uc774 \uc18d\uc558\ub2e4\uace0 ... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]}],"_links":{"self":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/22449","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=22449"}],"version-history":[{"count":1,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/22449\/revisions"}],"predecessor-version":[{"id":22450,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/22449\/revisions\/22450"}],"wp:attachment":[{"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=22449"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=22449"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=22449"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}