{"id":27489,"date":"2023-09-13T11:52:43","date_gmt":"2023-09-13T02:52:43","guid":{"rendered":"http:\/\/nori.company\/?p=27489"},"modified":"2023-09-13T11:52:43","modified_gmt":"2023-09-13T02:52:43","slug":"nvidia-llm-%ec%b6%94%eb%a1%a0%ec%9d%84-%ea%b0%80%ec%86%8d%ed%95%98%eb%8a%94-tensorrt-llm-%ec%98%a4%ed%94%88%ec%86%8c%ec%8a%a4-%ea%b3%b5%ea%b0%9c","status":"publish","type":"post","link":"https:\/\/nori.company\/?p=27489","title":{"rendered":"NVIDIA, LLM \ucd94\ub860\uc744 \uac00\uc18d\ud558\ub294 TensorRT-LLM \uc624\ud508\uc18c\uc2a4 \uacf5\uac1c"},"content":{"rendered":"<ul>\n<li>TensorRT \ub525\ub7ec\ub2dd \ucef4\ud30c\uc77c\ub7ec\uc640 \ucd5c\uc801\ud654\ub41c \ucee4\ub110, \uc804\ucc98\ub9ac\/\ud6c4\ucc98\ub9ac \ub2e8\uacc4, \uba40\ud2f0GPU\/\uba40\ud2f0\ub178\ub4dc \ud1b5\uc2e0 \uae30\ubcf8\uc694\uc18c \ub4f1\uc744 \ud3ec\ud568<\/li>\n<li>C++ \uc774\ub098 CUDA\uc5d0 \ub300\ud55c \uae4a\uc740 \uc9c0\uc2dd \uc5c6\uc774\ub3c4 LLM\uc5d0 \ucd5c\uace0 \uc131\ub2a5\uacfc \uc0ac\uc6a9\uc790 \uc815\uc758 \uae30\ub2a5\uc744 \ube60\ub974\uac8c \uc81c\uacf5 \uac00\ub2a5<\/li>\n<li>\uc624\ud508\uc18c\uc2a4 \ubaa8\ub4c8\uc2dd Python API\ub97c \uc81c\uacf5\ud558\uc5ec \uc0ac\uc6a9 \ud3b8\uc758\uc131\uacfc \ud655\uc7a5\uc131 \uc81c\uacf5<\/li>\n<li>Am&#8230;\n<p>\ucd9c\ucc98 : <a href=\"https:\/\/news.hada.io\/topic?id=10852\" target=\"_blank\" rel=\"noopener\">GeekNews &#8211; \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4 <\/a><\/li>\n<\/ul>\n","protected":false},"excerpt":{"rendered":"<p>TensorRT \ub525\ub7ec\ub2dd \ucef4\ud30c\uc77c\ub7ec\uc640 \ucd5c\uc801\ud654\ub41c \ucee4\ub110, \uc804\ucc98\ub9ac\/\ud6c4\ucc98\ub9ac \ub2e8\uacc4, \uba40\ud2f0GPU\/\uba40\ud2f0\ub178\ub4dc \ud1b5\uc2e0 \uae30\ubcf8\uc694\uc18c \ub4f1\uc744 \ud3ec\ud568 C++ \uc774\ub098 CUDA\uc5d0 \ub300\ud55c \uae4a\uc740 \uc9c0\uc2dd \uc5c6\uc774\ub3c4 LLM\uc5d0&hellip;<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"jetpack_post_was_ever_published":false,"_jetpack_newsletter_access":"","_jetpack_dont_email_post_to_subs":false,"_jetpack_newsletter_tier_id":0,"_jetpack_memberships_contains_paywalled_content":false,"_jetpack_memberships_contains_paid_content":false,"footnotes":"","jetpack_publicize_message":"","jetpack_publicize_feature_enabled":true,"jetpack_social_post_already_shared":true,"jetpack_social_options":{"image_generator_settings":{"template":"highway","default_image_id":0,"font":"","enabled":false},"version":2}},"categories":[138],"tags":[163],"class_list":["post-27489","post","type-post","status-publish","format-standard","hentry","category-it","tag-geeknews-----"],"jetpack_publicize_connections":[],"jetpack_featured_media_url":"","jetpack_sharing_enabled":true,"jetpack_shortlink":"https:\/\/wp.me\/pa3PO4-79n","jetpack-related-posts":[{"id":22949,"url":"https:\/\/nori.company\/?p=22949","url_meta":{"origin":27489,"position":0},"title":"Lamini &#8211; LLM \ud6c8\ub828\uc6a9 instruction \uc14b\uc744 \ub9cc\ub4e4\uc5b4\uc8fc\ub294 \ub370\uc774\ud130 \uc0dd\uc131\uae30","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 5\uc6d4 5\uc77c","format":false,"excerpt":"\uc790\uc2e0\ub9cc\uc758 instruction-following LLM\uc744 \ud30c\uc778\ud29c\ub2dd \uac00\ub2a5\ud558\uac8c \ud574\uc8fc\ub294 \uc624\ud508\uc18c\uc2a4 71k instruction \ub370\uc774\ud130\uc14b(CC-BY \ub77c\uc774\uc13c\uc2a4\ub85c \uc0c1\uc5c5\uc6a9\ub3c4 \uc0ac\uc6a9 \uac00\ub2a5) \ub370\uc774\ud130 \uc0dd\uc131\uae30 \ucf54\ub4dc \uc81c\uacf5 (100\uac1c\uc758 \ub370\uc774\ud130 \ud3ec\uc778\ud2b8\ub9cc\uc73c\ub85c 70k+ \ub370\uc774\ud130 \ud3ec\uc778\ud2b8 \uc0dd\uc131 \uac00\ub2a5) \uc774 100\uac1c\uc758 \ub370\uc774\ud130\ud3ec\uc778\ud2b8 \uc6d0\ud615\uc744 \ucee4\uc2a4\ud130\ub9c8\uc774\uc9d5 \ud574... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":23538,"url":"https:\/\/nori.company\/?p=23538","url_meta":{"origin":27489,"position":1},"title":"DB-GPT &#8211; \ub85c\uceecGPT\ub85c \ub370\uc774\ud130\uc5d0 \ub300\ud574 \uc9c8\ubb38\ud558\uace0 \ub2f5\ubcc0 \ubc1b\uae30","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 5\uc6d4 25\uc77c","format":false,"excerpt":"Private LLM\uc744 \uad6c\ucd95\ud574\uc11c \ub370\uc774\ud130\ubca0\uc774\uc2a4 \uae30\ubc18 \uc2dc\ub098\ub9ac\uc624\ub97c \ucc98\ub9ac\ud558\ub294 \uc624\ud508\uc18c\uc2a4 \ud504\ub85c\uc81d\ud2b8 SQL \uc5b8\uc5b4 \uc0dd\uc131 \ubc0f \ubd84\uc11d \ube44\uacf5\uac1c \ub3c4\uba54\uc778 Q&A \ubc0f \ub370\uc774\ud130 \ucc98\ub9ac \ub370\uc774\ud130\ubca0\uc774\uc2a4 \uc9c0\uc2dd Q&A \ud50c\ub7ec\uadf8\uc778 \uae30\ub2a5 \uc81c\uacf5 Auto-GPT \ud50c\ub7ec\uadf8\uc778\uc744 \ub124\uc774\ud2f0\ube0c\ud558\uac8c \uc9c0\uc6d0\ud574\uc11c \uadf8\ub300\ub85c \uc2e4\ud589 ... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":25781,"url":"https:\/\/nori.company\/?p=25781","url_meta":{"origin":27489,"position":2},"title":"Basaran &#8211; OpenAI Text Completion API\uc758 \uc624\ud508\uc18c\uc2a4 \ub300\uccb4\uc81c","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 8\uc6d4 4\uc77c","format":false,"excerpt":"Hugging Face Transformer \uae30\ubc18\uc758 \ud14d\uc2a4\ud2b8 \uc0dd\uc131 \ubaa8\ub378\uc5d0 \ub300\ud574\uc11c OpenAI\uc640 \ud638\ud658\ub418\ub294 \uc2a4\ud2b8\ub9ac\ubc0d API\ub97c \uc81c\uacf5 \ub2e4\ub978 LLM\uc744 \uc774\uc6a9\ud574\uc11c OpenAI \uc11c\ube44\uc2a4\ucc98\ub7fc \uc774\uc6a9 \uac00\ub2a5 \ub2e4\uc591\ud55c \ub514\ucf54\ub529 \uc804\ub7b5\uc744 \uc774\uc6a9\ud55c \uc2a4\ud2b8\ub9ac\ubc0d \uc0dd\uc131 \uac00\ub2a5 \ub514\ucf54\ub354-\uc628\ub9ac \ub610\ub294 \uc778\ucf54\ub354-\ub514\ucf54\ub354 \ubaa8\ub378 \ubaa8\ub450 \uc9c0\uc6d0 sur... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":28175,"url":"https:\/\/nori.company\/?p=28175","url_meta":{"origin":27489,"position":3},"title":"Superflows &#8211; SaaS\ub97c \uc704\ud55c AI Copilot \uc791\uc131\uc6a9 \ud234\ud0b7","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 9\uc6d4 29\uc77c","format":false,"excerpt":"\uc18c\ud504\ud2b8\uc6e8\uc5b4 \uc81c\ud488\uc5d0 AI \ube44\uc11c\ub97c \uc791\uc131\ud558\uae30 \uc27d\uac8c \ud574\uc8fc\ub294 \uc624\ud508\uc18c\uc2a4 \uc0ac\uc6a9\uc790\uac00 \uc790\uc5f0\uc5b4\ub85c \uc9c8\ubb38\ud558\uba74 \uc81c\ud488\uc758 API\ub97c \ud638\ucd9c\ud574\uc11c \ub2f5\ubcc0\uc744 \uc0dd\uc131 \uac1c\ubc1c\uc790 \ub300\uc2dc\ubcf4\ub4dc, Public \uc2a4\ud2b8\ub9ac\ubc0d API \uc81c\uacf5 \uba40\ud2f0 LLM \uc9c0\uc6d0(Llama 2, GPT4, Claude 2, PaLM 2,..) API \uc2a4\ud399\uc744 \uc5c5\ub85c\ub4dc\ud558\uc5ec \ube60\ub978 \uc14b\uc5c5 \uc9c0\uc6d0... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":27475,"url":"https:\/\/nori.company\/?p=27475","url_meta":{"origin":27489,"position":4},"title":"\uc790\uc2e0\ub9cc\uc758 Llama 2\ub97c \uc138\ubc00\ud558\uac8c \uc870\uc815\ud558\uc5ec GPT-3.5\/4\ub97c \ub300\uccb4\ud558\ub2e4","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 9\uc6d4 13\uc77c","format":false,"excerpt":"HN\uc5d0\uc11c \uc624\ud508\uc18c\uc2a4 LLM\uc758 \ubbf8\uc138 \uc870\uc815\uc5d0 \ub300\ud55c \uad00\uc2ec\uc774 \ub9ce\uc774 \uc99d\uac00\ud558\uace0 \uc788\uc74c (\uc608: Anyscale\uc758 \uac8c\uc2dc\ubb3c) \ubaa8\ub378 \ubbf8\uc138 \uc870\uc815\uc5d0 \ub300\ud55c \uba87 \ub144\uac04\uc758 \uacbd\ud5d8\uacfc \ud1b5\ucc30, \uadf8\ub9ac\uace0 \uc2e4\uc6a9\uc801\uc778 \ucf54\ub4dc \uacf5\uc720 \ub370\uc774\ud130 \ub77c\ubca8\ub9c1, \ubbf8\uc138 \uc870\uc815, \ud6a8\uc728\uc801\uc778 \ucd94\ub860 \uc2e4\ud589, \ube44\uc6a9\/\uc131\ub2a5 \ud3c9\uac00 \ub4f1\uc744 \ub2e4\ub8e8\ub294 \ub178\ud2b8\ubd81 \uc138\ud2b8 \uc81c\uacf5 \ud14c\uc2a4\ud2b8 \uc138\ud2b8... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":23242,"url":"https:\/\/nori.company\/?p=23242","url_meta":{"origin":27489,"position":5},"title":"Open-LLaMa &#8211; LLM \uc791\uc131\uc6a9 \uc644\uc804\ud55c \ud2b8\ub808\uc774\ub2dd \ud30c\uc774\ud504\ub77c\uc778","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 5\uc6d4 16\uc77c","format":false,"excerpt":"\ub370\uc774\ud130\uc14b \uc0dd\uc131\ubd80\ud130 \ud1a0\ud070\ud654, \ud504\ub86c\ud504\ud2b8 \ud29c\ub2dd, LoRA \ubc0f RLHF \uae4c\uc9c0 \uc804\uccb4 \ud30c\uc774\ud504\ub77c\uc778\uc744 \uad6c\uc131\ud55c \uc624\ud508\uc18c\uc2a4 \uc0ac\uc804\ud559\uc2b5\ub41c Open-LLama-V2-pretrain \ubaa8\ub378\ub3c4 Hugging Face\uc5d0 \uacf5\uac1c FastChat \ud3c9\uac00\ubc29\ubc95\uc5d0 \uc758\ud558\uba74 GPT-3.5\uc640 \ube44\uad50\uc2dc \uc57d 89%\uc758 \uc131\ub2a5\uc744 \ub0b8\ub2e4\uace0(\uc911\uad6d\uc5b4\ub85c\ub41c \uc9c8\ubb38\uc5d0 \ub300\ud574) \ud559\uc2b5 \uc2a4\ud53c\ub4dc\ub294 36... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]}],"_links":{"self":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/27489","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=27489"}],"version-history":[{"count":1,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/27489\/revisions"}],"predecessor-version":[{"id":27490,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/27489\/revisions\/27490"}],"wp:attachment":[{"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=27489"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=27489"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=27489"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}