{"id":23067,"date":"2023-05-09T10:47:20","date_gmt":"2023-05-09T01:47:20","guid":{"rendered":"http:\/\/nori.company\/?p=23067"},"modified":"2023-05-09T10:47:20","modified_gmt":"2023-05-09T01:47:20","slug":"mpt-7b-%ec%83%81%ec%97%85%ec%a0%81%ec%9c%bc%eb%a1%9c-%ec%9d%b4%ec%9a%a9-%ea%b0%80%eb%8a%a5%ed%95%9c-%ec%98%a4%ed%94%88%ec%86%8c%ec%8a%a4-llm","status":"publish","type":"post","link":"https:\/\/nori.company\/?p=23067","title":{"rendered":"MPT-7B, \uc0c1\uc5c5\uc801\uc73c\ub85c \uc774\uc6a9 \uac00\ub2a5\ud55c \uc624\ud508\uc18c\uc2a4 LLM"},"content":{"rendered":"<ul>\n<li>1\uc870\uac1c\uc758 \ud1a0\ud070\uc73c\ub85c \ud559\uc2b5\ub41c \ud2b8\ub79c\uc2a4\ud3ec\uba38<\/li>\n<li>LLaMA-7B\uc640 \ube44\uc2b7\ud55c \ud488\uc9c8\uc774\uc9c0\ub9cc \uc624\ud508\uc18c\uc2a4, \uc0c1\uc5c5\uc801 \uc774\uc6a9 \uac00\ub2a5<\/li>\n<li>\ucd94\uac00\ub85c 3\uac1c\uc758 \ud30c\uc778\ud29c\ub2dd \ubaa8\ub378\ub3c4 \uacf5\uac1c\n<ul>\n<li>MPT-7B-Instruct, MPT-7B-Chat, MPT-7B-StoryWriter-65K+(65K \ud1a0\ud070 \uc9c0\uc6d0)<\/li>\n<\/ul>\n<\/li>\n<li>MosaicML \ud50c\ub7ab\ud3fc\uc5d0\uc11c 9.5\uc77c\uac04 \uc57d ~$200K \ube44\uc6a9\uc73c\ub85c&#8230;\n<p>\ucd9c\ucc98 : <a href=\"https:\/\/news.hada.io\/topic?id=9132\" target=\"_blank\" rel=\"noopener\">GeekNews &#8211; \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4 <\/a><\/li>\n<\/ul>\n","protected":false},"excerpt":{"rendered":"<p>1\uc870\uac1c\uc758 \ud1a0\ud070\uc73c\ub85c \ud559\uc2b5\ub41c \ud2b8\ub79c\uc2a4\ud3ec\uba38 LLaMA-7B\uc640 \ube44\uc2b7\ud55c \ud488\uc9c8\uc774\uc9c0\ub9cc \uc624\ud508\uc18c\uc2a4, \uc0c1\uc5c5\uc801 \uc774\uc6a9 \uac00\ub2a5 \ucd94\uac00\ub85c 3\uac1c\uc758 \ud30c\uc778\ud29c\ub2dd \ubaa8\ub378\ub3c4 \uacf5\uac1c MPT-7B-Instruct, MPT-7B-Chat, MPT-7B-StoryWriter-65K+(65K \ud1a0\ud070&hellip;<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"jetpack_post_was_ever_published":false,"_jetpack_newsletter_access":"","_jetpack_dont_email_post_to_subs":false,"_jetpack_newsletter_tier_id":0,"_jetpack_memberships_contains_paywalled_content":false,"_jetpack_memberships_contains_paid_content":false,"footnotes":"","jetpack_publicize_message":"","jetpack_publicize_feature_enabled":true,"jetpack_social_post_already_shared":true,"jetpack_social_options":{"image_generator_settings":{"template":"highway","default_image_id":0,"font":"","enabled":false},"version":2}},"categories":[138],"tags":[163],"class_list":["post-23067","post","type-post","status-publish","format-standard","hentry","category-it","tag-geeknews-----"],"jetpack_publicize_connections":[],"jetpack_featured_media_url":"","jetpack_sharing_enabled":true,"jetpack_shortlink":"https:\/\/wp.me\/pa3PO4-603","jetpack-related-posts":[{"id":25173,"url":"https:\/\/nori.company\/?p=25173","url_meta":{"origin":23067,"position":0},"title":"MosaicML, MPT-7B-8K \ubaa8\ub378 \uacf5\uac1c","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 7\uc6d4 21\uc77c","format":false,"excerpt":"8k \ucee8\ud14d\uc2a4\ud2b8 \uae38\uc774\ub97c \uc9c0\uc6d0\ud558\ub294 7B \ud30c\ub77c\ubbf8\ud130 \uc624\ud508\uc18c\uc2a4 LLM MPT-7B\uc5d0 \ucd94\uac00\ub85c 500B \ud1a0\ud070 \ub370\uc774\ud130\ub97c \uc774\uc6a9\ud574 256\uac1c\uc758 NVidia H100 \uc73c\ub85c 3\uc77c\uac04 \ud2b8\ub808\uc774\ub2dd 3\uac1c\uc758 \ubaa8\ub378\uc744 \uacf5\uac1c : MPT-7B-8k, MPT-7B-8k-Instruct, MPT-7B-8k-Chat \uc0c1\uc5c5\uc801 \uc6a9\ub3c4\ub85c \uc0ac\uc6a9 \uac00\ub2a5 ALiBi(Attention with Linear... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":24539,"url":"https:\/\/nori.company\/?p=24539","url_meta":{"origin":23067,"position":1},"title":"XGen-7B &#8211; 1.5T \ud1a0\ud070\uc5d0 \ub300\ud574 \ucd5c\ub300 8K \uc2dc\ud000\uc2a4 \uae38\uc774\ub85c \ud6c8\ub828\ud55c 7B LLM","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 7\uc6d4 1\uc77c","format":false,"excerpt":"LLM\uc774 \ub9ce\uc774 \uc0ac\uc6a9\ub418\uba74\uc11c \uae34 \uc2dc\ud000\uc2a4\uc5d0 \ub300\ud574\uc11c \uc801\uc6a9\ud558\ub294 \uac83\uc774 \uc911\uc694\ud574\uc9d0: \ubb38\uc11c \uc694\uc57d, \ucf54\ub4dc \uc791\uc131, \ub2e8\ubc31\uc9c8 \uc11c\uc5f4 \uc608\uce21\ub4f1 \ud558\uc9c0\ub9cc \ub300\ubd80\ubd84\uc758 \uc624\ud508\uc18c\uc2a4 LLM(LLaMA, MPT, Falcon) \ub4f1\uc740 \ucd5c\ub300 2K \ud1a0\ud070 \uc2dc\ud000\uc2a4 \uae38\uc774\ub85c \ud6c8\ub828\ub428 XGen-7B \ub294 \ucd5c\ub300 8K \uc2dc\ud000\uc2a4 \uae38\uc774 \uae4c\uc9c0\ub85c 1.5T \ucf54\ud070\uc5d0 \ub300\ud574 \ud6c8\ub828 \ud45c\uc900 NL... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":24580,"url":"https:\/\/nori.company\/?p=24580","url_meta":{"origin":23067,"position":2},"title":"OpenFlamingo V2 \ub9b4\ub9ac\uc988","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 7\uc6d4 3\uc77c","format":false,"excerpt":"DeepMind\uc758 Flamingo \ubaa8\ub378\uc744 \uc624\ud508\uc18c\uc2a4\ub85c \uad6c\ud604\ud55c \uac83 3B, 4B, 9B \ubaa8\ub378\uc744 \uacf5\uac1c MPT-1B\/7B \uc640 RedPajama-3B \uae30\ubc18 \uac19\uc740 Flamingo \ubaa8\ub378 \uc131\ub2a5\uc758 80% \uc774\uc0c1\uc744 \ub2ec\uc131 \ud6c8\ub828\ubc0f \ud3c9\uac00\ucf54\ub4dc\ub97c \uac1c\uc120 Fully Sharded Data Parallel (FSDP) \uc9c0\uc6d0 \uc0c8\ub85c\uc6b4 \ub370\uc774\ud130\uc14b... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":24437,"url":"https:\/\/nori.company\/?p=24437","url_meta":{"origin":23067,"position":3},"title":"DeepSpeed ZeRO : \ud1b5\uc2e0\ub7c9\uc744 4\ubc30 \uc904\uc774\uba74\uc11c LLM\uacfc \ucc44\ud305 \ubaa8\ub378 \ud2b8\ub808\uc774\ub2dd \uc18d\ub3c4\uc758 \ud68d\uae30\uc801\uc778 \ud5a5\uc0c1","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 6\uc6d4 28\uc77c","format":false,"excerpt":"LLM\uc740 \uaf64 \ub9ce\uc740 \uc591\uc758 \uba54\ubaa8\ub9ac\uc640 \ucef4\ud4e8\ud305 \ub9ac\uc18c\uc2a4\ub97c \ud544\uc694\ub85c \ud568 DeppSpeed\uc758 ZeRO \ud328\ubc00\ub9ac\ub294 \uc774\ub7f0 \ubb38\uc81c\uc5d0 \ub300\ud55c \ud574\uacb0\ucc45\uc744 \uc81c\uacf5\ud558\uc5ec TNLG-17B, Bloom-176B, MPT-7B, Jurrasic-1 \ub4f1\uc5d0\uc11c \uc0ac\uc6a9\ub428 \ud558\uc9c0\ub9cc \uc218\ub9ce\uc740 GPU\ub4e4\uc774 \uc0ac\uc6a9\ub418\ub294 \ub300\uaddc\ubaa8 \uc2dc\ub098\ub9ac\uc624\uc5d0\uc11c\ub294 GPU\uac04 \uc7a6\uc740 \ud1b5\uc2e0\uc774 \ud544\uc694\ud558\ub294 \ub4f1 \uc624\ubc84\ud5e4\ub4dc\uac00 \ubc1c\uc0dd... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":25135,"url":"https:\/\/nori.company\/?p=25135","url_meta":{"origin":23067,"position":4},"title":"FlashAttention-2: \ub354 \ub098\uc740 \ubcd1\ub82c\ucc98\ub9ac\uc640 \uc791\uc5c5 \ubd84\ud560\ub85c \ub354 \ube68\ub77c\uc9c4 Attention","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 7\uc6d4 20\uc77c","format":false,"excerpt":"GPT-4(32k), MPT(65k), Calude(100k) \ub4f1 \ub354 \uae34 \ucee8\ud14d\uc2a4\ud2b8\ub97c \uac00\uc9c4 \uc5b8\uc5b4\ubaa8\ub378\uc774 \ucd9c\ud604 \ud2b8\ub79c\uc2a4\ud3ec\uba38\uc758 \ucee8\ud14d\uc2a4\ud2b8 \uae38\uc774\ub97c \ud655\uc7a5\ud558\ub294 \uac83\uc740 \ub7f0\ud0c0\uc784&\uba54\ubaa8\ub9ac \uc694\uad6c\uc0ac\ud56d\uc774 4\uc81c\uacf1\uc73c\ub85c \uc99d\uac00\ud558\uae30 \ub54c\ubb38\uc5d0 \uc5b4\ub824\uc6c0 \uc791\ub144\uc5d0 \ucd9c\uc2dc\ud55c FlashAttention\uc740 \uba54\ubaa8\ub9ac \uc0ac\uc6a9\ub7c9\uc744 \uc904\uc774\uace0 \uc5b4\ud150\uc158 \uc18d\ub3c4\ub97c \uc99d\uac00\uc2dc\ucf1c\uc11c \ub2e4\uc591\ud55c \uacf3\uc5d0... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":26701,"url":"https:\/\/nori.company\/?p=26701","url_meta":{"origin":23067,"position":5},"title":"KHOj &#8211; \ub2f9\uc2e0\uc758 \ub514\uc9c0\ud138 \ub1cc\ub97c \uc704\ud55c AI \uac1c\uc778 \ube44\uc11c","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 8\uc6d4 26\uc77c","format":false,"excerpt":"\uc790\uc2e0\uc758 \ub178\ud2b8\/\ubb38\uc11c\/\uc774\ubbf8\uc9c0 \uae30\ubc18\uc73c\ub85c \uac80\uc0c9 \ubc0f \ucc44\ud305 \uac00\ub2a5\ud55c \ub370\uc2a4\ud06c\ud0d1 \uc5b4\ud50c\ub9ac\ucf00\uc774\uc158 Emacs\/Obsidian\/\uc6f9\ube0c\ub77c\uc6b0\uc800\uc5d0\uc11c \ud65c\uc6a9 \uac00\ub2a5\ud55c \uc624\ud504\ub77c\uc778\uc5d0\uc11c \ub3d9\uc791\ud558\ub294 \uc624\ud508\uc18c\uc2a4 AI \ube44\uc11c LLama-7B \ub97c \uc774\uc6a9 ... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]}],"_links":{"self":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/23067","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=23067"}],"version-history":[{"count":1,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/23067\/revisions"}],"predecessor-version":[{"id":23068,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/23067\/revisions\/23068"}],"wp:attachment":[{"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=23067"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=23067"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=23067"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}