{"id":25173,"date":"2023-07-21T11:53:30","date_gmt":"2023-07-21T02:53:30","guid":{"rendered":"http:\/\/nori.company\/?p=25173"},"modified":"2023-07-21T11:53:30","modified_gmt":"2023-07-21T02:53:30","slug":"mosaicml-mpt-7b-8k-%eb%aa%a8%eb%8d%b8-%ea%b3%b5%ea%b0%9c","status":"publish","type":"post","link":"https:\/\/nori.company\/?p=25173","title":{"rendered":"MosaicML, MPT-7B-8K \ubaa8\ub378 \uacf5\uac1c"},"content":{"rendered":"<ul>\n<li>8k \ucee8\ud14d\uc2a4\ud2b8 \uae38\uc774\ub97c \uc9c0\uc6d0\ud558\ub294 7B \ud30c\ub77c\ubbf8\ud130 \uc624\ud508\uc18c\uc2a4 LLM<\/li>\n<li>MPT-7B\uc5d0 \ucd94\uac00\ub85c 500B \ud1a0\ud070 \ub370\uc774\ud130\ub97c \uc774\uc6a9\ud574 256\uac1c\uc758 NVidia H100 \uc73c\ub85c 3\uc77c\uac04 \ud2b8\ub808\uc774\ub2dd<\/li>\n<li>3\uac1c\uc758 \ubaa8\ub378\uc744 \uacf5\uac1c : MPT-7B-8k, MPT-7B-8k-Instruct, MPT-7B-8k-Chat<\/li>\n<li>\uc0c1\uc5c5\uc801 \uc6a9\ub3c4\ub85c \uc0ac\uc6a9 \uac00\ub2a5<\/li>\n<li>ALiBi(Attention with Linear&#8230;\n<p>\ucd9c\ucc98 : <a href=\"https:\/\/news.hada.io\/topic?id=9910\" target=\"_blank\" rel=\"noopener\">GeekNews &#8211; \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4 <\/a><\/li>\n<\/ul>\n","protected":false},"excerpt":{"rendered":"<p>8k \ucee8\ud14d\uc2a4\ud2b8 \uae38\uc774\ub97c \uc9c0\uc6d0\ud558\ub294 7B \ud30c\ub77c\ubbf8\ud130 \uc624\ud508\uc18c\uc2a4 LLM MPT-7B\uc5d0 \ucd94\uac00\ub85c 500B \ud1a0\ud070 \ub370\uc774\ud130\ub97c \uc774\uc6a9\ud574 256\uac1c\uc758 NVidia H100 \uc73c\ub85c 3\uc77c\uac04 \ud2b8\ub808\uc774\ub2dd&hellip;<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"jetpack_post_was_ever_published":false,"_jetpack_newsletter_access":"","_jetpack_dont_email_post_to_subs":false,"_jetpack_newsletter_tier_id":0,"_jetpack_memberships_contains_paywalled_content":false,"_jetpack_memberships_contains_paid_content":false,"footnotes":"","jetpack_publicize_message":"","jetpack_publicize_feature_enabled":true,"jetpack_social_post_already_shared":true,"jetpack_social_options":{"image_generator_settings":{"template":"highway","default_image_id":0,"font":"","enabled":false},"version":2}},"categories":[138],"tags":[163],"class_list":["post-25173","post","type-post","status-publish","format-standard","hentry","category-it","tag-geeknews-----"],"jetpack_publicize_connections":[],"jetpack_featured_media_url":"","jetpack_sharing_enabled":true,"jetpack_shortlink":"https:\/\/wp.me\/pa3PO4-6y1","jetpack-related-posts":[{"id":23067,"url":"https:\/\/nori.company\/?p=23067","url_meta":{"origin":25173,"position":0},"title":"MPT-7B, \uc0c1\uc5c5\uc801\uc73c\ub85c \uc774\uc6a9 \uac00\ub2a5\ud55c \uc624\ud508\uc18c\uc2a4 LLM","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 5\uc6d4 9\uc77c","format":false,"excerpt":"1\uc870\uac1c\uc758 \ud1a0\ud070\uc73c\ub85c \ud559\uc2b5\ub41c \ud2b8\ub79c\uc2a4\ud3ec\uba38 LLaMA-7B\uc640 \ube44\uc2b7\ud55c \ud488\uc9c8\uc774\uc9c0\ub9cc \uc624\ud508\uc18c\uc2a4, \uc0c1\uc5c5\uc801 \uc774\uc6a9 \uac00\ub2a5 \ucd94\uac00\ub85c 3\uac1c\uc758 \ud30c\uc778\ud29c\ub2dd \ubaa8\ub378\ub3c4 \uacf5\uac1c MPT-7B-Instruct, MPT-7B-Chat, MPT-7B-StoryWriter-65K+(65K \ud1a0\ud070 \uc9c0\uc6d0) MosaicML \ud50c\ub7ab\ud3fc\uc5d0\uc11c 9.5\uc77c\uac04 \uc57d ~$200K \ube44\uc6a9\uc73c\ub85c... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":24580,"url":"https:\/\/nori.company\/?p=24580","url_meta":{"origin":25173,"position":1},"title":"OpenFlamingo V2 \ub9b4\ub9ac\uc988","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 7\uc6d4 3\uc77c","format":false,"excerpt":"DeepMind\uc758 Flamingo \ubaa8\ub378\uc744 \uc624\ud508\uc18c\uc2a4\ub85c \uad6c\ud604\ud55c \uac83 3B, 4B, 9B \ubaa8\ub378\uc744 \uacf5\uac1c MPT-1B\/7B \uc640 RedPajama-3B \uae30\ubc18 \uac19\uc740 Flamingo \ubaa8\ub378 \uc131\ub2a5\uc758 80% \uc774\uc0c1\uc744 \ub2ec\uc131 \ud6c8\ub828\ubc0f \ud3c9\uac00\ucf54\ub4dc\ub97c \uac1c\uc120 Fully Sharded Data Parallel (FSDP) \uc9c0\uc6d0 \uc0c8\ub85c\uc6b4 \ub370\uc774\ud130\uc14b... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":24539,"url":"https:\/\/nori.company\/?p=24539","url_meta":{"origin":25173,"position":2},"title":"XGen-7B &#8211; 1.5T \ud1a0\ud070\uc5d0 \ub300\ud574 \ucd5c\ub300 8K \uc2dc\ud000\uc2a4 \uae38\uc774\ub85c \ud6c8\ub828\ud55c 7B LLM","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 7\uc6d4 1\uc77c","format":false,"excerpt":"LLM\uc774 \ub9ce\uc774 \uc0ac\uc6a9\ub418\uba74\uc11c \uae34 \uc2dc\ud000\uc2a4\uc5d0 \ub300\ud574\uc11c \uc801\uc6a9\ud558\ub294 \uac83\uc774 \uc911\uc694\ud574\uc9d0: \ubb38\uc11c \uc694\uc57d, \ucf54\ub4dc \uc791\uc131, \ub2e8\ubc31\uc9c8 \uc11c\uc5f4 \uc608\uce21\ub4f1 \ud558\uc9c0\ub9cc \ub300\ubd80\ubd84\uc758 \uc624\ud508\uc18c\uc2a4 LLM(LLaMA, MPT, Falcon) \ub4f1\uc740 \ucd5c\ub300 2K \ud1a0\ud070 \uc2dc\ud000\uc2a4 \uae38\uc774\ub85c \ud6c8\ub828\ub428 XGen-7B \ub294 \ucd5c\ub300 8K \uc2dc\ud000\uc2a4 \uae38\uc774 \uae4c\uc9c0\ub85c 1.5T \ucf54\ud070\uc5d0 \ub300\ud574 \ud6c8\ub828 \ud45c\uc900 NL... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":24437,"url":"https:\/\/nori.company\/?p=24437","url_meta":{"origin":25173,"position":3},"title":"DeepSpeed ZeRO : \ud1b5\uc2e0\ub7c9\uc744 4\ubc30 \uc904\uc774\uba74\uc11c LLM\uacfc \ucc44\ud305 \ubaa8\ub378 \ud2b8\ub808\uc774\ub2dd \uc18d\ub3c4\uc758 \ud68d\uae30\uc801\uc778 \ud5a5\uc0c1","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 6\uc6d4 28\uc77c","format":false,"excerpt":"LLM\uc740 \uaf64 \ub9ce\uc740 \uc591\uc758 \uba54\ubaa8\ub9ac\uc640 \ucef4\ud4e8\ud305 \ub9ac\uc18c\uc2a4\ub97c \ud544\uc694\ub85c \ud568 DeppSpeed\uc758 ZeRO \ud328\ubc00\ub9ac\ub294 \uc774\ub7f0 \ubb38\uc81c\uc5d0 \ub300\ud55c \ud574\uacb0\ucc45\uc744 \uc81c\uacf5\ud558\uc5ec TNLG-17B, Bloom-176B, MPT-7B, Jurrasic-1 \ub4f1\uc5d0\uc11c \uc0ac\uc6a9\ub428 \ud558\uc9c0\ub9cc \uc218\ub9ce\uc740 GPU\ub4e4\uc774 \uc0ac\uc6a9\ub418\ub294 \ub300\uaddc\ubaa8 \uc2dc\ub098\ub9ac\uc624\uc5d0\uc11c\ub294 GPU\uac04 \uc7a6\uc740 \ud1b5\uc2e0\uc774 \ud544\uc694\ud558\ub294 \ub4f1 \uc624\ubc84\ud5e4\ub4dc\uac00 \ubc1c\uc0dd... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":23825,"url":"https:\/\/nori.company\/?p=23825","url_meta":{"origin":25173,"position":4},"title":"RedPajama, HEML \ubca4\uce58\ub9c8\ud06c\uc5d0\uc11c \uacf5\uac1c\ub41c \ub2e4\ub978 7B LLM \ubaa8\ub378\ubcf4\ub2e4 \ub6f0\uc5b4\ub09c \uc131\ub2a5\uc744 \uac16\ub294 7B \ubaa8\ub378 \uacf5\uac1c","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 6\uc6d4 7\uc77c","format":false,"excerpt":"RedPajama-INCITE-7B \ubaa8\ub378 3\uc885 \uc18c\uac1c HELM \ubca4\uce58\ub9c8\ud06c \uae30\uc900, \uae30\uc874 \uacf5\uac1c\ub41c 7B \ubaa8\ub378\ub4e4\ubcf4\ub2e4 \ub6f0\uc5b4\ub09c RedPajama-INCITE-7B-Instruct \ubaa8\ub378\uc744 \ud3ec\ud568\ud558\uc5ec 7B\uc9dc\ub9ac 3\uc885 \ubaa8\ub378\uc744 \uacf5\uac1c RedPajama-INCITE-7B-Instruct \ubaa8\ub378 \uae30\uc874 \ubaa8\ub378\uc758 Instruct \ud29c\ub2dd \ubc84\uc804 P3 (Bi \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]},{"id":24231,"url":"https:\/\/nori.company\/?p=24231","url_meta":{"origin":25173,"position":5},"title":"OpenLLaMA 13B \uacf5\uac1c","author":"\ub178\ub9ac\ucef4\ud37c\ub2c8","date":"2023\ub144 6\uc6d4 20\uc77c","format":false,"excerpt":"\ub2e4\ub978 \uc6a9\ub3c4\uc758 \uc774\uc6a9\uc774 \uac00\ub2a5\ud558\ub3c4\ub85d \uc544\ud30c\uce58 \ub77c\uc774\uc13c\uc2a4\ub85c \ub9cc\ub4e4\uc5b4\uc9c4 LLaMA\uc758 \uc624\ud508\uc18c\uc2a4 \ubcf5\uc81c\ubcf8 1T \ud1a0\ud070\uc73c\ub85c \ud6c8\ub828\ud55c 3B, 7B, 13B \ubaa8\ub378\uc744 \uacf5\uac1c \uc0ac\uc804\ud6c8\ub828\ub41c \ubaa8\ub378\uc758 Weights\ub3c4 \uacf5\uac1c (EasyLM & PyTorch \ud3ec\ub9f7) ... \ucd9c\ucc98 : GeekNews - \uac1c\ubc1c\/\uae30\uc220\/\uc2a4\ud0c0\ud2b8\uc5c5 \ub274\uc2a4 \uc11c\ube44\uc2a4","rel":"","context":"&quot;IT&quot;\uc5d0\uc11c","block_context":{"text":"IT","link":"https:\/\/nori.company\/?cat=138"},"img":{"alt_text":"","src":"","width":0,"height":0},"classes":[]}],"_links":{"self":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/25173","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=25173"}],"version-history":[{"count":1,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/25173\/revisions"}],"predecessor-version":[{"id":25174,"href":"https:\/\/nori.company\/index.php?rest_route=\/wp\/v2\/posts\/25173\/revisions\/25174"}],"wp:attachment":[{"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=25173"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=25173"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/nori.company\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=25173"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}