{"id":4485,"date":"2023-11-21T17:30:03","date_gmt":"2023-11-21T09:30:03","guid":{"rendered":"http:\/\/www.sniper97.cn\/?p=4485"},"modified":"2023-11-21T17:30:28","modified_gmt":"2023-11-21T09:30:28","slug":"%e3%80%90%e8%ae%ba%e6%96%87%e3%80%91continual-pre-training-of-large-language-models-how-to-rewarm-up-your-model","status":"publish","type":"post","link":"http:\/\/www.sniper97.cn\/index.php\/note\/deep-learning\/paper-deep-learning\/4485\/","title":{"rendered":"\u3010\u8bba\u6587\u3011Continual Pre-Training of Large Language Models: How to (re)warm-up your model?"},"content":{"rendered":"\n<p>\u62ff\u5927\u8499\u7279\u5229\u5c14\u7684\u4e24\u6240\u5927\u5b66\u7684\u5de5\u4f5c\uff0c\u4e3b\u8981\u662f\u9a8c\u8bc1\u7ee7\u7eed\u9884\u8bad\u7ec3\u4e2d\uff0c\u5982\u4f55warmup\u4f60\u7684\u6a21\u578b\u3002<\/p>\n\n\n\n<p>\u5199\u5728notion\u4e0a\u4e86\uff0c\u61d2\u5f97\u642c\u8fd0\u3002\u94fe\u63a5\u5982\u4e0b\uff08\u53ef\u80fd\u9700\u8981\u7ffb\u5899\uff09<\/p>\n\n\n\n<p><a href=\"https:\/\/daffodil-square-501.notion.site\/Continual-Pre-Training-of-Large-Language-Models-How-to-re-warm-up-your-model-69877d14c7884c3a903205da90b0695a?pvs=4\" target=\"_blank\" rel=\"noreferrer noopener\">https:\/\/daffodil-square-501.notion.site\/Continual-Pre-Training-of-Large-Language-Models-How-to-re-warm-up-your-model-69877d14c7884c3a903205da90b0695a?pvs=4<\/a><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u62ff\u5927\u8499\u7279\u5229\u5c14\u7684\u4e24\u6240\u5927\u5b66\u7684\u5de5\u4f5c\uff0c\u4e3b\u8981\u662f\u9a8c\u8bc1\u7ee7\u7eed\u9884\u8bad\u7ec3\u4e2d\uff0c\u5982\u4f55warmup\u4f60\u7684\u6a21\u578b\u3002 \u5199\u5728notion\u4e0a [&hellip;]<\/p>\n","protected":false},"author":2,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"om_disable_all_campaigns":false,"_mi_skip_tracking":false,"_monsterinsights_sitenote_active":false,"_monsterinsights_sitenote_note":"","_monsterinsights_sitenote_category":0,"footnotes":""},"categories":[16],"tags":[],"views":5709,"_links":{"self":[{"href":"http:\/\/www.sniper97.cn\/index.php\/wp-json\/wp\/v2\/posts\/4485"}],"collection":[{"href":"http:\/\/www.sniper97.cn\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"http:\/\/www.sniper97.cn\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"http:\/\/www.sniper97.cn\/index.php\/wp-json\/wp\/v2\/users\/2"}],"replies":[{"embeddable":true,"href":"http:\/\/www.sniper97.cn\/index.php\/wp-json\/wp\/v2\/comments?post=4485"}],"version-history":[{"count":2,"href":"http:\/\/www.sniper97.cn\/index.php\/wp-json\/wp\/v2\/posts\/4485\/revisions"}],"predecessor-version":[{"id":4488,"href":"http:\/\/www.sniper97.cn\/index.php\/wp-json\/wp\/v2\/posts\/4485\/revisions\/4488"}],"wp:attachment":[{"href":"http:\/\/www.sniper97.cn\/index.php\/wp-json\/wp\/v2\/media?parent=4485"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"http:\/\/www.sniper97.cn\/index.php\/wp-json\/wp\/v2\/categories?post=4485"},{"taxonomy":"post_tag","embeddable":true,"href":"http:\/\/www.sniper97.cn\/index.php\/wp-json\/wp\/v2\/tags?post=4485"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}