"use strict";(self.webpackChunkelementary_public_docs=self.webpackChunkelementary_public_docs||[]).push([[62133],{15680:(e,t,a)=>{a.d(t,{xA:()=>p,yg:()=>m});var n=a(96540);function r(e,t,a){return t in e?Object.defineProperty(e,t,{value:a,enumerable:!0,configurable:!0,writable:!0}):e[t]=a,e}function l(e,t){var a=Object.keys(e);if(Object.getOwnPropertySymbols){var n=Object.getOwnPropertySymbols(e);t&&(n=n.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),a.push.apply(a,n)}return a}function o(e){for(var t=1;t=0||(r[a]=e[a]);return r}(e,t);if(Object.getOwnPropertySymbols){var l=Object.getOwnPropertySymbols(e);for(n=0;n=0||Object.prototype.propertyIsEnumerable.call(e,a)&&(r[a]=e[a])}return r}var i=n.createContext({}),u=function(e){var t=n.useContext(i),a=t;return e&&(a="function"==typeof e?e(t):o(o({},t),e)),a},p=function(e){var t=u(e.components);return n.createElement(i.Provider,{value:t},e.children)},s="mdxType",g={inlineCode:"code",wrapper:function(e){var t=e.children;return n.createElement(n.Fragment,{},t)}},y=n.forwardRef((function(e,t){var a=e.components,r=e.mdxType,l=e.originalType,i=e.parentName,p=c(e,["components","mdxType","originalType","parentName"]),s=u(a),y=r,m=s["".concat(i,".").concat(y)]||s[y]||g[y]||l;return a?n.createElement(m,o(o({ref:t},p),{},{components:a})):n.createElement(m,o({ref:t},p))}));function m(e,t){var a=arguments,r=t&&t.mdxType;if("string"==typeof e||r){var l=a.length,o=new Array(l);o[0]=y;var c={};for(var i in t)hasOwnProperty.call(t,i)&&(c[i]=t[i]);c.originalType=e,c[s]="string"==typeof e?e:r,o[1]=c;for(var u=2;u{a.r(t),a.d(t,{assets:()=>i,contentTitle:()=>o,default:()=>g,frontMatter:()=>l,metadata:()=>c,toc:()=>u});var n=a(58168),r=(a(96540),a(15680));const l={sidebar_position:2,product:"\u9ad8\u6027\u80fdAI\u7b97\u529b\u6c60(ACP)"},o="\u3010\u5feb\u901f\u5f00\u59cb\u3011\u5fae\u8c03Llama-3-8B-Instruct\u6a21\u578b\u6700\u4f73\u5b9e\u8df5",c={unversionedId:"cloud-foundation/compute/acp/acpBestPractices/Job-QuickStart-Llama3-8B",id:"cloud-foundation/compute/acp/acpBestPractices/Job-QuickStart-Llama3-8B",title:"\u3010\u5feb\u901f\u5f00\u59cb\u3011\u5fae\u8c03Llama-3-8B-Instruct\u6a21\u578b\u6700\u4f73\u5b9e\u8df5",description:"\u6a21\u578b\u4ecb\u7ecd",source:"@site/docs/cloud-foundation/compute/acp/acpBestPractices/Job-QuickStart-Llama3-8B.md",sourceDirName:"cloud-foundation/compute/acp/acpBestPractices",slug:"/cloud-foundation/compute/acp/acpBestPractices/Job-QuickStart-Llama3-8B",permalink:"/help/docs/cloud-foundation/compute/acp/acpBestPractices/Job-QuickStart-Llama3-8B",draft:!1,editUrl:"https://github.com/facebook/docusaurus/tree/main/packages/create-docusaurus/templates/shared/docs/cloud-foundation/compute/acp/acpBestPractices/Job-QuickStart-Llama3-8B.md",tags:[],version:"current",sidebarPosition:2,frontMatter:{sidebar_position:2,product:"\u9ad8\u6027\u80fdAI\u7b97\u529b\u6c60(ACP)"},sidebar:"tutorialSidebar",previous:{title:"\u63d0\u4ea4\u4e00\u4e2aPytorch DDP\u5206\u5e03\u5f0f\u4efb\u52a1",permalink:"/help/docs/cloud-foundation/compute/acp/acpBestPractices/Job-PyTorchDDP"},next:{title:"\u63d0\u4ea4\u4e00\u4e2aMPI\u5206\u5e03\u5f0f\u4efb\u52a1",permalink:"/help/docs/cloud-foundation/compute/acp/acpBestPractices/Job-MPI"}},i={},u=[{value:"\u6a21\u578b\u4ecb\u7ecd",id:"\u6a21\u578b\u4ecb\u7ecd",level:2},{value:"\u4f7f\u7528\u524d\u63d0",id:"\u4f7f\u7528\u524d\u63d0",level:2},{value:"\u901a\u8fc7\u63a7\u5236\u53f0\u5fae\u8c03\u6a21\u578b",id:"\u901a\u8fc7\u63a7\u5236\u53f0\u5fae\u8c03\u6a21\u578b",level:2}],p={toc:u},s="wrapper";function g(e){let{components:t,...l}=e;return(0,r.yg)(s,(0,n.A)({},p,l,{components:t,mdxType:"MDXLayout"}),(0,r.yg)("h1",{id:"\u5feb\u901f\u5f00\u59cb\u5fae\u8c03llama-3-8b-instruct\u6a21\u578b\u6700\u4f73\u5b9e\u8df5"},"\u3010\u5feb\u901f\u5f00\u59cb\u3011\u5fae\u8c03Llama-3-8B-Instruct\u6a21\u578b\u6700\u4f73\u5b9e\u8df5"),(0,r.yg)("h2",{id:"\u6a21\u578b\u4ecb\u7ecd"},"\u6a21\u578b\u4ecb\u7ecd"),(0,r.yg)("p",null,"Llama-3-8B-Instruct\u6a21\u578b\u7531Meta\u516c\u53f8\u5f00\u53d1\uff0c\u5c5e\u4e8eLlama\u7cfb\u5217\u6a21\u578b\u3002\u7531\u4e8e\u9488\u5bf9\u5bf9\u8bdd\u7528\u4f8b\u8fdb\u884c\u4e86\u4f18\u5316\uff0c\u6240\u4ee5\u8be5\u6a21\u578b\u5728\u591a\u4e2a\u884c\u4e1a\u57fa\u51c6\u6d4b\u8bd5\u4e2d\u8868\u73b0\u4f18\u4e8e\u8bb8\u591a\u73b0\u6709\u7684\u5f00\u6e90\u804a\u5929\u6a21\u578b\u3002Llama-3-8B-Instruct\u652f\u6301\u591a\u79cd\u8f93\u5165\u548c\u8f93\u51fa\uff0c\u5305\u62ec\u6587\u672c\u548c\u4ee3\u7801\u751f\u6210\uff0c\u5e76\u4e14\u91c7\u7528\u4e86\u4f18\u5316\u8fc7\u7684transformer\u67b6\u6784\u3002\u8be5\u6a21\u578b\u901a\u8fc7\u76d1\u7763\u5f0f\u5fae\u8c03\uff08SFT\uff09\u548c\u57fa\u4e8e\u4eba\u7c7b\u53cd\u9988\u7684\u5f3a\u5316\u5b66\u4e60\uff08RLHF\uff09\u8fdb\u884c\u4e86\u8c03\u4f18\u3002"),(0,r.yg)("h2",{id:"\u4f7f\u7528\u524d\u63d0"},"\u4f7f\u7528\u524d\u63d0"),(0,r.yg)("blockquote",null,(0,r.yg)("p",{parentName:"blockquote"},"\u524d\u7f6e\u52a8\u4f5c1\uff1a\u5728\u5f39\u6027\u8ba1\u7b97\u96c6\u7fa4\uff08AEC2\uff09\u521b\u5efa\u5de5\u4f5c\u7a7a\u95f4 --\x3e \u521b\u5efa\u8282\u70b9 --\x3e \u5c06\u8282\u70b9\u7ed1\u5b9a\u5230\u76ee\u6807\u96c6\u7fa4\u3002\u5982\u60a8\u5df2\u7ecf\u6709\u53ef\u7528\u96c6\u7fa4\u5219\u53ef\u4ee5\u5ffd\u89c6\u672c\u6b65\u9aa4\u3002\u524d\u7f6e\u52a8\u4f5c2\uff1a\u5728\u6587\u4ef6\u5b58\u50a8AFS\u521b\u5efa\u6587\u4ef6\u7cfb\u7edf")),(0,r.yg)("h2",{id:"\u901a\u8fc7\u63a7\u5236\u53f0\u5fae\u8c03\u6a21\u578b"},"\u901a\u8fc7\u63a7\u5236\u53f0\u5fae\u8c03\u6a21\u578b"),(0,r.yg)("ol",null,(0,r.yg)("li",{parentName:"ol"},(0,r.yg)("p",{parentName:"li"},"\u70b9\u51fb\u8fdb\u5165ACP\u9ad8\u6027\u80fd\u7b97\u529b\u6c60\u3002")),(0,r.yg)("li",{parentName:"ol"},(0,r.yg)("p",{parentName:"li"},"\u9009\u5b9a\u5de5\u4f5c\u7a7a\u95f4\u3002")),(0,r.yg)("li",{parentName:"ol"},(0,r.yg)("p",{parentName:"li"},"\u70b9\u51fb\u5de6\u4fa7\u680f\u5feb\u901f\u5f00\u59cb\u3002")),(0,r.yg)("li",{parentName:"ol"},(0,r.yg)("p",{parentName:"li"},"\u70b9\u51fbMeta-Llama-3-8B-Instruct\u6a21\u578b\u3002"))),(0,r.yg)("p",null,(0,r.yg)("img",{src:a(51049).A,width:"1948",height:"994"})),(0,r.yg)("ol",{start:5},(0,r.yg)("li",{parentName:"ol"},"\u5173\u952e\u914d\u7f6e")),(0,r.yg)("ul",null,(0,r.yg)("li",{parentName:"ul"},(0,r.yg)("p",{parentName:"li"},"\u57fa\u672c\u4fe1\u606f"),(0,r.yg)("ul",{parentName:"li"},(0,r.yg)("li",{parentName:"ul"},"\u586b\u5165\u663e\u793a\u540d\u79f0\uff0c\u5fae\u8c03\u65b9\u6cd5\u53ef\u4ee5\u91c7\u7528LoRA\u6216\u5168\u53c2\u5fae\u8c03\uff0cLora\u5fae\u8c03\u6240\u9700\u65f6\u95f4\u66f4\u77ed\uff0c\u5e76\u6839\u636e\u663e\u5361\u7c7b\u578b\u9700\u6c42\u9009\u62e9\u96c6\u7fa4\uff08\u60a8\u53ef\u7528\u7684\u96c6\u7fa4\u53ef\u80fd\u4e0e\u672c\u5b9e\u4f8b\u622a\u56fe\u4e0d\u540c\uff0c\u8bf7\u4ee5\u5b9e\u9645\u60c5\u51b5\u4e3a\u51c6\uff09\u3002")))),(0,r.yg)("p",null,(0,r.yg)("img",{src:a(26398).A,width:"1458",height:"790"})),(0,r.yg)("ul",null,(0,r.yg)("li",{parentName:"ul"},(0,r.yg)("p",{parentName:"li"},"\u8d44\u6e90\u914d\u7f6e"),(0,r.yg)("ul",{parentName:"li"},(0,r.yg)("li",{parentName:"ul"},"\u4f18\u5148\u7ea7\uff1a\u9009\u62e9\u4efb\u52a1\u4f18\u5148\u7ea7\uff08\u542b\u6700\u9ad8\u3001\u9ad8\u4f18\u548c\u666e\u901a\uff09\u3002"),(0,r.yg)("li",{parentName:"ul"},"\u5b9e\u4f8b\u914d\u7f6e\uff1a\u672c\u4f8b\u9009\u62e9\u5355\u526f\u672c\u6570\u5373\u53ef\uff08\u82e5\u6a21\u578b\u53c2\u6570\u91cf\u66f4\u5927\uff0c\u53ef\u4ee5\u8003\u8651\u901a\u8fc7\u591a\u673a\u591a\u5361\u8fdb\u884c\u8bad\u7ec3\uff0c\u5373\u526f\u672c\u6570\u9009\u62e9>1\uff09\u3002"),(0,r.yg)("li",{parentName:"ul"},"GPU\u7c7b\u578b\uff1a\u5bf9\u4e8e\u672c\u793a\u4f8b\u76848B\u6a21\u578b\uff0cLoRA\u5fae\u8c03\u5efa\u8bae\u4f7f\u7528\u5355\u5f2024GB\u4ee5\u4e0a\u663e\u5b58\u7684\u52a0\u901f\u5361\uff0c\u5168\u53c2\u5fae\u8c03\u5efa\u8bae1-4\u5f2080GB\u663e\u5b58\u52a0\u901f\u5361\u3002")))),(0,r.yg)("p",null,(0,r.yg)("img",{src:a(30221).A,width:"1467",height:"823"})),(0,r.yg)("ul",null,(0,r.yg)("li",{parentName:"ul"},(0,r.yg)("p",{parentName:"li"},"\u6570\u636e\u96c6\u914d\u7f6e"),(0,r.yg)("ul",{parentName:"li"},(0,r.yg)("li",{parentName:"ul"},'\u5e73\u53f0\u63d0\u4f9b\u4e86\u9ed8\u8ba4\u6570\u636e\u96c6\u4f9b\u8bad\u7ec3\uff0c\u65e0\u9700\u8fdb\u884c\u989d\u5916\u64cd\u4f5c\u83b7\u53d6\u6570\u636e\u96c6\uff1b\u53e6\u5916\uff0c\u60a8\u4e5f\u53ef\u4ee5\u81ea\u884c\u63d0\u4f9b\u8bad\u7ec3\u6570\u636e\u96c6\uff08\u76ee\u524d\u53ea\u652f\u6301\u901a\u8fc7http\u6216https\u65b9\u5f0f\u4e0a\u4f20\u81ea\u5b9a\u4e49\u6570\u636e\u96c6\uff09\uff1a\u8bad\u7ec3\u6570\u636e\u63a5\u53d7Json\u683c\u5f0f\u8f93\u5165\uff0c\u6bcf\u6761\u6570\u636e\u7531\u95ee\u9898\u3001\u7b54\u6848\u7ec4\u6210\uff0c\u5206\u522b\u7528"instruction"\u548c"output"\u5b57\u6bb5\u8868\u793a\uff0c\u6570\u636e\u96c6\u683c\u5f0f\u793a\u4f8b\u5982\u4e0b\uff1a ')),(0,r.yg)("pre",{parentName:"li"},(0,r.yg)("code",{parentName:"pre"},'[ { "instruction": "hi", "input": "", "output": "Hello! I am {{name}}, an AI assistant developed by {{author}}. How can I assist you today?" }, { "instruction": "\u4f60\u662f\u5546\u6c64\u79d1\u6280\u5f00\u53d1\u7684SenseChat\u5417\uff1f", "input": "", "output": "\u62b1\u6b49\uff0c\u6211\u4e0d\u662f \u5546\u6c64\u79d1\u6280 \u5f00\u53d1\u7684 SenseChat\uff0c\u6211\u662f {{author}} \u5f00\u53d1\u7684 {{name}}\uff0c\u65e8\u5728\u4e3a\u7528\u6237\u63d0\u4f9b\u667a\u80fd\u5316\u7684\u56de\u7b54\u548c\u5e2e\u52a9\u3002" } ]\n'))),(0,r.yg)("li",{parentName:"ul"},(0,r.yg)("p",{parentName:"li"},"\u8d85\u53c2\u6570\u914d\u7f6e"),(0,r.yg)("ul",{parentName:"li"},(0,r.yg)("li",{parentName:"ul"},"\u5e73\u53f0\u63d0\u4f9b\u9ed8\u8ba4\u6a21\u578b\u5fae\u8c03\u8d85\u53c2\u6570\uff0c\u60a8\u4e5f\u53ef\u4ee5\u6839\u636e\u9700\u8981\u81ea\u884c\u8c03\u6574\u3002")),(0,r.yg)("table",null,(0,r.yg)("tr",null,(0,r.yg)("th",null,"\u8d85\u53c2\u6570\u540d\u79f0"),(0,r.yg)("th",null,"\u89e3\u91ca"),(0,r.yg)("th",null,"\u9ed8\u8ba4\u503c")),(0,r.yg)("tr",null,(0,r.yg)("td",null,"\u8bad\u7ec3batch size"),(0,r.yg)("td",null,"\u8bad\u7ec3\u65f6\u6bcf\u5757GPU\u4e0a\u7684\u6279\u91cf\u5927\u5c0f"),(0,r.yg)("td",null,"1")),(0,r.yg)("tr",null,(0,r.yg)("td",null,"\u9a8c\u8bc1batch size"),(0,r.yg)("td",null,"\u9a8c\u8bc1\u65f6\u6bcf\u5757GPU\u4e0a\u7684\u6279\u91cf\u5927\u5c0f"),(0,r.yg)("td",null,"1")),(0,r.yg)("tr",null,(0,r.yg)("td",null,"max epochs"),(0,r.yg)("td",null,"\u6700\u5927\u7684\u8bad\u7ec3\u8fed\u4ee3\u6b21\u6570\uff0c\u503c\u8d8a\u5927\u8bad\u7ec3\u8d8a\u4e45"),(0,r.yg)("td",null,"3")),(0,r.yg)("tr",null,(0,r.yg)("td",null,"learning rate"),(0,r.yg)("td",null,"\u51b3\u5b9a\u4e86\u8bad\u7ec3\u795e\u7ecf\u7f51\u7edc\u65f6\u6743\u91cd\u53c2\u6570\u66f4\u65b0\u7684\u901f\u5ea6\uff08\u5efa\u8bae0.0001-0.00001\uff09"),(0,r.yg)("td",null,"0.0001")),(0,r.yg)("tr",null,(0,r.yg)("td",null,"max samples"),(0,r.yg)("td",null,"\u8fdb\u884c\u5fae\u8c03\u65f6\u7684\u8bad\u7ec3\u96c6\u6700\u5927\u6570\u636e\u603b\u91cf\uff08\u800cbatch size\u662f\u6bcf\u6b21\u8fed\u4ee3\u7684\u6570\u636e\u91cf\uff09"),(0,r.yg)("td",null,"1000"))))),(0,r.yg)("ul",null,(0,r.yg)("li",{parentName:"ul"},(0,r.yg)("p",{parentName:"li"},"\u8bad\u7ec3\u8f93\u51fa\u53caTensorBoard\u914d\u7f6e"),(0,r.yg)("ul",{parentName:"li"},(0,r.yg)("li",{parentName:"ul"},"\u8bad\u7ec3\u8f93\u51fa\u914d\u7f6e\uff1a\u5982\u60a8\u5df2\u7ecf\u6709\u5b58\u50a8\u5377\uff0c\u53ef\u4ee5\u76f4\u63a5\u9009\u62e9\u76ee\u6807\u5b58\u50a8\u5377\u3002\u6a21\u578b\u5b58\u50a8\u6302\u8f7d\u8def\u5f84\u9ed8\u8ba4\u4e3a/mnt/afs/model\u3002"),(0,r.yg)("li",{parentName:"ul"},'TensorBoard\u914d\u7f6e\uff1a\u91c7\u96c6TensorBoard\u53ef\u9009\uff0c\u82e5\u9009\u5b9a\u201c\u662f"\uff0c\u5219\u9700\u8981\u9009\u62e9\u76ee\u6807\u5b58\u50a8\u5377\uff0c\u9ed8\u8ba4\u6302\u8f7d\u8def\u5f84\u4e3a/mnt/afs/tensorlog\u3002'),(0,r.yg)("li",{parentName:"ul"},"\u82e5\u8fd8\u6ca1\u6709\u4efb\u4f55\u6587\u4ef6\u5b58\u50a8\u5377\uff0c\u8bf7\u5148\u524d\u5f80AFS\u6587\u4ef6\u5b58\u50a8\u521b\u5efa\uff0c\u5982\u679c\u4e0d\u6302\u8f7d\u6301\u4e45\u5b58\u50a8\uff0c\u8bad\u7ec3\u7ed3\u679c\u5c06\u4f1a\u4e22\u5931\u3002")))),(0,r.yg)("p",null,(0,r.yg)("img",{src:a(19473).A,width:"1584",height:"771"})),(0,r.yg)("ol",{start:6},(0,r.yg)("li",{parentName:"ol"},"\u70b9\u51fb\u5b8c\u6210\u521b\u5efa")),(0,r.yg)("ul",null,(0,r.yg)("li",{parentName:"ul"},"\u521b\u5efa\u5b8c\u6bd5\u540e\uff0c\u4efb\u52a1\u4f1a\u7ecf\u5386\u3010\u521d\u59cb\u5316\u3011-\u3010\u542f\u52a8\u4e2d\u3011\uff0c\u3010\u8fd0\u884c\u4e2d\u3011\u7b49\u72b6\u6001\uff0c\u5982\u72b6\u6001\u8f6c\u4e3a\u3010\u6210\u529f\u3011\uff0c\u8bf4\u660e\u8bad\u7ec3\u4efb\u52a1\u5df2\u5b8c\u6210\uff0c\u8bf7\u5230\u76ee\u6807\u6587\u4ef6\u5b58\u50a8\u7a7a\u95f4\u67e5\u770b\u5fae\u8c03\u5b8c\u6bd5\u7684\u6a21\u578b\uff1b\u82e5\u5931\u8d25\uff0c\u53ef\u4ee5\u901a\u8fc7\u201c\u590d\u5236\u201d\uff08\u4f4d\u4e8e\u4efb\u52a1\u5217\u8868\u6bcf\u4e2a\u4efb\u52a1\u7684\u53f3\u4fa7-\u64cd\u4f5c\uff09\uff0c\u91cd\u65b0\u5f00\u59cb\u6a21\u578b\u5fae\u8c03\u3002"),(0,r.yg)("li",{parentName:"ul"},"\u6ce8\u610f\uff0c\u5feb\u901f\u5f00\u59cb\u4e2d\u7684\u6a21\u578b\u6bcf\u6b21\u5fae\u8c03\u90fd\u662f\u57fa\u4e8e\u9884\u7f6e\u955c\u50cf\u4ece\u5934\u5f00\u59cb\uff0c\u6682\u4e0d\u652f\u6301\u57fa\u4e8e\u5df2\u6709\u6a21\u578b\u7684checkpoint\u8fdb\u884c\u7eed\u8bad\u7ec3\uff09\u3002")),(0,r.yg)("p",null,(0,r.yg)("img",{src:a(70405).A,width:"1280",height:"201"})))}g.isMDXComponent=!0},70405:(e,t,a)=>{a.d(t,{A:()=>n});const n=a.p+"assets/images/\u4efb\u52a1\u5217\u8868-98bc9f03adca74b7f5c2ac89efc91154.png"},26398:(e,t,a)=>{a.d(t,{A:()=>n});const n=a.p+"assets/images/\u57fa\u672c\u4fe1\u606f-aa9df01f97620c6bfe1df9487e03c6c5.png"},19473:(e,t,a)=>{a.d(t,{A:()=>n});const n=a.p+"assets/images/\u5b58\u50a8\u914d\u7f6e-faf6c76561984d91f7381e552fdddac8.png"},51049:(e,t,a)=>{a.d(t,{A:()=>n});const n=a.p+"assets/images/\u5feb\u901f\u5f00\u59cb\u4f4d\u7f6e\u6307\u5bfc-c7d7bae6aea3d8b677329301ea34a51b.png"},30221:(e,t,a)=>{a.d(t,{A:()=>n});const n=a.p+"assets/images/\u8d44\u6e90\u914d\u7f6e-1b12678f79912ce4a6f5e80504bc6848.png"}}]);