{"id":2494,"date":"2024-03-11T23:55:02","date_gmt":"2024-03-11T15:55:02","guid":{"rendered":"https:\/\/www.aqwu.net\/wp\/?p=2494"},"modified":"2024-04-28T20:02:15","modified_gmt":"2024-04-28T12:02:15","slug":"%e4%ba%86%e8%a7%a3-llama-2-%e6%a8%a1%e5%9e%8b%e7%bb%93%e6%9e%847","status":"publish","type":"post","link":"https:\/\/www.aqwu.net\/wp\/?p=2494","title":{"rendered":"\u4e86\u89e3 LLaMA-2 \u6a21\u578b\u7ed3\u6784(7)"},"content":{"rendered":"\n<h2 class=\"wp-block-heading\"><strong>12. \u6a21\u578b\u6587\u4ef6\u7684\u914d\u7f6e\u4fe1\u606f<\/strong><\/h2>\n\n\n\n<p>\u6839\u636e\u524d\u9762\u4fdd\u5b58\u7684\u6a21\u578b\u6587\u4ef6 output\/model.bin \u7684\u5185\u5bb9\uff0c\u53ef\u4ee5\u77e5\u9053\uff0c\u6a21\u578b\u914d\u7f6e\u4fe1\u606f\u7684\u8d77\u59cb\u4f4d\u7f6e\u662f0\uff0c\u5927\u5c0f\u662f28\u4e2a\u5b57\u8282\uff0c\u4e0b\u9762\u6765\u5206\u6790\u6a21\u578b\u914d\u7f6e\u7684\u8be6\u7ec6\u4fe1\u606f<\/p>\n\n\n\n<p>\u547d\u540d\u4e3a test03.c\uff0c\u6587\u4ef6\u4fdd\u5b58\u5230 newsrc \u76ee\u5f55\u4e0b\uff1a<\/p>\n\n\n\n<div class=\"wp-block-urvanov-syntax-highlighter-code-block\"><pre class=\"lang:c decode:true \">#include &lt;stdio.h&gt;\n#include &lt;stdlib.h&gt;\n#include &lt;ctype.h&gt;\n#include &lt;time.h&gt;\n#include &lt;math.h&gt;\n#include &lt;string.h&gt;\n#include &lt;fcntl.h&gt;\n#include &lt;unistd.h&gt;\n#include &lt;sys\/mman.h&gt;\n\n\/\/ \u7528\u4e8e\u5b58\u50a8\u548c\u4f20\u9012 Transformer \u6a21\u578b\u7684\u8d85\u53c2\u6570\uff0c\u5373\u6784\u5efa\u6a21\u578b\u6240\u9700\u7684\u5404\u79cd\u53c2\u6570\u3002\n\/\/ \u5728\u5b9e\u9645\u5e94\u7528\u4e2d\uff0c\u8fd9\u4e2a\u7ed3\u6784\u4f53\u7684\u5b9e\u4f8b\u901a\u5e38\u4f1a\u4f5c\u4e3a\u53c2\u6570\u4f20\u9012\u7ed9\u6a21\u578b\u7684\u6784\u9020\u51fd\u6570\uff0c\u4ee5\u521d\u59cb\u5316\u6a21\u578b\u7684\u7ed3\u6784\u3002\ntypedef struct {\n    \/\/ \u4ee3\u8868 Transformer \u6a21\u578b\u7684\u7ef4\u5ea6\u3002\u5728\u81ea\u7136\u8bed\u8a00\u5904\u7406\u4e2d\uff0c\u8fd9\u4e2a\u7ef4\u5ea6\u901a\u5e38\u662f\u5d4c\u5165\uff08embedding\uff09\u5c42\u548c\u6240\u6709 Transformer \u5c42\u7684\u8f93\u51fa\u7ef4\u5ea6\u3002\n    int dim; \/\/ transformer dimension\n    \/\/ \u4ee3\u8868\u524d\u9988\u795e\u7ecf\u7f51\u7edc\u5c42\uff08Feed Forward Neural Network Layer\uff0c\u5373 Transformer \u6a21\u578b\u4e2d\u7684\u5168\u8fde\u63a5\u5c42\uff09\u7684\u9690\u85cf\u5c42\u7ef4\u5ea6\u3002\n    int hidden_dim; \/\/ for ffn layers\n    \/\/ \u8868\u793a\u6a21\u578b\u4e2d\u7684\u5c42\u6570\u91cf\u3002\u5728\u4e00\u4e2a\u6807\u51c6\u7684 Transformer \u6a21\u578b\u4e2d\uff0c\u4e00\u4e2a\u5c42\u5305\u542b\u4e00\u4e2a\u591a\u5934\u81ea\u6ce8\u610f\u529b\u673a\u5236\uff08Multi-head Self Attention Mechanism\uff09\u548c\u4e00\u4e2a\u524d\u9988\u795e\u7ecf\u7f51\u7edc\u5c42\u3002\n    int n_layers; \/\/ number of layers\n    \/\/ \u8868\u793a\u591a\u5934\u6ce8\u610f\u529b\u673a\u5236\u4e2d\u67e5\u8be2\u5934\u7684\u6570\u91cf\u3002\u591a\u5934\u6ce8\u610f\u529b\u5141\u8bb8\u6a21\u578b\u540c\u65f6\u5173\u6ce8\u8f93\u5165\u5e8f\u5217\u4e2d\u7684\u591a\u4e2a\u4f4d\u7f6e\n    int n_heads; \/\/ number of query heads\n    \/\/ \u8868\u793a\u952e\/\u503c\u5bf9\u7684\u5934\u7684\u6570\u91cf\u3002\u8fd9\u53ef\u4ee5\u5c0f\u4e8e\u67e5\u8be2\u5934\u7684\u6570\u91cf\uff0c\u56e0\u4e3a\u6709\u4e00\u4e9b\u6a21\u578b\u53ef\u80fd\u4f7f\u7528\u591a\u67e5\u8be2\u529f\u80fd\u3002\n    int n_kv_heads; \/\/ number of key\/value heads (can be &lt; query heads because of multiquery)\n    \/\/ \u4ee3\u8868\u6a21\u578b\u7684\u8bcd\u6c47\u8868\u5927\u5c0f\u3002\u5bf9\u4e8e\u5b57\u8282\u7ea7\u7684\u6a21\u578b\uff0c\u8bcd\u6c47\u91cf\u901a\u5e38\u4e3a 256\uff0c\u56e0\u4e3a\u6709 256 \u4e2a\u53ef\u80fd\u7684\u5b57\u8282\u503c\u3002\n    int vocab_size; \/\/ vocabulary size, usually 256 (byte-level)\n    \/\/ \u8868\u793a\u6a21\u578b\u53ef\u4ee5\u5904\u7406\u7684\u6700\u5927\u5e8f\u5217\u957f\u5ea6\u3002\u5e8f\u5217\u957f\u5ea6\u662f\u8f93\u5165\u5230\u6a21\u578b\u4e2d\u7684 token\uff08\u5982\u5355\u8bcd\u6216\u5b57\u8282\uff09\u7684\u6570\u91cf\u3002\n    int seq_len; \/\/ max sequence length\n} Config;\n\nint main(int argc, char *argv[]) {\n    Config config;\n    char *checkpoint = \"..\/output\/model.bin\";\n    \n    FILE *file = fopen(checkpoint, \"rb\");\n    if (!file) { \n      fprintf(stderr, \"Couldn't open file %s\\n\", checkpoint); \n      exit(EXIT_FAILURE); \n    }\n\n    \/\/ \u8bfb\u53d6\u6587\u4ef6\u4e2d\u7684 Config \u7ed3\u6784\u4f53\u4fe1\u606f\u3002\n    if (fread(&amp;config, sizeof(Config), 1, file) != 1) { \n      fprintf(stderr, \"Couldn't read file %s\\n\", checkpoint); \n      exit(EXIT_FAILURE); \n    }\n    fclose(file);\n    \n    printf(\"sizeof(Config) = %ld\\n\", sizeof(Config));\n    printf(\"dim            = %d\\n\", config.dim);\n    printf(\"hidden_dim     = %d\\n\", config.hidden_dim);\n    printf(\"n_layers       = %d\\n\", config.n_layers);\n    printf(\"n_heads        = %d\\n\", config.n_heads);\n    printf(\"n_kv_heads     = %d\\n\", config.n_kv_heads);\n    printf(\"vocab_size     = %d\\n\", config.vocab_size);\n    printf(\"seq_len        = %d\\n\", config.seq_len);\n    \n    return 0;\n}<\/pre><\/div>\n\n\n\n<p>\u7f16\u8bd1 test03.c<\/p>\n\n\n\n<div class=\"wp-block-urvanov-syntax-highlighter-code-block\"><pre class=\"lang:sh decode:true \">make test03\ncc     test03.c   -o test03<\/pre><\/div>\n\n\n\n<p>\u8fd0\u884c test03<\/p>\n\n\n\n<div class=\"wp-block-urvanov-syntax-highlighter-code-block\"><pre class=\"lang:python decode:true \">.\/test03\nsizeof(Config) = 28\ndim            = 4096\nhidden_dim     = 11008\nn_layers       = 32\nn_heads        = 32\nn_kv_heads     = 32\nvocab_size     = -32000\nseq_len        = 4096<\/pre><\/div>\n\n\n\n<p><\/p>\n","protected":false},"excerpt":{"rendered":"<p>12. \u6a21\u578b\u6587\u4ef6\u7684\u914d\u7f6e\u4fe1\u606f \u6839\u636e\u524d\u9762\u4fdd\u5b58\u7684\u6a21\u578b\u6587\u4ef6 output\/model.bin \u7684\u5185\u5bb9\uff0c\u53ef\u4ee5\u77e5\u9053\uff0c\u6a21\u578b\u914d [&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"site-sidebar-layout":"default","site-content-layout":"","ast-site-content-layout":"default","site-content-style":"default","site-sidebar-style":"default","ast-global-header-display":"","ast-banner-title-visibility":"","ast-main-header-display":"","ast-hfb-above-header-display":"","ast-hfb-below-header-display":"","ast-hfb-mobile-header-display":"","site-post-title":"","ast-breadcrumbs-content":"","ast-featured-img":"","footer-sml-layout":"","theme-transparent-header-meta":"","adv-header-id-meta":"","stick-header-meta":"","header-above-stick-meta":"","header-main-stick-meta":"","header-below-stick-meta":"","astra-migrate-meta-layouts":"set","ast-page-background-enabled":"default","ast-page-background-meta":{"desktop":{"background-color":"var(--ast-global-color-4)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"tablet":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"mobile":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""}},"ast-content-background-meta":{"desktop":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"tablet":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"mobile":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""}},"_jetpack_memberships_contains_paid_content":false,"footnotes":""},"categories":[313,289,443,442,312],"tags":[242,314],"class_list":["post-2494","post","type-post","status-publish","format-standard","hentry","category-chatgpt","category-gpt","category-llm","category-llms","category-openai","tag-chatgpt","tag-openai-api"],"views":1008,"jetpack_sharing_enabled":true,"jetpack_featured_media_url":"","_links":{"self":[{"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/posts\/2494","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=2494"}],"version-history":[{"count":8,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/posts\/2494\/revisions"}],"predecessor-version":[{"id":2516,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/posts\/2494\/revisions\/2516"}],"wp:attachment":[{"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=2494"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=2494"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=2494"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}