{"id":4776,"date":"2024-09-19T22:49:22","date_gmt":"2024-09-19T14:49:22","guid":{"rendered":"https:\/\/www.aqwu.net\/wp\/?p=4776"},"modified":"2024-09-19T22:50:17","modified_gmt":"2024-09-19T14:50:17","slug":"%e8%9e%8d%e5%90%88%e6%a8%a1%e5%9e%8b-llama-3-1-8b-fusion-9010","status":"publish","type":"post","link":"https:\/\/www.aqwu.net\/wp\/?p=4776","title":{"rendered":"\u878d\u5408\u6a21\u578b Llama-3.1-8B-Fusion-9010"},"content":{"rendered":"\n<h2 class=\"wp-block-heading\">\u6982\u8ff0<\/h2>\n\n\n\n<p><code>Llama-3.1-8B-Fusion-9010<\/code>\u662f\u4e00\u4e2a\u6df7\u5408\u6a21\u578b\uff0c\u5b83\u7ed3\u5408\u4e86\u4e24\u4e2a\u5f3a\u5927\u7684\u57fa\u4e8e Llama \u7684\u6a21\u578b\u7684\u4f18\u52bf\uff1a<a href=\"https:\/\/huggingface.co\/arcee-ai\/Llama-3.1-SuperNova-Lite\">arcee-ai\/Llama-3.1-SuperNova-Lite<\/a>&nbsp;\u548c&nbsp;<a href=\"https:\/\/huggingface.co\/mlabonne\/Meta-Llama-3.1-8B-Instruct-abliterated\">mlabonne\/Meta-Llama-3.1-8B-Instruct-abliterated<\/a>\u3002\u6743\u91cd\u4ee5 9\uff1a1 \u7684\u6bd4\u4f8b\u6df7\u5408\uff0c\u5176\u4e2d 90% \u7684\u6743\u91cd\u6765\u81ea SuperNova-Lite\uff0c10% \u6765\u81ea\u88ab\u5220\u51cf\u7684 Meta-Llama-3.1-8B-Instruct \u6a21\u578b\u3002<strong>\u867d\u7136\u662f\u7b80\u5355\u7684\u6df7\u5408\uff0c\u4f46\u6a21\u578b\u662f\u53ef\u7528\u7684\uff0c\u5e76\u4e14\u6ca1\u6709\u51fa\u73b0\u4e71\u7801<\/strong>\u3002 \u8fd9\u662f\u4e00\u4e2a\u5b9e\u9a8c\u3002\u6211\u5206\u522b\u6d4b\u8bd5&nbsp;<a href=\"https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-9010\">9\uff1a1<\/a>\u3001<a href=\"https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-8020\">8\uff1a2<\/a>\u3001<a href=\"https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-7030\">7\uff1a3<\/a>\u3001<a href=\"https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-6040\">6\uff1a4<\/a>&nbsp;\u548c&nbsp;<a 
href=\"https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-5050\">5\uff1a5<\/a>&nbsp;\u7684\u6bd4\u7387\uff0c\u4ee5\u67e5\u770b\u5b83\u4eec\u5bf9\u6a21\u578b\u7684\u5f71\u54cd\u6709\u591a\u5927\u3002 \u6240\u6709\u6a21\u578b\u8bc4\u4f30\u62a5\u544a\u5c06\u5728\u968f\u540e\u63d0\u4f9b\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\"><a href=\"https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-9010#model-details\"><\/a>\u6a21\u578b\u8be6\u7ec6\u4fe1\u606f<\/h2>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>\u57fa\u7840\u6a21\u578b\uff1a<\/strong>\n<ul class=\"wp-block-list\">\n<li><a href=\"https:\/\/huggingface.co\/arcee-ai\/Llama-3.1-SuperNova-Lite\">arcee-ai\/Llama-3.1-SuperNova-Lite<\/a>\u00a0\uff0890%\uff09<\/li>\n\n\n\n<li><a href=\"https:\/\/huggingface.co\/mlabonne\/Meta-Llama-3.1-8B-Instruct-abliterated\">mlabonne\/Meta-Llama-3.1-8B-Instruct-abliterated<\/a>\u00a0\uff0810%\uff09<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li><strong>\u6a21\u578b\u5927\u5c0f\uff1a<\/strong>8B \u53c2\u6570<\/li>\n\n\n\n<li><strong>\u67b6\u6784\uff1a<\/strong>Meta 3.1<\/li>\n\n\n\n<li><strong>\u6df7\u5408\u6bd4\u4f8b\uff1a<\/strong>9\uff1a1 \uff08SuperNova-Lite\uff1aMeta-Llama-3.1-8B-Instruct-abliterated\uff09<\/li>\n<\/ul>\n\n\n\n<h2 class=\"wp-block-heading\"><a href=\"https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-9010#key-features\"><\/a>\u4e3b\u8981\u7279\u70b9<\/h2>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>SuperNova-Lite \u8d21\u732e \uff0890%\uff09\uff1a<\/strong>Llama-3.1-SuperNova-Lite \u662f Arcee.ai \u5f00\u53d1\u7684\u4e00\u4e2a 8B \u53c2\u6570\u6a21\u578b\uff0c\u57fa\u4e8e Llama-3.1-8B-Instruct \u67b6\u6784\u3002<\/li>\n\n\n\n<li><strong>Meta-Llama-3.1-8B-Instruct-abliterated \u8d21\u732e \uff0810%\uff09\uff1a<\/strong>\u8fd9\u662f Llama 3.1 8B Instruct \u7684\u672a\u7ecf\u5ba1\u67e5\u7248\u672c\uff0c\u4f7f\u7528\u6d88\u878d\u521b\u5efa\u3002<\/li>\n<\/ul>\n\n\n\n<h2 class=\"wp-block-heading\"><a 
href=\"https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-9010#usage\"><\/a>\u7528\u6cd5<\/h2>\n\n\n\n<p>\u60a8\u53ef\u4ee5\u901a\u8fc7\u4f7f\u7528 Hugging Face \u7684\u00a0<code>transformers<\/code>\u00a0\u5e93\u52a0\u8f7d\u5b83\u6765\u5728\u60a8\u7684\u5e94\u7528\u7a0b\u5e8f\u4e2d\u4f7f\u7528\u8fd9\u4e2a\u6df7\u5408\u6a21\u578b\uff1a<\/p>\n\n\n\n<div class=\"wp-block-urvanov-syntax-highlighter-code-block\"><pre class=\"lang:python decode:true \" >import torch\nfrom transformers import AutoModelForCausalLM, AutoTokenizer, TextStreamer\nimport time\n\nmixed_model_name = \"huihui-ai\/Llama-3.1-8B-Fusion-9010\"\n\n# Check if CUDA is available\ndevice = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n\n# Load model and tokenizer\nmixed_model = AutoModelForCausalLM.from_pretrained(mixed_model_name, device_map=device, torch_dtype=torch.bfloat16)\ntokenizer = AutoTokenizer.from_pretrained(mixed_model_name)\n\n# Ensure the tokenizer has pad_token_id set\ntokenizer.pad_token_id = tokenizer.eos_token_id\n\n# Input loop\nprint(\"Start inputting text for inference (type 'exit' to quit)\")\nwhile True:\n    prompt = input(\"Enter your prompt: \")\n    if prompt.lower() == \"exit\":\n        print(\"Exiting inference loop.\")\n        break\n\n    # Inference phase: Generate text using the modified model\n    chat = [\n        {\"role\": \"system\", \"content\": \"You are a helpful assistant.\"},\n        {\"role\": \"user\", \"content\": prompt}\n    ]\n\n    # Prepare input data\n    input_ids = tokenizer.apply_chat_template(\n        chat, tokenize=True, add_generation_prompt=True, return_tensors=\"pt\"\n    ).to(device)\n\n    # Use TextStreamer for streaming output\n    streamer = TextStreamer(tokenizer, skip_special_tokens=True)\n\n    # Record the start time\n    start_time = time.time()\n\n    # Generate text and stream output character by character\n    outputs = mixed_model.generate(\n        input_ids,\n        max_new_tokens=8192,\n        
do_sample=True,\n        temperature=0.6,\n        top_p=0.9,\n        streamer=streamer  # Enable streaming output\n    )\n\n    # Record the end time\n    end_time = time.time()\n\n    # Calculate the number of generated tokens\n    generated_tokens = outputs[0][input_ids.shape[-1]:].shape[0]\n\n    # Calculate the total time taken\n    total_time = end_time - start_time\n\n    # Calculate tokens generated per second\n    tokens_per_second = generated_tokens \/ total_time\n\n    print(f\"\\nGenerated {generated_tokens} tokens in total, took {total_time:.2f} seconds, generating {tokens_per_second:.2f} tokens per second.\")\n<\/pre><\/div>\n\n\n\n<h2 class=\"wp-block-heading\"><a href=\"https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-9010#evaluations\"><\/a>\u8bc4\u4f30<\/h2>\n\n\n\n<p>\u4ee5\u4e0b\u6570\u636e\u5df2\u91cd\u65b0\u8bc4\u4f30\u5e76\u8ba1\u7b97\u4e3a\u6bcf\u6b21\u6d4b\u8bd5\u7684\u5e73\u5747\u503c\u3002<\/p>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th>Benchmark<\/th><th>SuperNova-Lite<\/th><th>Meta-Llama-3.1-8B-Instruct-abliterated<\/th><th>Llama-3.1-8B-Fusion-9010<\/th><th>Llama-3.1-8B-Fusion-8020<\/th><th>Llama-3.1-8B-Fusion-7030<\/th><th>Llama-3.1-8B-Fusion-6040<\/th><th>Llama-3.1-8B-Fusion-5050<\/th><\/tr><\/thead><tbody><tr><td>IF_Eval<\/td><td>82.09<\/td><td>76.29<\/td><td>82.44<\/td><td>82.93<\/td><td><strong>83.10<\/strong><\/td><td>82.94<\/td><td>82.03<\/td><\/tr><tr><td>MMLU 
Pro<\/td><td><strong>35.87<\/strong><\/td><td>33.1<\/td><td>35.65<\/td><td>35.32<\/td><td>34.91<\/td><td>34.5<\/td><td>33.96<\/td><\/tr><tr><td>TruthfulQA<\/td><td><strong>64.35<\/strong><\/td><td>53.25<\/td><td>62.67<\/td><td>61.04<\/td><td>59.09<\/td><td>57.8<\/td><td>56.75<\/td><\/tr><tr><td>BBH<\/td><td><strong>49.48<\/strong><\/td><td>44.87<\/td><td>48.86<\/td><td>48.47<\/td><td>48.30<\/td><td>48.19<\/td><td>47.93<\/td><\/tr><tr><td>GPQA<\/td><td>31.98<\/td><td>29.50<\/td><td>32.25<\/td><td>32.38<\/td><td><strong>32.61<\/strong><\/td><td>31.14<\/td><td>30.6<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<p>\u539f\u6587\u94fe\u63a5\uff1a<a href=\"https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-9010\">https:\/\/huggingface.co\/huihui-ai\/Llama-3.1-8B-Fusion-9010<\/a><\/p>\n\n\n\n<p><\/p>\n","protected":false},"excerpt":{"rendered":"<p>\u6982\u8ff0 Llama-3.1-8B-Fusion-9010\u662f\u4e00\u4e2a\u6df7\u5408\u6a21\u578b\uff0c\u5b83\u7ed3\u5408\u4e86\u4e24\u4e2a\u5f3a\u5927\u7684\u57fa\u4e8e Llama \u7684\u6a21 
[&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"site-sidebar-layout":"default","site-content-layout":"","ast-site-content-layout":"default","site-content-style":"default","site-sidebar-style":"default","ast-global-header-display":"","ast-banner-title-visibility":"","ast-main-header-display":"","ast-hfb-above-header-display":"","ast-hfb-below-header-display":"","ast-hfb-mobile-header-display":"","site-post-title":"","ast-breadcrumbs-content":"","ast-featured-img":"","footer-sml-layout":"","theme-transparent-header-meta":"","adv-header-id-meta":"","stick-header-meta":"","header-above-stick-meta":"","header-main-stick-meta":"","header-below-stick-meta":"","astra-migrate-meta-layouts":"set","ast-page-background-enabled":"default","ast-page-background-meta":{"desktop":{"background-color":"var(--ast-global-color-4)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"tablet":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"mobile":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""}},"ast-content-background-meta":{"desktop":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center 
center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"tablet":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"mobile":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""}},"_jetpack_memberships_contains_paid_content":false,"footnotes":""},"categories":[444,443,442],"tags":[559,558],"class_list":["post-4776","post","type-post","status-publish","format-standard","hentry","category-ai","category-llm","category-llms","tag-funsion","tag-llama-3-1"],"views":2617,"jetpack_sharing_enabled":true,"jetpack_featured_media_url":"","_links":{"self":[{"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/posts\/4776","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=4776"}],"version-history":[{"count":2,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/posts\/4776\/revisions"}],"predecessor-version":[{"id":4778,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=\/wp\/v2\/posts\/4776\/revisions\/4778"}]
,"wp:attachment":[{"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=4776"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=4776"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.aqwu.net\/wp\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=4776"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}