{"id":1706,"date":"2023-07-02T20:45:31","date_gmt":"2023-07-02T11:45:31","guid":{"rendered":"https:\/\/fukugyouhistory.tokyo\/?p=1706"},"modified":"2023-10-31T00:27:00","modified_gmt":"2023-10-30T15:27:00","slug":"rinna%e3%81%ae%e6%97%a5%e6%9c%ac%e8%aa%9e%e7%89%b9%e5%8c%96gpt%e8%a8%80%e8%aa%9e%e3%83%a2%e3%83%87%e3%83%ab%e3%80%80google-colab%e3%81%ae%e7%84%a1%e6%96%99%e6%9e%a0%e3%81%a7%e5%8b%95%e3%81%8b%e3%81%97","status":"publish","type":"post","link":"https:\/\/fukugyouhistory.tokyo\/?p=1706","title":{"rendered":"Rinna\u793e\u306e\u65e5\u672c\u8a9e\u7279\u5316GPT\u8a00\u8a9e\u30e2\u30c7\u30eb\u3000Google Colab\u306e\u7121\u6599\u67a0\u3067\u52d5\u304b\u3057\u3066\u307f\u305f\u3000"},"content":{"rendered":"\n<p>\u4e45\u3057\u304f\u66f4\u65b0\u3067\u304d\u3066\u3044\u307e\u305b\u3093\u3067\u3057\u305f\u3002<\/p>\n\n\n\n<p>2023\u5e745\u6708\u306bRinna\u793e\u304c\u516c\u958b\u3057\u305f<a href=\"https:\/\/huggingface.co\/rinna\/japanese-gpt-neox-3.6b-instruction-ppo\" target=\"_blank\" rel=\"noreferrer noopener\">\u65e5\u672c\u8a9e\u306b\u7279\u5316\u3057\u305f36\u5104\u30d1\u30e9\u30e1\u30fc\u30bf\u3092\u6301\u3064\u5bfe\u8a71GPT\u8a00\u8a9e\u30e2\u30c7\u30eb<\/a>\u3092\u5b9f\u884c\u3057\u3066\u884c\u304d\u307e\u3059\u3002<br>GPU\u30e1\u30e2\u30ea\u30b5\u30a4\u30ba\u306b\u5fdc\u3058\u3066\u3001model\u8aad\u307f\u8fbc\u307f\u306e\u30aa\u30d7\u30b7\u30e7\u30f3\u5909\u66f4\u3067\u304d\u308b\u3088\u3046\u3067\u3059\u3002<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u6307\u5b9a\u306a\u3057<\/li>\n\n\n\n<li>torch_dtype=torch.float16<\/li>\n\n\n\n<li>load_in_8bit=True<\/li>\n\n\n\n<li>load_in_4bit=True<\/li>\n<\/ul>\n\n\n\n<p>\u4eca\u56de\u306f\u3001\u300cload_in_8bit=True\u300d\u3092\u6307\u5b9a\u3057\u3066\u52d5\u304b\u3057\u3066\u3044\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<p><\/p>\n\n\n\n<!--more-->\n\n\n\n<h2 class=\"wp-block-heading\">Rinna\u306e\u65e5\u672c\u8a9e\u7279\u5316GPT\u8a00\u8a9e\u30e2\u30c7\u30eb\u3000\u5b9f\u884c<\/h2>\n\n\n\n<p><a rel=\"noreferrer 
noopener\" href=\"https:\/\/colab.research.google.com\/?hl=ja\" target=\"_blank\">Google Colaboratory<\/a>\u306b\u30a2\u30af\u30bb\u30b9\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<p>\u6700\u521d\u306b\u3001\u300c\u7de8\u96c6\u300d\u2192\u300c\u30ce\u30fc\u30c8\u30d6\u30c3\u30af\u306e\u8a2d\u5b9a\u300d\u304b\u3089\u3001<br>\u30cf\u30fc\u30c9\u30a6\u30a7\u30a2\u30a2\u30af\u30bb\u30e9\u30ec\u30fc\u30bf\u3092\u300cGPU\u300d\u306b\u8a2d\u5b9a\u3057\u307e\u3057\u3087\u3046\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image\"><img decoding=\"async\" width=\"880\" height=\"343\" sizes=\"(max-width: 880px) 100vw, 880px\" src=\"https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/03\/image-35.png\" alt=\"\" class=\"wp-image-182\" srcset=\"https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/03\/image-35.png 880w, https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/03\/image-35-300x117.png 300w, https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/03\/image-35-768x299.png 768w\" \/><\/figure>\n\n\n\n<p>\u4ee5\u4e0b\u306e\u30b3\u30de\u30f3\u30c9\u3092\u5165\u529b\u3057\u3001Shift+Enter\u3092\u62bc\u3057\u3066\u5b9f\u884c\u3057\u307e\u3057\u3087\u3046\u3002<br>GPU\u306e\u60c5\u5831\u304c\u51fa\u3066\u304f\u308c\u3070\u3001\u6b63\u5e38\u306b\u8a2d\u5b9a\u5909\u66f4\u3067\u304d\u3066\u3044\u307e\u3059\u3002<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>!nvidia-smi<\/code><\/pre>\n\n\n\n<p>\u7d9a\u3051\u3066\u30b3\u30fc\u30c9\u3092\u8a18\u8f09\u3057\u3066\u3044\u304d\u307e\u3059\u3002\u5fc5\u8981\u306a\u30e9\u30a4\u30d6\u30e9\u30ea\u3092\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3057\u307e\u3057\u3087\u3046\u3002<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>!pip install transformers\n!pip install SentencePiece\n!pip install Accelerate\n!pip install 
bitsandbytes<\/code><\/pre>\n\n\n\n<p>\u7d39\u4ecb\u3055\u308c\u3066\u3044\u308b\u30b5\u30f3\u30d7\u30eb\u30b3\u30fc\u30c9\u306e\u30aa\u30d7\u30b7\u30e7\u30f3\u90e8\u5206\u3092\u5909\u66f4\u3057\u3066\u3001\u4ee5\u4e0b\u306e\u30b3\u30fc\u30c9\u3067\u5b9f\u884c\u3057\u3066\u3044\u304d\u307e\u3059\u3002<br>\u300cdevice_map={&quot;&quot;: 0}\u300d\u306e\u8ffd\u52a0\u3001\u300cmodel.to(&quot;cuda&quot;)\u300d\u90e8\u5206\u306e\u30b3\u30e1\u30f3\u30c8\u30a2\u30a6\u30c8\u304c\u8ffd\u52a0\u3067\u5fc5\u8981\u306a\u3088\u3046\u3067\u3059\u3002<br>\uff08\u300cmodel.to(&quot;cuda&quot;)\u300d\u90e8\u5206\u3092\u30b3\u30e1\u30f3\u30c8\u30a2\u30a6\u30c8\u3057\u3066\u3082\u3001GPU\u3067\u52d5\u4f5cOK\uff09<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>import torch\nfrom transformers import AutoTokenizer, AutoModelForCausalLM\n\nmodel_name = \"rinna\/japanese-gpt-neox-3.6b-instruction-ppo\"\ntokenizer = AutoTokenizer.from_pretrained(model_name, use_fast=False)\nmodel = AutoModelForCausalLM.from_pretrained(model_name,\n    # torch_dtype=torch.float16,\n    device_map={\"\": 0},\n    load_in_8bit=True\n    )\n\n# if torch.cuda.is_available():\n#     model = model.to(\"cuda\")<\/code><\/pre>\n\n\n\n<pre class=\"wp-block-code\"><code>prompt = &#91;\n    {\n        \"speaker\": \"\u30e6\u30fc\u30b6\u30fc\",\n        \"text\": \"\u6b21\u306e\u6587\u7ae0\u306e\u8a02\u6b63\u3057\u3066\u304f\u3060\u3055\u3044\u3002\u300c\u4eca\u65e5\u306f\u71b1\u3044\u4e00\u65e5\u3067\u3059\u300d\"\n    }\n]\n\nprompt = &#91;\n    f\"{uttr&#91;'speaker']}: {uttr&#91;'text']}\"\n    for uttr in prompt\n]\n\nprompt = \"&lt;NL&gt;\".join(prompt)\n\nprompt = (\n    prompt\n    + \"&lt;NL&gt;\"\n    + \"\u30b7\u30b9\u30c6\u30e0: \"\n)<\/code><\/pre>\n\n\n\n<pre class=\"wp-block-code\"><code>token_ids = tokenizer.encode(prompt, add_special_tokens=False, return_tensors=\"pt\")\n\nwith torch.no_grad():\n    output_ids = model.generate(\n        token_ids.to(model.device),\n        do_sample=True,\n        
max_new_tokens=128,\n        temperature=0.7,\n        repetition_penalty=1.1,\n        pad_token_id=tokenizer.pad_token_id,\n        bos_token_id=tokenizer.bos_token_id,\n        eos_token_id=tokenizer.eos_token_id\n    )\n\noutput = tokenizer.decode(output_ids.tolist()&#91;0]&#91;token_ids.size(1):])\noutput = output.replace(\"&lt;NL&gt;\", \"\\n\")\nprint(output)<\/code><\/pre>\n\n\n\n<p>\u30e2\u30c7\u30eb\u306e\u8aad\u307f\u8fbc\u307f\u6642\u306b\u30e9\u30a4\u30d6\u30e9\u30ea\u306e\u6ce8\u610f\u30e1\u30c3\u30bb\u30fc\u30b8\u304c\u51fa\u307e\u3057\u305f\u304c\u3001\u7121\u4e8b\u306b\u5b9f\u884c\u3067\u304d\u307e\u3057\u305f\u3002<br>\u5b9f\u884c\u6642\u306eGPU\u30e1\u30e2\u30ea\u306e\u30b5\u30a4\u30ba\u306f5GB\u7a0b\u5ea6\u3067\u3001\u3061\u3083\u3093\u3068Google Colab\u306e\u7121\u6599\u67a0\u3067\u52d5\u4f5c\u3057\u307e\u3057\u305f\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image size-full\"><img data-dominant-color=\"f7f7f7\" data-has-transparency=\"false\" style=\"--dominant-color: #f7f7f7;\" decoding=\"async\" width=\"338\" height=\"42\" sizes=\"(max-width: 338px) 100vw, 338px\" src=\"https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/07\/image-3.png\" alt=\"\" class=\"wp-image-1719 not-transparent\" srcset=\"https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/07\/image-3.png 338w, https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/07\/image-3-300x37.png 300w\" \/><\/figure>\n\n\n\n<p><a rel=\"noreferrer noopener\" href=\"https:\/\/note.com\/npaka\/n\/n6fe8d930b114\" 
target=\"_blank\">npaka\u3055\u3093\u306e\u8a18\u4e8b<\/a>\u306b\u3066\u3001\u6bd4\u8f03\u3057\u305f\u7d50\u679c\u304c\u8f09\u3063\u3066\u304a\u308a\u307e\u3057\u305f\u306e\u3067\u3001\u5f15\u7528\u3057\u307e\u3059\u3068\u3001<br>\u8a2d\u5b9a\u306a\u3057\uff08float32\uff09\u3060\u306815GB\u7a0b\u5ea6\u3001float16\u3060\u30688GB\u7a0b\u5ea6\u3001int8\u3060\u30685GB\u7a0b\u5ea6\u3067\u52d5\u4f5c\u3059\u308b\u3088\u3046\u3067\u3059\u3002<br>\uff08\u901a\u5e38\u3001\u30e1\u30e2\u30ea\u4f7f\u7528\u91cf\u304c\u6e1b\u308b\u5206\u3001\u30c8\u30ec\u30fc\u30c9\u30aa\u30d5\u3068\u3057\u3066LLM\u306e\u7cbe\u5ea6\u304c\u4f4e\u4e0b\u3059\u308b\u3068\u306e\u3053\u3068\uff09<\/p>\n\n\n\n<hr class=\"wp-block-separator has-alpha-channel-opacity\"\/>\n\n\n\n<h2 class=\"wp-block-heading\">\u30d7\u30ed\u30f3\u30d7\u30c8\u306e\u4e0e\u3048\u65b9\u3092\u5909\u3048\u3066\u307f\u308b<\/h2>\n\n\n\n<p>\u4ee5\u4e0b\u306e\u3088\u3046\u306b\u30b5\u30f3\u30d7\u30eb\u3092\u4e0e\u3048\u3066\u3001\u30d7\u30ed\u30f3\u30d7\u30c8\u3092\u5b9f\u884c\u3057\u3066\u307f\u307e\u3057\u305f\u3002<br>\u5b9f\u884c\u90e8\u5206\u306e\u30b3\u30fc\u30c9\u306f\u5909\u308f\u308a\u307e\u305b\u3093\u3002<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>prompt = &#91;\n    {\n        \"speaker\": \"\u30e6\u30fc\u30b6\u30fc\",\n        \"text\": \"\u4f1a\u793e\u540d\uff1aApple Inc.\u3001\u5275\u7acb\uff1a1976\u5e744\u67081\u65e5\u3001\u5f93\u696d\u54e1\u6570\uff1a154,000\u4eba\u3001\u4e8b\u696d\u5185\u5bb9\uff1a\u30c7\u30b8\u30bf\u30eb\u5bb6\u5ead\u96fb\u5316\u88fd\u54c1\u3001\u30bd\u30d5\u30c8\u30a6\u30a7\u30a2\u3001\u30aa\u30f3\u30e9\u30a4\u30f3\u30b5\u30fc\u30d3\u30b9\u306e\u958b\u767a\u30fb\u8ca9\u58f2\"\n    },\n    {\n        \"speaker\": \"\u30b7\u30b9\u30c6\u30e0\",\n        \"text\": \"Apple 
Inc.\u306f\u30011976\u5e744\u67081\u65e5\u306b\u5275\u7acb\u3055\u308c\u3001\u5f93\u696d\u54e1\u6570\u306f154,000\u4eba\u3092\u62b1\u3048\u307e\u3059\u3002\u4e8b\u696d\u5185\u5bb9\u3068\u3057\u3066\u306f\u3001\u30c7\u30b8\u30bf\u30eb\u5bb6\u5ead\u96fb\u5316\u88fd\u54c1\u3001\u30bd\u30d5\u30c8\u30a6\u30a7\u30a2\u3001\u30aa\u30f3\u30e9\u30a4\u30f3\u30b5\u30fc\u30d3\u30b9\u306e\u958b\u767a\u30fb\u8ca9\u58f2\u3092\u884c\u3063\u3066\u3044\u307e\u3059\u3002\"\n    },\n    {\n        \"speaker\": \"\u30e6\u30fc\u30b6\u30fc\",\n        \"text\": \"\u4f1a\u793e\u540d\uff1aMeta Platforms, Inc.\u3001\u5275\u7acb\uff1a2004\u5e742\u67084\u65e5\u3001\u5f93\u696d\u54e1\u6570\uff1a52,534\u4eba\u3001\u4e8b\u696d\u5185\u5bb9\uff1a\u4e16\u754c\u7684\u306b\u5c55\u958b\u3055\u308c\u3066\u3044\u308b\u30bd\u30fc\u30b7\u30e3\u30eb\u30fb\u30cd\u30c3\u30c8\u30ef\u30fc\u30ad\u30f3\u30b0\u30fb\u30b5\u30fc\u30d3\u30b9\u306e\u904b\u55b6\"\n    }\n]\n\nprompt = &#91;\n    f\"{uttr&#91;'speaker']}: {uttr&#91;'text']}\"\n    for uttr in prompt\n]\n\nprompt = \"&lt;NL&gt;\".join(prompt)\n\nprompt = (\n    prompt\n    + \"&lt;NL&gt;\"\n    + \"\u30b7\u30b9\u30c6\u30e0: \"\n)<\/code><\/pre>\n\n\n\n<pre class=\"wp-block-code\"><code>token_ids = tokenizer.encode(prompt, add_special_tokens=False, return_tensors=\"pt\")\n\nwith torch.no_grad():\n    output_ids = model.generate(\n        token_ids.to(model.device),\n        do_sample=True,\n        max_new_tokens=128,\n        temperature=0.7,\n        repetition_penalty=1.1,\n        pad_token_id=tokenizer.pad_token_id,\n        bos_token_id=tokenizer.bos_token_id,\n        eos_token_id=tokenizer.eos_token_id\n    )\n\noutput = tokenizer.decode(output_ids.tolist()&#91;0]&#91;token_ids.size(1):])\noutput = output.replace(\"&lt;NL&gt;\", 
\"\\n\")\nprint(output)<\/code><\/pre>\n\n\n\n<p>\u7d50\u679c\u306f\u4ee5\u4e0b\u306e\u901a\u308a\u3002\u601d\u60d1\u901a\u308a\u306e\u6587\u7ae0\u3092\u4f5c\u6210\u3057\u3066\u304f\u308c\u307e\u3057\u305f\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image size-full\"><img data-dominant-color=\"eaeaea\" data-has-transparency=\"false\" style=\"--dominant-color: #eaeaea;\" decoding=\"async\" width=\"808\" height=\"30\" sizes=\"(max-width: 808px) 100vw, 808px\" src=\"https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/07\/image-4.png\" alt=\"\" class=\"wp-image-1727 not-transparent\" srcset=\"https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/07\/image-4.png 808w, https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/07\/image-4-300x11.png 300w, https:\/\/fukugyouhistory.tokyo\/wp-content\/uploads\/2023\/07\/image-4-768x29.png 768w\" \/><\/figure>\n\n\n\n<pre class=\"wp-block-preformatted\">Meta Platforms, Inc.\u306f\u30012004\u5e742\u67084\u65e5\u306b\u5275\u7acb\u3055\u308c\u305f\u30a2\u30e1\u30ea\u30ab\u306e\u4f01\u696d\u3067\u3001\u5f93\u696d\u54e1\u306f52,534\u4eba\u3067\u3059\u3002\u4e8b\u696d\u5185\u5bb9\u306f\u3001\u4e16\u754c\u7684\u306b\u5c55\u958b\u3055\u308c\u3066\u3044\u308b\u30bd\u30fc\u30b7\u30e3\u30eb\u30fb\u30cd\u30c3\u30c8\u30ef\u30fc\u30ad\u30f3\u30b0\u30fb\u30b5\u30fc\u30d3\u30b9\u306e\u904b\u55b6\u3067\u3059\u3002&lt;\/s&gt;\n<\/pre>\n\n\n\n<p>\u30b5\u30f3\u30d7\u30eb\u306e\u4e0e\u3048\u65b9\u6b21\u7b2c\u3067\u53ef\u80fd\u6027\u304c\u5e83\u304c\u308a\u305d\u3046\u3067\u3059\u3002<br>\u65e2\u5b58\u306e\u30b5\u30f3\u30d7\u30eb\u3092\u5143\u306b\u3057\u3066\u6587\u7ae0\u3092\u4f5c\u6210\u3059\u308b\u5206\u306b\u306f\u3001\u7cbe\u5ea6\u9ad8\u304f\u3067\u304d\u305d\u3046\u306a\u671f\u5f85\u611f\u304c\u3042\u308a\u307e\u3059<\/p>\n\n\n\n<hr class=\"wp-block-separator has-alpha-channel-opacity\"\/>\n\n\n\n<p>\u4eca\u56de\u306f\u3068\u308a\u3042\u3048\u305a\u30b5\u30f3\u30d7\u30eb\u30b3\u30fc\u30c9\u3092\u5143\u306b\u3001Google 
Colab\u306e\u7121\u6599\u67a0\u3067\u5b9f\u884c\u3057\u305f\u306e\u3067\u3059\u304c\u3001<br>\u4f7f\u3044\u65b9\u6b21\u7b2c\uff08\u30d7\u30ed\u30f3\u30d7\u30c8\u306e\u4e0e\u3048\u65b9\u6b21\u7b2c\uff09\u3067\u3059\u3054\u304f\u4f7f\u3044\u52dd\u624b\u304c\u826f\u304f\u306a\u308a\u305d\u3046\u3067\u3059\u3002<\/p>\n\n\n\n<p>\u5916\u90e8\u306b\u30c7\u30fc\u30bf\u3092\u9001\u3089\u305a\u306b\u30ed\u30fc\u30ab\u30eb\u3067\u5b9f\u884c\u3067\u304d\u308b\u5206\u3001\u5916\u90e8\u306b\u60c5\u5831\u3092\u63d0\u4f9b\u3067\u304d\u306a\u3044\u74b0\u5883\u3067\u6709\u7528\u304b\u3068\u3002<\/p>\n\n\n\n<p>\u3068\u308a\u3042\u3048\u305a\u3001\u3053\u3053\u307e\u3067\u3002<\/p>\n\n\n\n<hr class=\"wp-block-separator has-alpha-channel-opacity\"\/>\n\n\n\n<h2 class=\"wp-block-heading\">\u53c2\u8003<\/h2>\n\n\n\n<p>CTranslate2\u3092\u4f7f\u7528\u3057\u3066\u30e2\u30c7\u30eb\u5909\u63db\u3092\u5b9f\u884c\u3059\u308b\u3068\u3001\u8efd\u91cf\uff0bCPU\u306e\u307f\u3067\u3082\u63a8\u8ad6\u306e\u5b9f\u884c\u304c\u53ef\u80fd\u306b\u306a\u308b\u3068\u306e\u3053\u3068\u3002<br><s>Google Colab\u306e\u7121\u6599\u67a0\u3067\u306f\u5909\u63db\u306b\u5fc5\u8981\u306a\u30e1\u30e2\u30ea\u304c\u8db3\u308a\u305a\u8a66\u3057\u3066\u3044\u306a\u3044\u306e\u3067\u3001\u53c2\u8003\u306b\u66f8\u304d\u7559\u3081\u3066\u304a\u304d\u307e\u3059\u3002<\/s><br><s>\uff08GPU\u304c\u306a\u304f\u3066\u3082\u3001\u30e1\u30e2\u30ea\u3055\u3048\u5927\u5bb9\u91cf\u304c\u78ba\u4fdd\u3067\u304d\u308c\u3070\u5b9f\u884c\u3067\u304d\u308b\u306e\u3067\u3001\u671f\u5f85\u611f\u304c\u3042\u308a\u307e\u3059\uff09<\/s><br>\u2192\u3000\u30e1\u30e2\u30ea64GB\u306e\u74b0\u5883\u3067\u30c6\u30b9\u30c8\u3059\u308b\u6a5f\u4f1a\u304c\u3042\u308a\u3001\u5b9f\u969b\u306b\u52d5\u304b\u3057\u3066\u307f\u307e\u3057\u305f\uff082023\/10\/29\uff09\u3002<\/p>\n\n\n\n<p>\u53c2\u8003\u60c5\u5831\u306f\u3001\u540c\u3058\u304f<a rel=\"noreferrer noopener\" href=\"https:\/\/note.com\/npaka\/n\/nd493e282e5e9\" 
target=\"_blank\">npaka\u3055\u3093\u306e\u8a18\u4e8b<\/a>\u3088\u308a\u3002<\/p>\n\n\n\n<p>\uff1c\u30e2\u30c7\u30eb\u306e\u5909\u63db\uff1e<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>!pip install ctranslate2\n!pip install sentencepiece transformers<\/code><\/pre>\n\n\n\n<pre class=\"wp-block-code\"><code>!ct2-transformers-converter \\\n    --model rinna\/japanese-gpt-neox-3.6b-instruction-ppo \\\n    --quantization int8 \\\n    --output_dir .\/rinna_ppo-ct2 \\\n    --low_cpu_mem_usage<\/code><\/pre>\n\n\n\n<p>\u203b\u300cYou are using the default legacy behaviour of the &lt;class \u2026\u300d\u3068\u30e1\u30c3\u30bb\u30fc\u30b8\u304c\u51fa\u307e\u3059\u304c\u3001<br>\u3000\u3068\u308a\u3042\u3048\u305a\u300c--output_dir\u300d\u3067\u6307\u5b9a\u3057\u305f\u30d5\u30a9\u30eb\u30c0\u306b\u30013\u500b\u306e\u30d5\u30a1\u30a4\u30eb\u304c\u554f\u984c\u306a\u304f\u4f5c\u6210\u3055\u308c\u3066\u3044\u308b\u306f\u305a\u3067\u3059\u3002<br>\u3000\uff08config.json\u3001model.bin\u3001vocabulary.txt\uff09<br>\u3000\u4e0b\u8a18\u306etokenizer\u30aa\u30d7\u30b7\u30e7\u30f3\u306b\u300clegacy=False\u300d\u3092\u5165\u308c\u308b\u3053\u3068\u3067\u3001\u30e2\u30c7\u30eb\u5b9f\u884c\u6642\u306b\u306f\u4e0a\u8a18\u8868\u793a\u306f\u56de\u907f\u3067\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<p>\uff1c\u63a8\u8ad6\u306e\u5b9f\u884c\uff1e<\/p>\n\n\n\n<pre class=\"wp-block-code\"><code>import ctranslate2\nimport transformers\nimport torch\n\nmodel_name = \"rinna\/japanese-gpt-neox-3.6b-instruction-ppo\"\nct2_model = \".\/rinna_ppo-ct2\"\n\n# \u30b8\u30a7\u30cd\u30ec\u30fc\u30bf\u30fc\u3068\u30c8\u30fc\u30af\u30ca\u30a4\u30b6\u30fc\u306e\u6e96\u5099\ndevice = \"cuda\" if torch.cuda.is_available() else \"cpu\"\ngenerator = ctranslate2.Generator(ct2_model, device=device)\ntokenizer = transformers.AutoTokenizer.from_pretrained(model_name, use_fast=False, legacy=False)<\/code><\/pre>\n\n\n\n<pre class=\"wp-block-code\"><code>prompt = &#91;\n    {\n        \"speaker\": 
\"\u30e6\u30fc\u30b6\u30fc\",\n        \"text\": \"\u6b21\u306e\u6587\u7ae0\u306e\u8a02\u6b63\u3057\u3066\u304f\u3060\u3055\u3044\u3002\u300c\u4eca\u65e5\u306f\u71b1\u3044\u4e00\u65e5\u3067\u3059\u300d\"\n    }\n]\n\nprompt = &#91;\n    f\"{uttr&#91;'speaker']}: {uttr&#91;'text']}\"\n    for uttr in prompt\n]\n\nprompt = \"&lt;NL&gt;\".join(prompt)\n\nprompt = (\n    prompt\n    + \"&lt;NL&gt;\"\n    + \"\u30b7\u30b9\u30c6\u30e0: \"\n)<\/code><\/pre>\n\n\n\n<pre class=\"wp-block-code\"><code>tokens = tokenizer.convert_ids_to_tokens(\n    tokenizer.encode(prompt, add_special_tokens=False)\n)\nresults = generator.generate_batch(\n    &#91;tokens],\n    max_length=64,\n    sampling_topk=10,\n    sampling_temperature=0.7,\n    include_prompt_in_result=False,\n)\ntext = tokenizer.decode(results&#91;0].sequences_ids&#91;0])\nprint(text)<\/code><\/pre>\n","protected":false},"excerpt":{"rendered":"<p>\u4e45\u3057\u304f\u66f4\u65b0\u3067\u304d\u3066\u3044\u307e\u305b\u3093\u3067\u3057\u305f\u3002 2023\u5e745\u6708\u306bRinna\u793e\u304c\u516c\u958b\u3057\u305f\u65e5\u672c\u8a9e\u306b\u7279\u5316\u3057\u305f36\u5104\u30d1\u30e9\u30e1\u30fc\u30bf\u3092\u6301\u3064\u5bfe\u8a71GPT\u8a00\u8a9e\u30e2\u30c7\u30eb\u3092\u5b9f\u884c\u3057\u3066\u884c\u304d\u307e\u3059\u3002GPU\u30e1\u30e2\u30ea\u30b5\u30a4\u30ba\u306b\u5fdc\u3058\u3066\u3001model\u8aad\u307f\u8fbc\u307f\u306e\u30aa\u30d7\u30b7\u30e7\u30f3\u5909\u66f4\u3067\u304d\u308b\u3088 
[&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[21],"tags":[],"class_list":{"0":"post-1706","1":"post","2":"type-post","3":"status-publish","4":"format-standard","6":"category-ai"},"_links":{"self":[{"href":"https:\/\/fukugyouhistory.tokyo\/index.php?rest_route=\/wp\/v2\/posts\/1706","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/fukugyouhistory.tokyo\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/fukugyouhistory.tokyo\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/fukugyouhistory.tokyo\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/fukugyouhistory.tokyo\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=1706"}],"version-history":[{"count":32,"href":"https:\/\/fukugyouhistory.tokyo\/index.php?rest_route=\/wp\/v2\/posts\/1706\/revisions"}],"predecessor-version":[{"id":1786,"href":"https:\/\/fukugyouhistory.tokyo\/index.php?rest_route=\/wp\/v2\/posts\/1706\/revisions\/1786"}],"wp:attachment":[{"href":"https:\/\/fukugyouhistory.tokyo\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=1706"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/fukugyouhistory.tokyo\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=1706"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/fukugyouhistory.tokyo\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=1706"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}