{"id":1241,"date":"2024-04-28T11:32:42","date_gmt":"2024-04-28T11:32:42","guid":{"rendered":"https:\/\/www.nicekj.com\/?p=1241"},"modified":"2024-04-28T11:33:42","modified_gmt":"2024-04-28T11:33:42","slug":"jinyong61xingdaimaniyenengconglingxunliandamoxing","status":"publish","type":"post","link":"https:\/\/www.nicekj.com\/jinyong61xingdaimaniyenengconglingxunliandamoxing.html","title":{"rendered":"\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u4f60\u4e5f\u80fd\u4ece\u96f6\u8bad\u7ec3\u5927\u6a21\u578b"},"content":{"rendered":"<p>\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" src=\"https:\/\/www.nicekj.com\/wp-content\/uploads\/replace\/fc79fc001103347ab5427178cdcd6f26.png\" alt=\"\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u4f60\u4e5f\u80fd\u4ece\u96f6\u8bad\u7ec3\u5927\u6a21\u578b\" \/><\/figure>\n<\/p>\n<p>\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" src=\"https:\/\/www.nicekj.com\/wp-content\/uploads\/replace\/70bdf6078fa2c549a8ec5ddb811f06fb.png\" alt=\"\u52a8\u56fe\u5c01\u9762\" \/><\/figure>\n<\/p>\n<p>\u817e\u5c0f\u4e91\u5bfc\u8bfb<\/p>\n<p>\u672c\u6587\u5e76\u975e\u57fa\u4e8e\u5fae\u8c03\u8bad\u7ec3\u6a21\u578b\uff0c\u800c\u662f\u4ece\u5934\u5f00\u59cb\u8bad\u7ec3\u51fa\u4e00\u4e2a\u5168\u65b0\u7684\u5927\u8bed\u8a00\u6a21\u578b\u7684\u786c\u6838\u6559\u7a0b\u3002\u770b\u5b8c\u672c\u7bc7\uff0c\u4f60\u5c06\u4e86\u89e3\u8bad\u7ec3\u51fa\u4e00\u4e2a\u5927\u6a21\u578b\u7684\u73af\u5883\u51c6\u5907\u3001\u6570\u636e\u51c6\u5907\uff0c\u751f\u6210\u5206\u8bcd\uff0c\u6a21\u578b\u8bad\u7ec3\u3001\u6d4b\u8bd5\u6a21\u578b\u7b49\u73af\u8282\u5206\u522b\u9700\u8981\u505a\u4ec0\u4e48\u3002AI \u5c0f\u767d\u53cb\u597d~\u6587\u4e2d\u4ee3\u7801\u53ef\u4ee5\u76f4\u63a5\u5b9e\u64cd\u8fd0\u884c\u3002\u6b22\u8fce\u9605\u8bfb\u4f53\u9a8c\u3002<\/p>\n<p>\u76ee\u5f55<\/p>\n<p>1 \u51c6\u5907\u8bad\u7ec3\u73af\u5883<\/p>\n<p>2 \u51c6\u5907\u8bad\u7ec3\u6570\u636e<\/p>\n<p>3 \u8bad\u7ec3\u5206\u8bcd\u5668<\/p>\n<p>4 
\u8bad\u7ec3\u6a21\u578b<\/p>\n<p>5 \u6d4b\u8bd5\u6a21\u578b<\/p>\n<p>6 \u5b8c\u6574\u4ee3\u7801<\/p>\n<p>\u901a\u8fc7\u8fd9\u7bc7\u6587\u7ae0\uff0c\u4f60\u53ef\u4ee5\u9884\u8bad\u7ec3\u4e00\u4e2a\u5168\u65b0\u5927\u8bed\u8a00\u6a21\u578b\u3002<\/p>\n<p><strong>\u6ce8\u610f\u662f\u5168\u65b0\u7684\u6a21\u578b\uff0c\u4e0d\u662f\u5fae\u8c03\u3002<\/strong><\/p>\n<p>\u5168\u65b0\u8bad\u7ec3\u7684\u597d\u5904\u662f\u8bad\u7ec3\u7684\u6570\u636e\u3001\u8bad\u7ec3\u7684\u53c2\u6570\u90fd\u662f\u53ef\u4fee\u6539\u7684\uff0c\u901a\u8fc7\u8c03\u8bd5\u8fd0\u884c\u6211\u4eec\u53ef\u4ee5\u66f4\u597d\u7684\u7406\u89e3\u5927\u6a21\u578b\u8bad\u7ec3\u8fc7\u7a0b\u3002\u6211\u4eec\u53ef\u4ee5\u7528\u7279\u5b9a\u7c7b\u578b\u6570\u636e\u7684\u8bad\u7ec3\uff0c\u6765\u5b8c\u6210\u7279\u5b9a\u7c7b\u578b\u6570\u636e\u7684\u8f93\u51fa\u3002<\/p>\n<p>\u5173\u4e8e\u5927\u6a21\u578b\u5df2\u7ecf\u6709\u5f88\u591a\u6587\u7ae0\uff0c\u5fae\u8c03\u6a21\u578b\u7684\u6587\u7ae0\u6bd4\u8f83\u591a\uff0c\u5168\u65b0\u9884\u8bad\u7ec3\u5168\u65b0\u6a21\u578b\u7684\u6587\u7ae0\u5f88\u5c11\u3002\u4e2a\u4eba\u89c9\u5f97\u6709\u7684\u4e5f\u8bb2\u7684\u5f88\u590d\u6742\uff0c\u4ee3\u7801\u4e5f\u5f88\u96be\u8dd1\u901a\u3002\u672c\u6587\u4e0d\u4f1a\u8bb2\u7684\u5f88\u590d\u6742\uff0c\u4ee3\u7801\u4e5f\u5f88\u5bb9\u6613\u8fd0\u884c\u3002\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u5c31\u80fd\u8bad\u7ec3\u51fa\u4e00\u4e2a\u5168\u65b0\u5927\u8bed\u8a00\u6a21\u578b\u3002<\/p>\n<p>\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" src=\"https:\/\/www.nicekj.com\/wp-content\/uploads\/replace\/57cc37c667f3f038f4bbfb2594466c26.png\" alt=\"\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u4f60\u4e5f\u80fd\u4ece\u96f6\u8bad\u7ec3\u5927\u6a21\u578b\" \/><\/figure>\n<\/p>\n<p>\u672c\u6587\u4ee5\u4ee3\u7801\u4e3a\u4e3b\uff0c\u8fd0\u884c\u4ee3\u7801\u9700\u8981 Python \u73af\u5883\u3002<\/p>\n<h2 
data-id=\"heading-0\">01\u3001\u51c6\u5907\u8bad\u7ec3\u73af\u5883<\/h2>\n<p>\u6211\u7684\u8bad\u7ec3\u73af\u5883\u57fa\u4e8e\u817e\u8baf\u4e91\u7684 GPU \u673a\u5668\u3002<\/p>\n<p>\u5730\u5740\uff1a<a href=\"https:\/\/link.juejin.cn?target=https%3A%2F%2Flink.zhihu.com%2F%3Ftarget%3Dhttps%253A%2F%2Fcloud.tencent.com%2Fproduct%2Fgpu\" target=\"_blank\" title=\"https:\/\/link.zhihu.com\/?target=https%3A\/\/cloud.tencent.com\/product\/gpu\" ref=\"nofollow noopener noreferrer\" rel=\"noopener\">cloud.tencent.com\/product\/gpu<\/a><\/p>\n\n\n\n\n\n\n<table><thead><tr><th>GPU\u7c7b\u578b\uff1aGN7.2XLARGE32 T4 \u663e\u5361\uff1a1\u9897 \u663e\u5b58\uff1a16GB\uff1b python 3.11\uff1b requirements.txt:<\/th><\/tr><\/thead><\/table>\n<pre><\/div><div class=\"code-block-extension-headerRight\"><span class=\"code-block-extension-lang\">ini<\/span><div class=\"code-block-extension-copyCodeBtn\">\u590d\u5236\u4ee3\u7801<\/div><\/div><\/div><code class=\"hljs language-ini code-block-extension-codeShowNum\" lang=\"ini\"><span class=\"code-block-extension-codeLine\" data-line-num=\"1\"><span class=\"hljs-attr\">tokenizers<\/span>==<span class=\"hljs-number\">0.13<\/span>.<span class=\"hljs-number\">3<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"2\"><span class=\"hljs-attr\">torch<\/span>==<span class=\"hljs-number\">2.0<\/span>.<span class=\"hljs-number\">1<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"3\"><span class=\"hljs-attr\">transformers<\/span>==<span class=\"hljs-number\">4.30<\/span>.<span class=\"hljs-number\">2<\/span><\/span>\n<\/code><\/pre>\n<h2 data-id=\"heading-1\">02\u3001\u51c6\u5907\u8bad\u7ec3\u6570\u636e<\/h2>\n<p>\u9996\u5148\u6211\u4eec\u8981\u4e3a\u8bad\u7ec3\u51c6\u5907\u6570\u636e\uff0c\u6bd4\u5982\u6211\u5c31\u60f3\u57fa\u4e8e\u300a\u4e09\u56fd\u6f14\u4e49\u300b\u8bad\u7ec3\u4e00\u4e2a\u6a21\u578b\u3002\u4e09\u56fd\u6f14\u4e49\u4e0b\u8f7d\u5730\u5740\uff1a<\/p>\n<p><a 
href=\"https:\/\/link.juejin.cn?target=https%3A%2F%2Flink.zhihu.com%2F%3Ftarget%3Dhttps%253A%2F%2Fraw.githubusercontent.com%2Fxinzhanguo%2Fhellollm%2Fmain%2Ftext%2Fsanguoyanyi.txt\" target=\"_blank\" title=\"https:\/\/link.zhihu.com\/?target=https%3A\/\/raw.githubusercontent.com\/xinzhanguo\/hellollm\/main\/text\/sanguoyanyi.txt\" ref=\"nofollow noopener noreferrer\" rel=\"noopener\">raw.githubusercontent.com\/xinzhanguo\/\u2026<\/a><\/p>\n<p>\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" src=\"https:\/\/www.nicekj.com\/wp-content\/uploads\/replace\/89ef7bd66a4d70b71c04d8ba39c55d42.png\" alt=\"\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u4f60\u4e5f\u80fd\u4ece\u96f6\u8bad\u7ec3\u5927\u6a21\u578b\" \/><\/figure>\n<\/p>\n<h2 data-id=\"heading-2\">03\u3001\u8bad\u7ec3\u5206\u8bcd\u5668<\/h2>\n<p>\u5206\u8bcd\uff08tokenization\uff09\u662f\u628a\u8f93\u5165\u6587\u672c\u5207\u5206\u6210\u6709\u610f\u4e49\u7684\u5b50\u5355\u5143\uff08tokens\uff09\u3002\u901a\u8fc7\u4ee5\u4e0b\u4ee3\u7801\uff0c\u6839\u636e\u6211\u4eec\u7684\u6570\u636e\u751f\u6210\u4e00\u4e2a\u65b0\u7684\u5206\u8bcd\u5668\uff1a<\/p>\n<pre><\/div><div class=\"code-block-extension-headerRight\"><span class=\"code-block-extension-lang\">python<\/span><div class=\"code-block-extension-copyCodeBtn\">\u590d\u5236\u4ee3\u7801<\/div><\/div><\/div><code class=\"hljs language-python code-block-extension-codeShowNum\" lang=\"python\"><span class=\"code-block-extension-codeLine\" data-line-num=\"1\"><span class=\"hljs-keyword\">from<\/span> tokenizers <span class=\"hljs-keyword\">import<\/span> Tokenizer<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"2\"><span class=\"hljs-keyword\">from<\/span> tokenizers.models <span class=\"hljs-keyword\">import<\/span> BPE<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"3\"><span class=\"hljs-keyword\">from<\/span> tokenizers.trainers <span class=\"hljs-keyword\">import<\/span> BpeTrainer<\/span>\n<span 
class=\"code-block-extension-codeLine\" data-line-num=\"4\"><span class=\"hljs-keyword\">from<\/span> tokenizers.normalizers <span class=\"hljs-keyword\">import<\/span> NFKC, <span class=\"hljs-type\">Sequence<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"5\"><span class=\"hljs-keyword\">from<\/span> tokenizers.pre_tokenizers <span class=\"hljs-keyword\">import<\/span> ByteLevel<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"6\"><span class=\"hljs-keyword\">from<\/span> tokenizers.decoders <span class=\"hljs-keyword\">import<\/span> ByteLevel <span class=\"hljs-keyword\">as<\/span> ByteLevelDecoder<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"7\"><span class=\"hljs-keyword\">from<\/span> transformers <span class=\"hljs-keyword\">import<\/span> GPT2TokenizerFast<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"8\"><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"9\"><span class=\"hljs-comment\"># \u6784\u5efa\u5206\u8bcd\u5668 GPT2 \u57fa\u4e8e BPE \u7b97\u6cd5\u5b9e\u73b0<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"10\">tokenizer = Tokenizer(BPE(unk_token=<span class=\"hljs-string\">\"&lt;unk&gt;\"<\/span>))<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"11\">tokenizer.normalizer = <span class=\"hljs-type\">Sequence<\/span>([NFKC()])<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"12\">tokenizer.pre_tokenizer = ByteLevel()<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"13\">tokenizer.decoder = ByteLevelDecoder()<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"14\"><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"15\">special_tokens = [<span class=\"hljs-string\">\"&lt;s&gt;\"<\/span>,<span class=\"hljs-string\">\"&lt;pad&gt;\"<\/span>,<span 
class=\"hljs-string\">\"&lt;\/s&gt;\"<\/span>,<span class=\"hljs-string\">\"&lt;unk&gt;\"<\/span>,<span class=\"hljs-string\">\"&lt;mask&gt;\"<\/span>]<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"16\">trainer = BpeTrainer(vocab_size=<span class=\"hljs-number\">50000<\/span>, show_progress=<span class=\"hljs-literal\">True<\/span>, initial_alphabet=ByteLevel.alphabet(), special_tokens=special_tokens)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"17\"><span class=\"hljs-comment\"># \u521b\u5efa text \u6587\u4ef6\u5939\uff0c\u5e76\u628a sanguoyanyi.txt \u4e0b\u8f7d\uff0c\u653e\u5230\u76ee\u5f55\u91cc<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"18\">files = [<span class=\"hljs-string\">\"text\/sanguoyanyi.txt\"<\/span>]<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"19\"><span class=\"hljs-comment\"># \u5f00\u59cb\u8bad\u7ec3\u4e86<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"20\">tokenizer.train(files, trainer)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"21\"><span class=\"hljs-comment\"># \u628a\u8bad\u7ec3\u7684\u5206\u8bcd\u901a\u8fc7GPT2\u4fdd\u5b58\u8d77\u6765\uff0c\u4ee5\u65b9\u4fbf\u540e\u7eed\u4f7f\u7528<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"22\">newtokenizer = GPT2TokenizerFast(tokenizer_object=tokenizer)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"23\">newtokenizer.save_pretrained(<span class=\"hljs-string\">\".\/sanguo\"<\/span>)<\/span>\n<\/code><\/pre>\n<p>\u8fd0\u884c\u65f6\u663e\u793a\u5982\u4e0b\u56fe\uff1a<\/p>\n<p>\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" src=\"https:\/\/www.nicekj.com\/wp-content\/uploads\/replace\/54e8c182a1991389f65e3bd3228063a3.png\" alt=\"\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u4f60\u4e5f\u80fd\u4ece\u96f6\u8bad\u7ec3\u5927\u6a21\u578b\" 
\/><\/figure>\n<\/p>\n<p>\u6210\u529f\u8fd0\u884c\u4ee3\u7801\u540e\uff0c\u6211\u4eec\u5728 sanguo \u76ee\u5f55\u751f\u6210\u5982\u4e0b\u6587\u4ef6\uff1a<\/p>\n<pre><\/div><div class=\"code-block-extension-headerRight\"><span class=\"code-block-extension-lang\"><\/span><div class=\"code-block-extension-copyCodeBtn\">\u590d\u5236\u4ee3\u7801<\/div><\/div><\/div><code class=\"hljs code-block-extension-codeShowNum\"><span class=\"code-block-extension-codeLine\" data-line-num=\"1\">merges.txt<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"2\">special_tokens_map.json<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"3\">tokenizer.json<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"4\">tokenizer_config.json<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"5\">vocab.json<\/span>\n<\/code><\/pre>\n<p>\u73b0\u5728\u6211\u4eec\u5df2\u7ecf\u6210\u529f\u8bad\u7ec3\u4e86\u4e00\u4e2a\u5927\u8bed\u8a00\u6a21\u578b\u7684\u5206\u8bcd\u5668\u3002<\/p>\n<h2 data-id=\"heading-3\">04\u3001\u8bad\u7ec3\u6a21\u578b<\/h2>\n<p>\u5229\u7528\u4e0b\u9762\u4ee3\u7801\u8fdb\u884c\u6a21\u578b\u8bad\u7ec3\uff1a<\/p>\n<pre><\/div><div class=\"code-block-extension-headerRight\"><span class=\"code-block-extension-lang\">ini<\/span><div class=\"code-block-extension-copyCodeBtn\">\u590d\u5236\u4ee3\u7801<\/div><\/div><\/div><code class=\"hljs language-ini code-block-extension-codeShowNum\" lang=\"ini\"><span class=\"code-block-extension-codeLine\" data-line-num=\"1\">from transformers import GPT2Config, GPT2LMHeadModel, GPT2Tokenizer<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"2\"><span class=\"hljs-comment\"># \u52a0\u8f7d\u5206\u8bcd\u5668<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"3\"><span class=\"hljs-attr\">tokenizer<\/span> = GPT2Tokenizer.from_pretrained(<span class=\"hljs-string\">\".\/sanguo\"<\/span>)<\/span>\n<span 
class=\"code-block-extension-codeLine\" data-line-num=\"4\">tokenizer.add_special_tokens({<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"5\">  \"eos_token\": \"&lt;\/s&gt;\",<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"6\">  \"bos_token\": \"&lt;s&gt;\",<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"7\">  \"unk_token\": \"&lt;unk&gt;\",<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"8\">  \"pad_token\": \"&lt;pad&gt;\",<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"9\">  \"mask_token\": \"&lt;mask&gt;\"<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"10\">})<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"11\"><span class=\"hljs-comment\"># \u914d\u7f6eGPT2\u6a21\u578b\u53c2\u6570<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"12\"><span class=\"hljs-attr\">config<\/span> = GPT2Config(<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"13\">  <span class=\"hljs-attr\">vocab_size<\/span>=tokenizer.vocab_size,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"14\">  <span class=\"hljs-attr\">bos_token_id<\/span>=tokenizer.bos_token_id,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"15\">  <span class=\"hljs-attr\">eos_token_id<\/span>=tokenizer.eos_token_id<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"16\">)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"17\"><span class=\"hljs-comment\"># \u521b\u5efa\u6a21\u578b<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"18\"><span class=\"hljs-attr\">model<\/span> = GPT2LMHeadModel(config)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"19\"><span class=\"hljs-comment\"># \u8bad\u7ec3\u6570\u636e\u6211\u4eec\u7528\u6309\u884c\u5206\u5272<\/span><\/span>\n<span 
class=\"code-block-extension-codeLine\" data-line-num=\"20\">from transformers import LineByLineTextDataset<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"21\"><span class=\"hljs-attr\">dataset<\/span> = LineByLineTextDataset(<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"22\">    <span class=\"hljs-attr\">tokenizer<\/span>=tokenizer,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"23\">    <span class=\"hljs-attr\">file_path<\/span>=<span class=\"hljs-string\">\".\/text\/sanguoyanyi.txt\"<\/span>,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"24\">    <span class=\"hljs-attr\">block_size<\/span>=<span class=\"hljs-number\">32<\/span>,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"25\">  <span class=\"hljs-comment\"># \u5982\u679c\u8bad\u7ec3\u65f6\u4f60\u7684\u663e\u5b58\u4e0d\u591f<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"26\">  <span class=\"hljs-comment\"># \u53ef\u4ee5\u9002\u5f53\u8c03\u5c0f block_size<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"27\">)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"28\">from transformers import DataCollatorForLanguageModeling<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"29\"><span class=\"hljs-attr\">data_collator<\/span> = DataCollatorForLanguageModeling(<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"30\">    <span class=\"hljs-attr\">tokenizer<\/span>=tokenizer, mlm=<span class=\"hljs-literal\">False<\/span>, mlm_probability=<span class=\"hljs-number\">0.15<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"31\">)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"32\"><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"33\">from transformers import Trainer, TrainingArguments<\/span>\n<span 
class=\"code-block-extension-codeLine\" data-line-num=\"34\"><span class=\"hljs-comment\"># \u914d\u7f6e\u8bad\u7ec3\u53c2\u6570<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"35\"><span class=\"hljs-attr\">training_args<\/span> = TrainingArguments(<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"36\">    <span class=\"hljs-attr\">output_dir<\/span>=<span class=\"hljs-string\">\".\/output\"<\/span>,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"37\">    <span class=\"hljs-attr\">overwrite_output_dir<\/span>=<span class=\"hljs-literal\">True<\/span>,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"38\">    <span class=\"hljs-attr\">num_train_epochs<\/span>=<span class=\"hljs-number\">20<\/span>,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"39\">    <span class=\"hljs-attr\">per_gpu_train_batch_size<\/span>=<span class=\"hljs-number\">16<\/span>,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"40\">    <span class=\"hljs-attr\">save_steps<\/span>=<span class=\"hljs-number\">2000<\/span>,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"41\">    <span class=\"hljs-attr\">save_total_limit<\/span>=<span class=\"hljs-number\">2<\/span>,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"42\">)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"43\"><span class=\"hljs-attr\">trainer<\/span> = Trainer(<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"44\">    <span class=\"hljs-attr\">model<\/span>=model,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"45\">    <span class=\"hljs-attr\">args<\/span>=training_args,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"46\">    <span class=\"hljs-attr\">data_collator<\/span>=data_collator,<\/span>\n<span class=\"code-block-extension-codeLine\" 
data-line-num=\"47\">    <span class=\"hljs-attr\">train_dataset<\/span>=dataset,<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"48\">)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"49\">trainer.train()<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"50\"><span class=\"hljs-comment\"># \u4fdd\u5b58\u6a21\u578b<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"51\">model.save_pretrained('.\/sanguo')<\/span>\n<\/code><\/pre>\n<p>\u8fd0\u884c\u6bd4\u8f83\u8017\u65f6\uff0c\u663e\u793a\u8bad\u7ec3\u6570\u636e\u5982\u4e0b\u56fe\uff1a<\/p>\n<p>\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" src=\"https:\/\/www.nicekj.com\/wp-content\/uploads\/replace\/77a50b0a8312f4a6580ab885bcf38473.png\" alt=\"\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u4f60\u4e5f\u80fd\u4ece\u96f6\u8bad\u7ec3\u5927\u6a21\u578b\" \/><\/figure>\n<\/p>\n<p>\u6210\u529f\u8fd0\u884c\u4ee3\u7801\uff0c\u6211\u4eec\u53d1\u73b0 sanguo \u76ee\u5f55\u4e0b\u9762\u591a\u4e86\u4e09\u4e2a\u6587\u4ef6\uff1a<\/p>\n<pre><\/div><div class=\"code-block-extension-headerRight\"><span class=\"code-block-extension-lang\">arduino<\/span><div class=\"code-block-extension-copyCodeBtn\">\u590d\u5236\u4ee3\u7801<\/div><\/div><\/div><code class=\"hljs language-arduino code-block-extension-codeShowNum\" lang=\"arduino\"><span class=\"code-block-extension-codeLine\" data-line-num=\"1\">config.json<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"2\">generation_config.json<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"3\">pytorch_model.bin<\/span>\n<\/code><\/pre>\n<p>\u73b0\u5728\u6211\u4eec\u5c31\u6210\u529f\u751f\u6210\u8bad\u7ec3\u51fa\u57fa\u4e8e\u300a\u4e09\u56fd\u6f14\u4e49\u300b\u7684\u4e00\u4e2a\u5927\u8bed\u8a00\u6a21\u578b\u3002<\/p>\n<h2 
data-id=\"heading-4\">05\u3001\u6d4b\u8bd5\u6a21\u578b<\/h2>\n<p>\u6211\u4eec\u7528\u6587\u672c\u751f\u6210\uff0c\u5bf9\u6a21\u578b\u8fdb\u884c\u6d4b\u8bd5\u4ee3\u7801\u5982\u4e0b\uff1a<\/p>\n<pre><\/div><div class=\"code-block-extension-headerRight\"><span class=\"code-block-extension-lang\">scss<\/span><div class=\"code-block-extension-copyCodeBtn\">\u590d\u5236\u4ee3\u7801<\/div><\/div><\/div><code class=\"hljs language-scss code-block-extension-codeShowNum\" lang=\"scss\"><span class=\"code-block-extension-codeLine\" data-line-num=\"1\">from transformers import pipeline, set_seed<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"2\">generator = <span class=\"hljs-built_in\">pipeline<\/span>('text-generation', model='.\/sanguo')<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"3\"><span class=\"hljs-built_in\">set_seed<\/span>(<span class=\"hljs-number\">42<\/span>)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"4\">txt = <span class=\"hljs-built_in\">generator<\/span>(\"\u5415\u5e03\", max_length=<span class=\"hljs-number\">10<\/span>)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"5\"><span class=\"hljs-built_in\">print<\/span>(txt)<\/span>\n<\/code><\/pre>\n<p>\u8fd0\u884c\u663e\u793a\u6a21\u578b\u8f93\u51fa\u4e86\u4e09\u56fd\u76f8\u5173\u7684\u6587\u672c\uff1a\u201c\u5415\u5e03\u5341\u4e8c\u56de \u5f20\u7ffc\u5fb7 \u5f20\u7ffc\u5fb7\u65f6\u66f9\u64cd \u6b66\u4faf\u8ba1\u8ba1\u8ba1\u201d<\/p>\n<p>\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" src=\"https:\/\/www.nicekj.com\/wp-content\/uploads\/replace\/bc47c27589e92c0bff2e4b14f07d9134.png\" alt=\"\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u4f60\u4e5f\u80fd\u4ece\u96f6\u8bad\u7ec3\u5927\u6a21\u578b\" \/><\/figure>\n<\/p>\n<p>\u518d\u6d4b\u8bd5\u4e00\u6761\uff1a<\/p>\n<pre><\/div><div class=\"code-block-extension-headerRight\"><span class=\"code-block-extension-lang\">scss<\/span><div 
class=\"code-block-extension-copyCodeBtn\">\u590d\u5236\u4ee3\u7801<\/div><\/div><\/div><code class=\"hljs language-scss code-block-extension-codeShowNum\" lang=\"scss\"><span class=\"code-block-extension-codeLine\" data-line-num=\"1\">txt = <span class=\"hljs-built_in\">generator<\/span>(\"\u63a5\u7740\u594f\u4e50\", max_length=<span class=\"hljs-number\">10<\/span>)<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"2\"><span class=\"hljs-built_in\">print<\/span>(txt)<\/span>\n<\/code><\/pre>\n<p>&#8220;\u63a5\u7740\u594f\u4e50\u3000\u5374\u8bf4\u66f9\u64cd\u5f15\u519b\u56e0\u4e8c\u4eba&#8221;<\/p>\n<p>\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" src=\"https:\/\/www.nicekj.com\/wp-content\/uploads\/replace\/b62749cba2b2061c9e1474c14ea0ccdf.png\" alt=\"\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u4f60\u4e5f\u80fd\u4ece\u96f6\u8bad\u7ec3\u5927\u6a21\u578b\" \/><\/figure>\n<\/p>\n<p>\u8fd9\u5185\u5bb9\u4e0d\u5fcd\u76f4\u89c6\uff0c\u5982\u679c\u60f3\u4f18\u5316\uff0c\u6211\u4eec\u4e5f\u53ef\u4ee5\u57fa\u4e8e\u5168\u65b0\u7684\u6a21\u578b\u8fdb\u884c\u5fae\u8c03\u8bad\u7ec3\uff1b\u6211\u4eec\u4e5f\u53ef\u4ee5\u9002\u5f53\u5730\u8c03\u6574\u4e0b\u8bad\u7ec3\u53c2\u6570\uff0c\u4ee5\u8fbe\u5230\u8f83\u597d\u7684\u6548\u679c\u3002<\/p>\n<h2 data-id=\"heading-5\">06\u3001\u5b8c\u6574\u4ee3\u7801<\/h2>\n<p>\u4ee5\u4e0b\u662f\u5b8c\u6574\u4ee3\u7801\uff0c\u4ee3\u7801\u5730\u5740\uff1a<\/p>\n<p><a href=\"https:\/\/link.juejin.cn?target=https%3A%2F%2Flink.zhihu.com%2F%3Ftarget%3Dhttps%253A%2F%2Fgithub.com%2Fxinzhanguo%2Fhellollm%2Fblob%2Fmain%2Fsanguo.py\" target=\"_blank\" title=\"https:\/\/link.zhihu.com\/?target=https%3A\/\/github.com\/xinzhanguo\/hellollm\/blob\/main\/sanguo.py\" ref=\"nofollow noopener noreferrer\" rel=\"noopener\">github.com\/xinzhanguo\/\u2026<\/a><\/p>\n<p>linux \u4e2d\u8fd0\u884c\u65b9\u6cd5\uff1a<\/p>\n<pre><\/div><div class=\"code-block-extension-headerRight\"><span 
class=\"code-block-extension-lang\">bash<\/span><div class=\"code-block-extension-copyCodeBtn\">\u590d\u5236\u4ee3\u7801<\/div><\/div><\/div><code class=\"hljs language-bash code-block-extension-codeShowNum\" lang=\"bash\"><span class=\"code-block-extension-codeLine\" data-line-num=\"1\"><span class=\"hljs-comment\"># \u521b\u5efa\u73af\u5883<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"2\">python3 -m venv ~\/.env<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"3\"><span class=\"hljs-comment\"># \u52a0\u8f7d\u73af\u5883<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"4\"><span class=\"hljs-built_in\">source<\/span> ~\/.env\/bin\/activate<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"5\"><span class=\"hljs-comment\"># \u4e0b\u8f7d\u4ee3\u7801<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"6\">git <span class=\"hljs-built_in\">clone<\/span> git@github.com:xinzhanguo\/hellollm.git<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"7\"><span class=\"hljs-built_in\">cd<\/span> hellollm<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"8\"><span class=\"hljs-comment\"># \u5b89\u88c5\u4f9d\u8d56<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"9\">pip install -r requirements.txt<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"10\"><span class=\"hljs-comment\"># \u8fd0\u884c\u4ee3\u7801<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"11\">python sanguo.py<\/span>\n<\/code><\/pre>\n<p>\u4ee5\u4e0a\u6211\u4eec\u5c31\u5b8c\u6210\u4e00\u4e2a\u5168\u65b0\u7684\u6a21\u578b\u8bad\u7ec3\u3002\u4ee3\u7801\u53bb\u9664\u6ce8\u91ca\u7a7a\u884c\u603b\u517161\u884c\u3002<\/p>\n<p>\u672c\u6587\u4ee3\u7801\u6a21\u578b\u662f\u57fa\u4e8e GPT2 \u7684\uff0c\u5f53\u7136\u4f60\u4e5f\u53ef\u4ee5\u57fa\u4e8e LLama \u6216\u8005 Bert 
\u7b49\u6a21\u578b\u53bb\u5b9e\u73b0\u5168\u65b0\u7684\u5927\u8bed\u8a00\u6a21\u578b\u3002<\/p>\n<p>\u4ee3\u7801\u867d\u7136\u4e0d\u662f\u5f88\u591a\uff0c\u4f46\u662f\u5982\u679c\u521d\u6b21\u5c1d\u8bd5\u8fd0\u884c\u7684\u8bdd\u4f60\u4e5f\u8bb8\u4f1a\u9047\u5230\u5f88\u591a\u95ee\u9898\uff0c\u6bd4\u5982\u73af\u5883\u642d\u5efa\u3002\u4e3a\u4e86\u907f\u514d\u5176\u4ed6\u70e6\u607c\uff0c\u6211\u5efa\u8bae\u7528 docker \u65b9\u5f0f\u8fd0\u884c\u4ee3\u7801:<\/p>\n<pre><\/div><div class=\"code-block-extension-headerRight\"><span class=\"code-block-extension-lang\">bash<\/span><div class=\"code-block-extension-copyCodeBtn\">\u590d\u5236\u4ee3\u7801<\/div><\/div><\/div><code class=\"hljs language-bash code-block-extension-codeShowNum\" lang=\"bash\"><span class=\"code-block-extension-codeLine\" data-line-num=\"1\"><span class=\"hljs-comment\"># \u4e0b\u8f7d\u4ee3\u7801<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"2\">git <span class=\"hljs-built_in\">clone<\/span> git@github.com:xinzhanguo\/hellollm.git<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"3\"><span class=\"hljs-built_in\">cd<\/span> hellollm<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"4\"><span class=\"hljs-comment\"># \u7f16\u8bd1\u955c\u50cf<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"5\">docker build -t hellollm:beta .<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"6\"><span class=\"hljs-comment\"># \u53ef\u4ee5\u9009\u62e9\u4ee5GPU\u65b9\u5f0f\u8fd0\u884c<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"7\"><span class=\"hljs-comment\"># docker run -it --gpus all hellollm:beta sh<\/span><\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"8\">docker run -it hellollm:beta sh<\/span>\n<span class=\"code-block-extension-codeLine\" data-line-num=\"9\">python 
sanguo.py<\/span>\n<\/code><\/pre>\n<p>\u66f4\u591a\u4ee3\u7801\u53ef\u4ee5\u53c2\u8003\uff1aHello LLM!<\/p>\n<p><a href=\"https:\/\/link.juejin.cn?target=https%3A%2F%2Flink.zhihu.com%2F%3Ftarget%3Dhttps%253A%2F%2Fgithub.com%2Fxinzhanguo%2Fhellollm\" target=\"_blank\" title=\"https:\/\/link.zhihu.com\/?target=https%3A\/\/github.com\/xinzhanguo\/hellollm\" ref=\"nofollow noopener noreferrer\" rel=\"noopener\">github.com\/xinzhanguo\/\u2026<\/a><\/p>\n<p>\u4ee5\u4e0a\u5c31\u662f\u672c\u7bc7\u6587\u7ae0\u7684\u5168\u90e8\u5185\u5bb9\uff0c\u6b22\u8fce\u8f6c\u53d1\u5206\u4eab\u3002<\/p>\n<p>-End-<\/p>\n<p>\u539f\u521b\u4f5c\u8005\uff5c\u8f9b\u5360\u56fd<\/p>\n<p>\u6280\u672f\u8d23\u7f16\uff5cjipingjia<\/p>\n<p>\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" src=\"https:\/\/www.nicekj.com\/wp-content\/uploads\/replace\/095318599eea02e1b0449e8db9d6aed9.png\" alt=\"\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u4f60\u4e5f\u80fd\u4ece\u96f6\u8bad\u7ec3\u5927\u6a21\u578b\" \/><\/figure>\n<\/p>\n<p>\u4f60\u89c9\u5f97\u5927\u6a21\u578b\u6709\u54ea\u4e9b\u5e94\u7528\u573a\u666f\uff1f\u6b22\u8fce\u5728<a href=\"https:\/\/link.juejin.cn?target=https%3A%2F%2Fcloud.tencent.com%2Fdeveloper%2Ftools%2Fexternal-entry%3Fchannel%3Djuejin%26id%3D31\" target=\"_blank\" title=\"https:\/\/cloud.tencent.com\/developer\/tools\/external-entry?channel=juejin&amp;id=31\" ref=\"nofollow noopener noreferrer\" rel=\"noopener\">\u817e\u8baf\u4e91\u5f00\u53d1\u8005\u516c\u4f17\u53f7<\/a>\u8bc4\u8bba\u533a\u8ba8\u8bba\u3002\u6211\u4eec\u5c06\u9009\u53d61\u5219\u6700\u6709\u610f\u4e49\u7684\u5206\u4eab\uff0c\u9001\u51fa\u817e\u8baf\u4e91\u5f00\u53d1\u8005 &#8211; \u9a6c\u514b\u676f1\u4e2a\uff08\u89c1\u4e0b\u56fe\uff09\u30027\u670824\u65e5\u4e2d\u534812\u70b9\u5f00\u5956\u3002<\/p>\n<p>\n<figure class=\"wp-block-image size-large\"><img decoding=\"async\" src=\"https:\/\/www.nicekj.com\/wp-content\/uploads\/replace\/22bcfb016a6568d585101d222c444407.png\" 
alt=\"\u4ec5\u752861\u884c\u4ee3\u7801\uff0c\u4f60\u4e5f\u80fd\u4ece\u96f6\u8bad\u7ec3\u5927\u6a21\u578b\" \/><\/figure>\n<\/p>","protected":false},"excerpt":{"rendered":"<p>\u672c\u6587\u5e76\u975e\u57fa\u4e8e\u5fae\u8c03\u8bad\u7ec3\u6a21\u578b\uff0c\u800c\u662f\u4ece\u5934\u5f00\u59cb\u8bad\u7ec3\u51fa\u4e00\u4e2a\u5168\u65b0\u7684\u5927\u8bed\u8a00\u6a21\u578b\u7684\u786c\u6838\u6559\u7a0b\u3002\u770b\u5b8c\u672c\u7bc7\uff0c\u4f60\u5c06\u4e86\u89e3\u8bad\u7ec3\u51fa\u4e00\u4e2a\u5927\u6a21\u578b\u7684\u73af\u5883\u51c6\u5907\u3001\u6570\u636e\u51c6\u5907\uff0c\u751f\u6210\u5206\u8bcd\uff0c\u6a21\u578b\u8bad\u7ec3\u3001\u6d4b\u8bd5\u6a21\u578b\u7b49\u73af\u8282\u5206\u522b\u9700\u8981\u505a\u4ec0\u4e48\u3002<\/p>\n","protected":false},"author":1,"featured_media":2836,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"_acf_changed":false,"rank_math_title":"\u5927\u8bed\u8a00\u6a21\u578b\u8bad\u7ec3\uff1a\u4ece\u96f6\u5f00\u59cb\u6784\u5efaAI\u6a21\u578b - \u5948\u65af\u79d1\u6280\u793e\u533a","rank_math_description":"\u8fd9\u7bc7\u6559\u7a0b\u63d0\u4f9b\u4e86\u4ece\u96f6\u5f00\u59cb\u8bad\u7ec3\u5168\u65b0\u5927\u8bed\u8a00\u6a21\u578b\u7684\u6307\u5357\uff0c\u6db5\u76d6\u73af\u5883\u51c6\u5907\u3001\u6570\u636e\u9884\u5904\u7406\u3001\u6a21\u578b\u8bad\u7ec3\u548c\u6d4b\u8bd5\u7b49\u5173\u952e\u6b65\u9aa4\uff0c\u5e2e\u52a9\u60a8\u7406\u89e3\u548c\u6784\u5efa\u81ea\u5df1\u7684AI\u6a21\u578b\u3002","rank_math_focus_keyword":"\u5927\u8bed\u8a00\u6a21\u578b, \u6a21\u578b\u8bad\u7ec3, \u81ea\u7136\u8bed\u8a00\u5904\u7406, AI, 
GPT","views":"49","footnotes":""},"categories":[3],"tags":[128,129,136,126,127],"collection":[],"class_list":["post-1241","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-fenlei2","tag-128","tag-129","tag-136","tag-gpt","tag-ai"],"acf":[],"_links":{"self":[{"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/posts\/1241","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/comments?post=1241"}],"version-history":[{"count":0,"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/posts\/1241\/revisions"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/media\/2836"}],"wp:attachment":[{"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/media?parent=1241"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/categories?post=1241"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/tags?post=1241"},{"taxonomy":"collection","embeddable":true,"href":"https:\/\/www.nicekj.com\/nicekj2024\/wp\/v2\/collection?post=1241"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}