{"id":1018,"date":"2021-04-12T09:05:00","date_gmt":"2021-04-12T00:05:00","guid":{"rendered":"https:\/\/technologyagency.net\/wordpress\/?p=1018"},"modified":"2021-07-05T00:26:23","modified_gmt":"2021-07-04T15:26:23","slug":"mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d","status":"publish","type":"post","link":"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\/","title":{"rendered":"mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d"},"content":{"rendered":"\n<p>\u65b0\u74b0\u5883\u3092\u69cb\u7bc9\u3059\u308b\u3068\u304d\u5fd8\u308c\u304c\u3061\u306a\u306e\u3067\u3001\u899a\u3048\u66f8\u304d\u3068\u3057\u3066\u6b8b\u3057\u3066\u304a\u304f\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">\uff11\uff0e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<\/h3>\n\n\n<div class=\"wp-block-syntaxhighlighter-code \"><pre class=\"brush: bash; title: ; notranslate\" title=\"\">\nsudo apt update\nsudo apt upgrade\nsudo apt install mecab libmecab-dev mecab-ipadic-utf8 git make\ncurl xz-utils file\nsudo apt install python3-pip\n<\/pre><\/div>\n\n<div class=\"wp-block-syntaxhighlighter-code \"><pre class=\"brush: bash; title: ; notranslate\" title=\"\">\npip3 install mecab-python3 unidic-lite neologdn\ngit clone --depth 1 https:\/\/github.com\/neologd\/mecab-ipadic-neologd.git\n<\/pre><\/div>\n\n<div class=\"wp-block-syntaxhighlighter-code \"><pre class=\"brush: bash; title: ; notranslate\" title=\"\">\necho yes | mecab-ipadic-neologd\/bin\/install-mecab-ipadic-neologd -n -a\n\nUsage:\n    $ mecab -d \/usr\/lib\/x86_64-linux-gnu\/mecab\/dic\/mecab-ipadic-neologd ...\n<\/pre><\/div>\n\n\n<h3 class=\"wp-block-heading\">\uff12\uff0e\u4f7f\u7528\u65b9\u6cd5<\/h3>\n\n\n<div class=\"wp-block-syntaxhighlighter-code \"><pre class=\"brush: python; title: ; notranslate\" title=\"\">\nimport re\nimport neologdn\nimport subprocess\nimport MeCab\n\nCONTENT_WORD_POS = (&#039;\u540d\u8a5e&#039;, &#039;\u52d5\u8a5e&#039;, &#039;\u5f62\u5bb9\u8a5e&#039;, &#039;\u5f62\u5bb9\u52d5\u8a5e&#039;, &#039;\u526f\u8a5e&#039;)\nSTOP_WORD_POS = (&#039;\u4ee3\u540d\u8a5e&#039;, &#039;\u52a9\u52d5\u8a5e&#039;, &#039;\u975e\u81ea\u7acb&#039;, &#039;\u6570&#039;, &#039;\u4eba\u540d&#039;)\n\n# \u6b63\u898f\u5316\ndef normalize(text):\n  return neologdn.normalize(re.sub(r&#039;&#x5B;0-9]+&#039;, &#039;0&#039;, text).lower())\n\n# \u5f62\u614b\u7d20\u89e3\u6790\ndef analysis(text):\n  cmd = &#039;echo `mecab-config --dicdir`&quot;\/mecab-ipadic-neologd&quot;&#039;\n  path = (subprocess.Popen(cmd, stdout=subprocess.PIPE, shell=True).communicate()&#x5B;0]).decode(&#039;utf-8&#039;)\n  tagger = MeCab.Tagger(&#039;-d {0}&#039;.format(path))\n  tagger.parse(&#039;&#039;)\n  node = tagger.parseToNode(normalize(text))\n  word = &#039;&#039;\n  pre_features = &#x5B;]\n\n  while node:\n    features = node.feature.split(&#039;,&#039;)&#x5B;:6]\n    # \u540d\u8a5e\u3001\u52d5\u8a5e\u3001\u5f62\u5bb9\u8a5e\u3001\u5f62\u5bb9\u52d5\u8a5e\u3001\u526f\u8a5e\u3067\u3042\u308b\u304b\u5224\u5b9a\n    valid = False\n    for pos in CONTENT_WORD_POS:\n      valid = pos in features or valid\n    # \u4ee5\u4e0b\u306b\u8a72\u5f53\u3059\u308b\u5834\u5408\u306f\u9664\u5916\uff08\u30b9\u30c8\u30c3\u30d7\u30ef\u30fc\u30c9\uff09\n    for pos in STOP_WORD_POS:\n      valid = (not pos in features) and valid\n    if valid:\n      if (&#039;\u540d\u8a5e\u63a5\u7d9a&#039; in pre_features and &#039;\u540d\u8a5e&#039; in features) or (&#039;\u63a5\u5c3e&#039; in features):\n        word += &#039;{0}&#039;.format(node.surface)\n      else:\n        word += &#039; {0}&#039;.format(node.surface)\n      #print(&#039;{0} {1}&#039;.format(node.surface, features))\n    pre_features = features\n    node = node.next\n  return word&#x5B;1:]\n\n<\/pre><\/div>","protected":false},"excerpt":{"rendered":"<p>\u65b0\u74b0\u5883\u3092\u69cb\u7bc9\u3059\u308b\u3068\u304d\u5fd8\u308c\u304c\u3061\u306a\u306e\u3067\u3001\u899a\u3048\u66f8\u304d\u3068\u3057\u3066\u6b8b\u3057\u3066\u304a\u304f\u3002 \uff11\uff0e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb \uff12\uff0e\u4f7f\u7528\u65b9\u6cd5<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[41],"tags":[],"class_list":["post-1018","post","type-post","status-publish","format-standard","hentry","category-python"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v27.3 - https:\/\/yoast.com\/product\/yoast-seo-wordpress\/ -->\n<title>mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d - I want to lead an easy life.<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d\/\" \/>\n<meta property=\"og:locale\" content=\"ja_JP\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d - I want to lead an easy life.\" \/>\n<meta property=\"og:description\" content=\"\u65b0\u74b0\u5883\u3092\u69cb\u7bc9\u3059\u308b\u3068\u304d\u5fd8\u308c\u304c\u3061\u306a\u306e\u3067\u3001\u899a\u3048\u66f8\u304d\u3068\u3057\u3066\u6b8b\u3057\u3066\u304a\u304f\u3002 \uff11\uff0e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb \uff12\uff0e\u4f7f\u7528\u65b9\u6cd5\" \/>\n<meta property=\"og:url\" content=\"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d\/\" \/>\n<meta property=\"og:site_name\" content=\"I want to lead an easy life.\" \/>\n<meta property=\"article:published_time\" content=\"2021-04-12T00:05:00+00:00\" \/>\n<meta property=\"article:modified_time\" content=\"2021-07-04T15:26:23+00:00\" \/>\n<meta name=\"author\" content=\"hide6644\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"\u57f7\u7b46\u8005\" \/>\n\t<meta name=\"twitter:data1\" content=\"hide6644\" \/>\n\t<meta name=\"twitter:label2\" content=\"\u63a8\u5b9a\u8aad\u307f\u53d6\u308a\u6642\u9593\" \/>\n\t<meta name=\"twitter:data2\" content=\"1\u5206\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\\\/\\\/schema.org\",\"@graph\":[{\"@type\":\"Article\",\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/2021\\\/04\\\/12\\\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\\\/#article\",\"isPartOf\":{\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/2021\\\/04\\\/12\\\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\\\/\"},\"author\":{\"name\":\"hide6644\",\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/#\\\/schema\\\/person\\\/a25355beaa102da2b2d79b00f5865b63\"},\"headline\":\"mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d\",\"datePublished\":\"2021-04-12T00:05:00+00:00\",\"dateModified\":\"2021-07-04T15:26:23+00:00\",\"mainEntityOfPage\":{\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/2021\\\/04\\\/12\\\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\\\/\"},\"wordCount\":1,\"commentCount\":0,\"articleSection\":[\"Python\"],\"inLanguage\":\"ja\",\"potentialAction\":[{\"@type\":\"CommentAction\",\"name\":\"Comment\",\"target\":[\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/2021\\\/04\\\/12\\\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\\\/#respond\"]}]},{\"@type\":\"WebPage\",\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/2021\\\/04\\\/12\\\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\\\/\",\"url\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/2021\\\/04\\\/12\\\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\\\/\",\"name\":\"mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d - I want to lead an easy life.\",\"isPartOf\":{\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/#website\"},\"datePublished\":\"2021-04-12T00:05:00+00:00\",\"dateModified\":\"2021-07-04T15:26:23+00:00\",\"author\":{\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/#\\\/schema\\\/person\\\/a25355beaa102da2b2d79b00f5865b63\"},\"breadcrumb\":{\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/2021\\\/04\\\/12\\\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\\\/#breadcrumb\"},\"inLanguage\":\"ja\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/2021\\\/04\\\/12\\\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\\\/\"]}]},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/2021\\\/04\\\/12\\\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\\\/#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"\u30db\u30fc\u30e0\",\"item\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/#website\",\"url\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/\",\"name\":\"I want to lead an easy life.\",\"description\":\"Technical Notes\",\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/?s={search_term_string}\"},\"query-input\":{\"@type\":\"PropertyValueSpecification\",\"valueRequired\":true,\"valueName\":\"search_term_string\"}}],\"inLanguage\":\"ja\"},{\"@type\":\"Person\",\"@id\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/#\\\/schema\\\/person\\\/a25355beaa102da2b2d79b00f5865b63\",\"name\":\"hide6644\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"ja\",\"@id\":\"https:\\\/\\\/secure.gravatar.com\\\/avatar\\\/a5df48aece572798f5aacd2dd90331e28bd249c13f736badb5116e3d43c5d5e9?s=96&d=mm&r=g\",\"url\":\"https:\\\/\\\/secure.gravatar.com\\\/avatar\\\/a5df48aece572798f5aacd2dd90331e28bd249c13f736badb5116e3d43c5d5e9?s=96&d=mm&r=g\",\"contentUrl\":\"https:\\\/\\\/secure.gravatar.com\\\/avatar\\\/a5df48aece572798f5aacd2dd90331e28bd249c13f736badb5116e3d43c5d5e9?s=96&d=mm&r=g\",\"caption\":\"hide6644\"},\"url\":\"https:\\\/\\\/technologyagency.net\\\/wordpress\\\/author\\\/hide6644\\\/\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. -->","yoast_head_json":{"title":"mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d - I want to lead an easy life.","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d\/","og_locale":"ja_JP","og_type":"article","og_title":"mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d - I want to lead an easy life.","og_description":"\u65b0\u74b0\u5883\u3092\u69cb\u7bc9\u3059\u308b\u3068\u304d\u5fd8\u308c\u304c\u3061\u306a\u306e\u3067\u3001\u899a\u3048\u66f8\u304d\u3068\u3057\u3066\u6b8b\u3057\u3066\u304a\u304f\u3002 \uff11\uff0e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb \uff12\uff0e\u4f7f\u7528\u65b9\u6cd5","og_url":"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d\/","og_site_name":"I want to lead an easy life.","article_published_time":"2021-04-12T00:05:00+00:00","article_modified_time":"2021-07-04T15:26:23+00:00","author":"hide6644","twitter_card":"summary_large_image","twitter_misc":{"\u57f7\u7b46\u8005":"hide6644","\u63a8\u5b9a\u8aad\u307f\u53d6\u308a\u6642\u9593":"1\u5206"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"Article","@id":"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\/#article","isPartOf":{"@id":"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\/"},"author":{"name":"hide6644","@id":"https:\/\/technologyagency.net\/wordpress\/#\/schema\/person\/a25355beaa102da2b2d79b00f5865b63"},"headline":"mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d","datePublished":"2021-04-12T00:05:00+00:00","dateModified":"2021-07-04T15:26:23+00:00","mainEntityOfPage":{"@id":"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\/"},"wordCount":1,"commentCount":0,"articleSection":["Python"],"inLanguage":"ja","potentialAction":[{"@type":"CommentAction","name":"Comment","target":["https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\/#respond"]}]},{"@type":"WebPage","@id":"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\/","url":"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\/","name":"mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d - I want to lead an easy life.","isPartOf":{"@id":"https:\/\/technologyagency.net\/wordpress\/#website"},"datePublished":"2021-04-12T00:05:00+00:00","dateModified":"2021-07-04T15:26:23+00:00","author":{"@id":"https:\/\/technologyagency.net\/wordpress\/#\/schema\/person\/a25355beaa102da2b2d79b00f5865b63"},"breadcrumb":{"@id":"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\/#breadcrumb"},"inLanguage":"ja","potentialAction":[{"@type":"ReadAction","target":["https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\/"]}]},{"@type":"BreadcrumbList","@id":"https:\/\/technologyagency.net\/wordpress\/2021\/04\/12\/mecab%e8%a8%ad%e5%ae%9a%e3%81%ae%e8%a6%9a%e3%81%88%e6%9b%b8%e3%81%8d\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"\u30db\u30fc\u30e0","item":"https:\/\/technologyagency.net\/wordpress\/"},{"@type":"ListItem","position":2,"name":"mecab\u8a2d\u5b9a\u306e\u899a\u3048\u66f8\u304d"}]},{"@type":"WebSite","@id":"https:\/\/technologyagency.net\/wordpress\/#website","url":"https:\/\/technologyagency.net\/wordpress\/","name":"I want to lead an easy life.","description":"Technical Notes","potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/technologyagency.net\/wordpress\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"ja"},{"@type":"Person","@id":"https:\/\/technologyagency.net\/wordpress\/#\/schema\/person\/a25355beaa102da2b2d79b00f5865b63","name":"hide6644","image":{"@type":"ImageObject","inLanguage":"ja","@id":"https:\/\/secure.gravatar.com\/avatar\/a5df48aece572798f5aacd2dd90331e28bd249c13f736badb5116e3d43c5d5e9?s=96&d=mm&r=g","url":"https:\/\/secure.gravatar.com\/avatar\/a5df48aece572798f5aacd2dd90331e28bd249c13f736badb5116e3d43c5d5e9?s=96&d=mm&r=g","contentUrl":"https:\/\/secure.gravatar.com\/avatar\/a5df48aece572798f5aacd2dd90331e28bd249c13f736badb5116e3d43c5d5e9?s=96&d=mm&r=g","caption":"hide6644"},"url":"https:\/\/technologyagency.net\/wordpress\/author\/hide6644\/"}]}},"_links":{"self":[{"href":"https:\/\/technologyagency.net\/wordpress\/wp-json\/wp\/v2\/posts\/1018","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/technologyagency.net\/wordpress\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/technologyagency.net\/wordpress\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/technologyagency.net\/wordpress\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/technologyagency.net\/wordpress\/wp-json\/wp\/v2\/comments?post=1018"}],"version-history":[{"count":6,"href":"https:\/\/technologyagency.net\/wordpress\/wp-json\/wp\/v2\/posts\/1018\/revisions"}],"predecessor-version":[{"id":1140,"href":"https:\/\/technologyagency.net\/wordpress\/wp-json\/wp\/v2\/posts\/1018\/revisions\/1140"}],"wp:attachment":[{"href":"https:\/\/technologyagency.net\/wordpress\/wp-json\/wp\/v2\/media?parent=1018"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/technologyagency.net\/wordpress\/wp-json\/wp\/v2\/categories?post=1018"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/technologyagency.net\/wordpress\/wp-json\/wp\/v2\/tags?post=1018"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}