{"id":10666,"date":"2023-07-30T14:30:50","date_gmt":"2023-07-30T05:30:50","guid":{"rendered":"https:\/\/www.sambuichi.jp\/?p=10666"},"modified":"2023-08-24T09:34:59","modified_gmt":"2023-08-24T00:34:59","slug":"winods10%e3%81%aepython3%e7%92%b0%e5%a2%83%e3%81%a7%e6%97%a5%e6%9c%ac%e8%aa%9e%e8%a7%a3%e6%9e%90mecab","status":"publish","type":"post","link":"https:\/\/www.sambuichi.jp\/?p=10666","title":{"rendered":"Windows10\u306ePython3\u74b0\u5883\u3067\u65e5\u672c\u8a9e\u89e3\u6790(MeCab)"},"content":{"rendered":"<p>Views: 8<\/p><div id=\"header\">\n<h1>Windows10\u306ePython3\u74b0\u5883\u3067\u65e5\u672c\u8a9e\u89e3\u6790(MeCab)<\/h1>\n<div id=\"toc\" class=\"toc2\">\n<div id=\"toctitle\">\u76ee\u6b21<\/div>\n<ul class=\"sectlevel1\">\n<li><a href=\"#_mecab\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\">1. MeCab\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<\/a><\/li>\n<li><a href=\"#_mecab_python3\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\">2. mecab-python3\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<\/a><\/li>\n<li><a href=\"#_\u8f9e\u66f8\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\">3. \u8f9e\u66f8\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<\/a><\/li>\n<li><a href=\"#_\u540d\u8a5e\u306e\u62bd\u51fa\">4. \u540d\u8a5e\u306e\u62bd\u51fa<\/a><\/li>\n<\/ul>\n<\/div>\n<\/div>\n<div id=\"content_adoc\">\n<div id=\"preamble\">\n<div class=\"sectionbody\">\n<div class=\"paragraph\">\n<p>Nobuyuki SAMBUICHI<br \/>\n<a href=\"https:\/\/www.iso.org\/committee\/5648297.html\">ISO\/TC295 Audit data services<\/a>\/SG1 Semantic model Convener<\/p>\n<\/div>\n<div class=\"paragraph\">\n<p>Windows10\u306ePython3\u74b0\u5883\u3067\u65e5\u672c\u8a9e\u89e3\u6790\u306eMeCab\u3092\u5229\u7528\u53ef\u80fd\u3068\u3057\u307e\u3057\u305f\u3002<\/p>\n<\/div>\n<\/div>\n<\/div>\n<div class=\"sect1\">\n<h2 id=\"_mecab\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\">1. 
MeCab\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<\/h2>\n<div class=\"sectionbody\">\n<div class=\"paragraph\">\n<p>MeCab\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u306b\u3001\u30cd\u30c3\u30c8\u8a18\u4e8b\u3067\u3088\u304f\u7d39\u4ecb\u3055\u308c\u3066\u3044\u308b\u6b21\u306e\u30b5\u30a4\u30c8\u304b\u3089\u30a4\u30f3\u30b9\u30c8\u30fc\u30e9\u3092\u30c0\u30a6\u30f3\u30ed\u30fc\u30c9\u3057\u307e\u3057\u305f\u3002<\/p>\n<\/div>\n<div class=\"paragraph\">\n<p><a href=\"https:\/\/github.com\/ikegami-yukino\/mecab\/releases\/tag\/v0.996.2\">https:\/\/github.com\/ikegami-yukino\/mecab\/releases\/tag\/v0.996.2<\/a><\/p>\n<\/div>\n<div class=\"imageblock\">\n<div class=\"content\">\n<img decoding=\"async\" src=\"https:\/\/www.sambuichi.jp\/wp-content\/uploads\/2023\/07\/230730Picture10.png\" alt=\"230730Picture10\">\n<\/div>\n<\/div>\n<\/div>\n<\/div>\n<div class=\"sect1\">\n<h2 id=\"_mecab_python3\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\">2. mecab-python3\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<\/h2>\n<div class=\"sectionbody\">\n<div class=\"listingblock\">\n<div class=\"content\">\n<pre class=\"highlight\"><code class=\"language-ps\" data-lang=\"ps\">pip install mecab-python3<\/code><\/pre>\n<\/div>\n<\/div>\n<div class=\"paragraph\">\n<p>\u6a19\u6e96\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3067 C:\\Program Files\\MeCab \u306b\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3057\u307e\u3057\u305f\u3002<\/p>\n<\/div>\n<\/div>\n<\/div>\n<div class=\"sect1\">\n<h2 id=\"_\u8f9e\u66f8\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\">3. 
\u8f9e\u66f8\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<\/h2>\n<div class=\"sectionbody\">\n<div class=\"paragraph\">\n<p>ChatGPT\u304c\u63d0\u6848\u3057\u3066\u304f\u308c\u305fPython\u30b3\u30fc\u30c9\u3067\u540d\u8a5e\u3092\u62bd\u51fa\u3059\u308b\u30c6\u30b9\u30c8\u30d7\u30ed\u30b0\u30e9\u30e0\u3092\u8a66\u4f5c\u3057\u305f\u3002<br \/>\n\u6b21\u306e\u7b87\u6240\u304c\u554f\u984c\u3068\u306a\u3063\u305f\u3002<\/p>\n<\/div>\n<div class=\"listingblock\">\n<div class=\"content\">\n<pre class=\"highlight\"><code class=\"language-py\" data-lang=\"py\">    # MeCab\u3092\u521d\u671f\u5316\r\n    mecab = MeCab.Tagger(\"-d C:\/path\/to\/mecab\/dic -Owakati\")  # dicrc\u306e\u30d1\u30b9\u3092\u6307\u5b9a\u3057\u3066\u304f\u3060\u3055\u3044<\/code><\/pre>\n<\/div>\n<\/div>\n<div class=\"paragraph\">\n<p>\u554f\u984c 1 \u30d1\u30b9\u4e2d\u306b\u7a7a\u767d\u304c\u3042\u308b\u305f\u3081\u30d1\u30b9\u304c\u6b63\u3057\u304f\u5224\u65ad\u3055\u308c\u306a\u3044\u3002<br \/>\n\u5bfe\u7b56 1 &#8216;\u30d1\u30b9\u6307\u5b9a&#8217;\u3068\u30b7\u30f3\u30b0\u30eb\u30af\u30a9\u30fc\u30c8\u3067\u56f2\u3063\u305f\u3002<\/p>\n<\/div>\n<div class=\"paragraph\">\n<p>\u554f\u984c 2 mecabrc\u306f\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3055\u308c\u3066\u3044\u308b\u304c\u3001dicrc\u304c\u306a\u3044\u3068\u3044\u3046\u30a8\u30e9\u30fc\u304c\u51fa\u3066\u3057\u307e\u3046\u3002<br \/>\n\u5bfe\u7b56 2 IPA\u8f9e\u66f8\u3092\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3057\u305d\u306e\u500b\u6240\u3092\u6307\u5b9a\u3057\u305f\u3002<\/p>\n<\/div>\n<div class=\"listingblock\">\n<div class=\"content\">\n<pre class=\"highlight\"><code class=\"language-ps\" data-lang=\"ps\">&gt; pip install unidic-lite<\/code><\/pre>\n<\/div>\n<\/div>\n<div class=\"listingblock\">\n<div class=\"content\">\n<pre class=\"highlight\"><code class=\"language-py\" data-lang=\"py\">    # MeCab\u3092\u521d\u671f\u5316\r\n    mecab = MeCab.Tagger(\"-d 'C:\\\\Program Files\\\\MeCab\\\\dic\\\\ipadic' -Owakati\")  # 
dicrc\u304c\u3042\u308b\u30c7\u30a3\u30ec\u30af\u30c8\u30ea\u3092\u6307\u5b9a\u3057\u3066\u304f\u3060\u3055\u3044<\/code><\/pre>\n<\/div>\n<\/div>\n<div class=\"paragraph\">\n<p>\u554f\u984c 3 \u6b63\u3057\u304f\u54c1\u8a5e\u304c\u5206\u89e3\u3055\u308c\u306a\u3044<br \/>\n\u5bfe\u7b56 3 -Owakati\u306e\u6307\u5b9a\u304c\u9593\u9055\u3044\u3002\u8336\u7b45\u3092\u6307\u5b9a\u3059\u308b\u3002<\/p>\n<\/div>\n<div class=\"listingblock\">\n<div class=\"content\">\n<pre class=\"highlight\"><code class=\"language-py\" data-lang=\"py\">    # MeCab\u3092\u521d\u671f\u5316\r\n    mecab = MeCab.Tagger(\"-d 'C:\\\\Program Files\\\\MeCab\\\\dic\\\\ipadic' -Ochasen\")  # dicrc\u304c\u3042\u308b\u30c7\u30a3\u30ec\u30af\u30c8\u30ea\u3092\u6307\u5b9a\u3057\u3066\u304f\u3060\u3055\u3044<\/code><\/pre>\n<\/div>\n<\/div>\n<\/div>\n<\/div>\n<div class=\"sect1\">\n<h2 id=\"_\u540d\u8a5e\u306e\u62bd\u51fa\">4. \u540d\u8a5e\u306e\u62bd\u51fa<\/h2>\n<div class=\"sectionbody\">\n<div class=\"paragraph\">\n<p>ChatGPT\u306f\u3001\u65e5\u672c\u8a9e\u304c\u82e6\u624b\u79d1\u76ee\u306e\u3088\u3046\u306a\u306e\u3067\u3001\u6b21\u306e\u30cd\u30c3\u30c8\u8a18\u4e8b\u3092\u53c2\u8003\u306b\u3057\u3066\u30c6\u30b9\u30c8\u30d7\u30ed\u30b0\u30e9\u30e0\u3092\u4f5c\u6210\u3057\u305f\u3002<\/p>\n<\/div>\n<div class=\"paragraph\">\n<p><a href=\"https:\/\/note.com\/junmaeda\/n\/n39b8b286da13\">https:\/\/note.com\/junmaeda\/n\/n39b8b286da13<\/a><\/p>\n<\/div>\n<div class=\"listingblock\">\n<div class=\"title\">chasentest.py<\/div>\n<div class=\"content\">\n<pre class=\"highlight\"><code class=\"language-py\" data-lang=\"py\">import MeCab\r\n\r\ntext = \"\u89e3\u6790\u3057\u305f\u3044\u30c6\u30ad\u30b9\u30c8\u3092\u5165\u308c\u308b\u3002\"\r\n# mecab = MeCab.Tagger(\"-Ochasen\")\r\nmecab = MeCab.Tagger(\"-d 'C:\\\\Program Files\\\\MeCab\\\\dic\\\\ipadic' -Ochasen\")  # dicrc\u304c\u3042\u308b\u30c7\u30a3\u30ec\u30af\u30c8\u30ea\u3092\u6307\u5b9a\u3057\u3066\u304f\u3060\u3055\u3044\r\n\r\nnouns = 
[line.split()[0] for line in mecab.parse(text).splitlines()\r\n               if \"\u540d\u8a5e\" in line.split()[-1]]\r\n\r\nfor str in nouns:\r\n   print(str)<\/code><\/pre>\n<\/div>\n<\/div>\n<div class=\"paragraph\">\n<p>mecab = MeCab.Tagger\u3000\u3067\u5f62\u614b\u7d20\u89e3\u6790\u30a8\u30f3\u30b8\u30f3\u306b\u8336\u7b45\u3092\u6307\u5b9a\u3057\u305f\u3002<br \/>\nmecab.parse(text).splitlines()\u3000\u3067\u6587\u3092\u5f62\u614b\u7d20\u5358\u4f4d\u306b\u5206\u5272\u3057\u305f\u30c7\u30fc\u30bf\u304c\u8fd4\u3055\u308c\u308b\u306e\u3067\u3001\u89e3\u6790\u30c7\u30fc\u30bf\u306e\u7d42\u308f\u308a\u306b\u3042\u308b\u54c1\u8a5e\u30c7\u30fc\u30bf\u3092\u9078\u629e\u6761\u4ef6\u3068\u3057\u3066\u300c\u540d\u8a5e\u300d\u306e\u3082\u306e\u3060\u3051\u3092\u53d6\u308a\u51fa\u3059\u51e6\u7406\u3002<\/p>\n<\/div>\n<\/div>\n<\/div>\n<\/div>\n<div id=\"footer\">\n<div id=\"footer-text\">\nLast updated 2023-07-30 14:40:21 +0900\n<\/div>\n<\/div>\n","protected":false},"excerpt":{"rendered":"<p>Views: 8 Windows10\u306ePython3\u74b0\u5883\u3067\u65e5\u672c\u8a9e\u89e3\u6790(MeCab) \u76ee\u6b21 1. MeCab\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb 2. mecab-python3\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb 3. \u8f9e\u66f8\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb 4. 
\u540d\u8a5e\u306e\u62bd\u51fa Nobu [&hellip;]<\/p>\n","protected":false},"author":2,"featured_media":10658,"comment_status":"open","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":[],"categories":[11],"tags":[],"_links":{"self":[{"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=\/wp\/v2\/posts\/10666"}],"collection":[{"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=\/wp\/v2\/users\/2"}],"replies":[{"embeddable":true,"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=10666"}],"version-history":[{"count":3,"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=\/wp\/v2\/posts\/10666\/revisions"}],"predecessor-version":[{"id":10815,"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=\/wp\/v2\/posts\/10666\/revisions\/10815"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=\/wp\/v2\/media\/10658"}],"wp:attachment":[{"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=10666"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=10666"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.sambuichi.jp\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=10666"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}