{"id":14921,"date":"2013-09-17T21:00:58","date_gmt":"2013-09-17T12:00:58","guid":{"rendered":"http:\/\/www.sssg.org\/blogs\/hiro345\/?p=14921"},"modified":"2013-09-18T20:02:20","modified_gmt":"2013-09-18T11:02:20","slug":"java%e3%81%ae%e5%bd%a2%e6%85%8b%e7%b4%a0%e8%a7%a3%e6%9e%90sen%e3%82%92%e4%bd%bf%e3%81%84%e3%81%9f%e3%81%84%e6%99%82%e3%81%ab%e3%81%af","status":"publish","type":"post","link":"https:\/\/www.hiro345.net\/blogs\/hiro345\/archives\/14921.html","title":{"rendered":"Java\u306e\u5f62\u614b\u7d20\u89e3\u6790Sen\u3092\u4f7f\u3044\u305f\u3044\u6642\u306b\u306f"},"content":{"rendered":"<p>Java\u306e\u5f62\u614b\u7d20\u89e3\u6790Sen\u3092\u4f7f\u3044\u305f\u3044\u6642\u306b\u306f\u3001svn.java.net\u304b\u3089\u30c1\u30a7\u30c3\u30af\u30a2\u30a6\u30c8\u3057\u3066\u81ea\u5206\u3067\u30d3\u30eb\u30c9\u3059\u308c\u3070\u826f\u3044\u3088\u3046\u3067\u3059\u3002Mecab\u3068\u304b\u4e45\u3057\u3076\u308a\u306b\u307f\u305f\u306e\u3067Mecab\u306eJava\u79fb\u690d\u7248\u3067\u3042\u308bSen\u306b\u3064\u3044\u3066\u8abf\u3079\u3066\u307f\u305f\u3089\u3001zip\u304c\u5165\u624b\u3067\u304d\u306a\u304f\u306a\u3063\u3066\u3044\u307e\u3057\u305f\u3002<a href=\"https:\/\/java.net\/projects\/sen\">Sen &#8211; Project Kenai<\/a>\u306f\u307e\u3060\u898b\u308c\u307e\u3059\u306d\u3002LGPL-2.1\u306e\u30e9\u30a4\u30bb\u30f3\u30b9\u3067\u3059\u3002<br \/>\n<!--more--><br \/>\niconv\u3057\u3066\u3044\u308b\u306e\u306f\u8b66\u544a\u304c\u51fa\u306a\u3044\u3088\u3046\u306b\u3057\u3066\u3044\u308b\u3060\u3051\u306a\u306e\u3067\u5b9f\u884c\u3057\u306a\u304f\u3066\u3082\u304b\u307e\u3044\u307e\u305b\u3093\u3002ipadic\u306f\u914d\u5e03\u7528URL\u304c\u5909\u308f\u3063\u3066\u3044\u307e\u3057\u305f\u3002<\/p>\n<pre class=\"brush: bash; gutter: true\">\r\n$ svn co https:\/\/svn.java.net\/svn\/sen~svn\/tags\/SEN_1_2_2_1\/sen\r\n$ cd sen\r\n$ iconv -f Windows-31J -t EUC-JP src\/java\/net\/java\/sen\/SenUtils.java &gt; SenUtils.java\r\n$ ant\r\n$ cd dic\r\n$ sed -i &#039;s%http:\/\/chasen.aist-nara.ac.jp\/stable\/ipadic%http:\/\/chasen.naist.jp\/stable\/ipadic%&#039; build.xml\r\n$ ant\r\n<\/pre>\n<p>\u3068\u3044\u3046\u3053\u3068\u3067\u624b\u5143\u306b\u6b8b\u3057\u3066\u304a\u304d\u307e\u3057\u305f\u3002\u3053\u308c\u3067\u3044\u3064\u3067\u3082\u4f7f\u3048\u308b\uff08\u306f\u305a\uff09\u3002<\/p>\n<p>Sen\u304c\u306a\u304f\u3066\u3082\u3001\u300c<a href=\"http:\/\/www.mwsoft.jp\/programming\/munou\/lucene_gosen.html\">Java\u88fd\u5f62\u614b\u7d20\u89e3\u6790\u30e9\u30a4\u30d6\u30e9\u30ea\u300clucene-gosen\u300d\u3092\u8a66\u3057\u3066\u307f\u308b<\/a>\u300d\u3068\u304b\u3001\u300c<a href=\"http:\/\/www.mwsoft.jp\/programming\/lucene\/kuromoji.html\">Java\u88fd\u5f62\u614b\u7d20\u89e3\u6790\u5668\u300cKuromoji\u300d\u3092\u8a66\u3057\u3066\u307f\u308b<\/a>\u300d\u3068\u304b\u3001\u300c<a href=\"http:\/\/www.mwsoft.jp\/programming\/munou\/igo_install.html\">Java\u88fd\u5f62\u614b\u7d20\u89e3\u6790\u30a8\u30f3\u30b8\u30f3\u300cIgo\u300d\u3092\u8a66\u3057\u3066\u307f\u308b<\/a>\u300d\u3068\u304b\u898b\u308b\u3068\u3001\u8272\u3005\u3042\u308a\u307e\u3059\u304b\u3089\u3001\u305d\u3061\u3089\u3092\u4f7f\u3046\u3068\u3044\u3044\u304b\u3082\u3057\u308c\u307e\u305b\u3093\u3002<\/p>\n<p><a href=\"http:\/\/chasen-legacy.sourceforge.jp\/\">chasen legacy &#8212; an old morphological analyzer<\/a>\u3068\u304b\u3001<a href=\"http:\/\/nlp.ist.i.kyoto-u.ac.jp\/index.php?JUMAN\">JUMAN &#8211; KUROHASHI-KAWAHARA LAB<\/a>\u3001<a href=\"http:\/\/www.phontron.com\/kytea\/index-ja.html\">KyTea (\u4eac\u90fd\u30c6\u30ad\u30b9\u30c8\u89e3\u6790\u30c4\u30fc\u30eb\u30ad\u30c3\u30c8)<\/a>\u3001<a href=\"http:\/\/kakasi.namazu.org\/\">KAKASI &#8211; \u6f22\u5b57\u2192\u304b\u306a(\u30ed\u30fc\u30de\u5b57)\u5909\u63db\u30d7\u30ed\u30b0\u30e9\u30e0<\/a>\u3068\u304b\u5f62\u614b\u7d20\u89e3\u6790\u306f\u6b74\u53f2\u304c\u3042\u308a\u307e\u3059\u306d\u3002KAKASI\u304cSKK\u306e\u9006\u6587\u5b57\u304b\u3089\u304d\u3066\u3044\u308b\u3068\u306f\u77e5\u308a\u307e\u305b\u3093\u3067\u3057\u305f\u3002<\/p>\n<p>\u3053\u3046\u3044\u3046\u6b74\u53f2\u306e\u4e2d\u3067\u300c<a href=\"http:\/\/mecab.googlecode.com\/svn\/trunk\/mecab\/doc\/index.html\">MeCab: Yet Another Part-of-Speech and Morphological Analyzer<\/a>\u300d\u3082\u300c<a href=\"http:\/\/code.google.com\/p\/lucene-gosen\/\">lucene-gosen &#8211; Japanese analysis for Apache Lucene\/Solr 3.6 and 4.4 &#8211; Google Project Hosting<\/a>\u300d\u3082\u66f4\u65b0\u304c\u7d9a\u3044\u3066\u3044\u308b\u306e\u306f\u3001\u51c4\u3044\u3067\u3059\u306d\u3002<\/p>\n<ul>\n<li><a type=\"amzn\" asin=\"4873114705\">\u5165\u9580 \u81ea\u7136\u8a00\u8a9e\u51e6\u7406<\/a><\/li>\n<li><a type=\"amzn\" asin=\"4774141755\">Apache Solr\u5165\u9580 \u2015\u30aa\u30fc\u30d7\u30f3\u30bd\u30fc\u30b9\u5168\u6587\u691c\u7d22\u30a8\u30f3\u30b8\u30f3<\/a><\/li>\n<li><a type=\"amzn\" asin=\"4339024511\">\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306e\u57fa\u790e <\/a><\/li>\n<li><a type=\"amzn\" asin=\"4873115132\">\u5165\u9580 \u30bd\u30fc\u30b7\u30e3\u30eb\u30c7\u30fc\u30bf \u2015\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0\u3001\u5206\u6790\u3001\u53ef\u8996\u5316\u306e\u30c6\u30af\u30cb\u30c3\u30af <\/a><\/li>\n<li><a type=\"amzn\" asin=\"4873113644\">\u96c6\u5408\u77e5\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0<\/a><\/li>\n<\/ul>\n<div>\n<iframe loading=\"lazy\" style=\"width: 120px; height: 240px;\" src=\"\/\/rcm-jp.amazon.co.jp\/e\/cm?t=hiro345-22&amp;o=9&amp;p=8&amp;l=as1&amp;asins=4873114705&amp;ref=tf_til&amp;fc1=000000&amp;IS2=1&amp;lt1=_blank&amp;m=amazon&amp;lc1=0000FF&amp;bc1=000000&amp;bg1=FFFFFF&amp;f=ifr\" height=\"240\" width=\"320\" frameborder=\"0\" marginwidth=\"0\" marginheight=\"0\" scrolling=\"no\"><\/iframe><iframe loading=\"lazy\" style=\"width: 120px; height: 240px;\" src=\"\/\/rcm-jp.amazon.co.jp\/e\/cm?t=hiro345-22&amp;o=9&amp;p=8&amp;l=as1&amp;asins=4774141755&amp;ref=tf_til&amp;fc1=000000&amp;IS2=1&amp;lt1=_blank&amp;m=amazon&amp;lc1=0000FF&amp;bc1=000000&amp;bg1=FFFFFF&amp;f=ifr\" height=\"240\" width=\"320\" frameborder=\"0\" marginwidth=\"0\" marginheight=\"0\" scrolling=\"no\"><\/iframe><iframe loading=\"lazy\" style=\"width: 120px; height: 240px;\" src=\"\/\/rcm-jp.amazon.co.jp\/e\/cm?t=hiro345-22&amp;o=9&amp;p=8&amp;l=as1&amp;asins=4339024511&amp;ref=tf_til&amp;fc1=000000&amp;IS2=1&amp;lt1=_blank&amp;m=amazon&amp;lc1=0000FF&amp;bc1=000000&amp;bg1=FFFFFF&amp;f=ifr\" height=\"240\" width=\"320\" frameborder=\"0\" marginwidth=\"0\" marginheight=\"0\" scrolling=\"no\"><\/iframe><iframe loading=\"lazy\" style=\"width: 120px; height: 240px;\" src=\"\/\/rcm-jp.amazon.co.jp\/e\/cm?t=hiro345-22&amp;o=9&amp;p=8&amp;l=as1&amp;asins=4873115132&amp;ref=tf_til&amp;fc1=000000&amp;IS2=1&amp;lt1=_blank&amp;m=amazon&amp;lc1=0000FF&amp;bc1=000000&amp;bg1=FFFFFF&amp;f=ifr\" height=\"240\" width=\"320\" frameborder=\"0\" marginwidth=\"0\" marginheight=\"0\" scrolling=\"no\"><\/iframe><iframe loading=\"lazy\" style=\"width: 120px; height: 240px;\" src=\"\/\/rcm-jp.amazon.co.jp\/e\/cm?t=hiro345-22&amp;o=9&amp;p=8&amp;l=as1&amp;asins=4873113644&amp;ref=tf_til&amp;fc1=000000&amp;IS2=1&amp;lt1=_blank&amp;m=amazon&amp;lc1=0000FF&amp;bc1=000000&amp;bg1=FFFFFF&amp;f=ifr\" height=\"240\" width=\"320\" frameborder=\"0\" marginwidth=\"0\" marginheight=\"0\" scrolling=\"no\"><\/iframe>\n<\/div>\n","protected":false},"excerpt":{"rendered":"<p>Java\u306e\u5f62\u614b\u7d20\u89e3\u6790Sen\u3092\u4f7f\u3044\u305f\u3044\u6642\u306b\u306f\u3001svn.java.net\u304b\u3089\u30c1\u30a7\u30c3\u30af\u30a2\u30a6\u30c8\u3057\u3066\u81ea\u5206\u3067\u30d3\u30eb\u30c9\u3059\u308c\u3070\u826f\u3044\u3088\u3046\u3067\u3059\u3002Mecab\u3068\u304b\u4e45\u3057\u3076\u308a\u306b\u307f\u305f\u306e\u3067Mecab\u306eJava\u79fb\u690d\u7248\u3067\u3042\u308bSen\u306b\u3064\u3044\u3066\u8abf\u3079\u3066\u307f\u305f\u3089\u3001zip &hellip; <a href=\"https:\/\/www.hiro345.net\/blogs\/hiro345\/archives\/14921.html\">\u7d9a\u304d\u3092\u8aad\u3080 <span class=\"meta-nav\">&rarr;<\/span><\/a><\/p>\n","protected":false},"author":2,"featured_media":0,"comment_status":"closed","ping_status":"closed","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[2],"tags":[],"class_list":["post-14921","post","type-post","status-publish","format-standard","hentry","category-java"],"_links":{"self":[{"href":"https:\/\/www.hiro345.net\/blogs\/hiro345\/wp-json\/wp\/v2\/posts\/14921","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/www.hiro345.net\/blogs\/hiro345\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/www.hiro345.net\/blogs\/hiro345\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/www.hiro345.net\/blogs\/hiro345\/wp-json\/wp\/v2\/users\/2"}],"replies":[{"embeddable":true,"href":"https:\/\/www.hiro345.net\/blogs\/hiro345\/wp-json\/wp\/v2\/comments?post=14921"}],"version-history":[{"count":5,"href":"https:\/\/www.hiro345.net\/blogs\/hiro345\/wp-json\/wp\/v2\/posts\/14921\/revisions"}],"predecessor-version":[{"id":14930,"href":"https:\/\/www.hiro345.net\/blogs\/hiro345\/wp-json\/wp\/v2\/posts\/14921\/revisions\/14930"}],"wp:attachment":[{"href":"https:\/\/www.hiro345.net\/blogs\/hiro345\/wp-json\/wp\/v2\/media?parent=14921"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/www.hiro345.net\/blogs\/hiro345\/wp-json\/wp\/v2\/categories?post=14921"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/www.hiro345.net\/blogs\/hiro345\/wp-json\/wp\/v2\/tags?post=14921"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}