{"id":612,"date":"2024-05-03T00:04:29","date_gmt":"2024-05-02T15:04:29","guid":{"rendered":"https:\/\/chocottopro.com\/?p=612"},"modified":"2024-05-03T00:04:29","modified_gmt":"2024-05-02T15:04:29","slug":"%e3%80%90python%e3%80%91%e3%81%9f%e3%81%a3%e3%81%9f10%e8%a1%8c%e3%81%ae%e3%82%b3%e3%83%bc%e3%83%89%e3%81%a7%e3%81%a7%e3%81%8d%e3%82%8b%ef%bc%81nltk%e3%81%a8%e3%83%8d%e3%82%ac%e3%83%9d%e3%82%b8","status":"publish","type":"post","link":"https:\/\/chocottopro.com\/?p=612","title":{"rendered":"\u3010Python\u3011\u305f\u3063\u305f10\u884c\u306e\u30b3\u30fc\u30c9\u3067\u3067\u304d\u308b\uff01NLTK\u3068\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u306e\u5b9f\u8df5\u5165\u9580"},"content":{"rendered":"\n<p>Python\u3067AI\u3084\u6a5f\u68b0\u5b66\u7fd2\u306b\u53d6\u308a\u7d44\u3080\u4e0a\u3067\u3001\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306f\u907f\u3051\u3066\u901a\u308c\u306a\u3044\u5206\u91ce\u3067\u3059\u3002\u4e2d\u3067\u3082\u3001\u30c6\u30ad\u30b9\u30c8\u30c7\u30fc\u30bf\u304b\u3089\u611f\u60c5\u3092\u62bd\u51fa\u3059\u308b\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u306f\u3001\u30d3\u30b8\u30cd\u30b9\u3067\u306e\u6d3b\u7528\u5834\u9762\u304c\u591a\u304f\u3001\u6ce8\u76ee\u3092\u96c6\u3081\u3066\u3044\u307e\u3059\u3002\u672c\u8a18\u4e8b\u3067\u306f\u3001Python\u306e\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u30e9\u30a4\u30d6\u30e9\u30ea\u3067\u3042\u308bNLTK\u3092\u4f7f\u3063\u3066\u3001\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u306e\u57fa\u790e\u304b\u3089\u5fdc\u7528\u307e\u3067\u3092\u4e01\u5be7\u306b\u89e3\u8aac\u3057\u307e\u3059\u3002\u5b9f\u969b\u306e\u30b3\u30fc\u30c9\u4f8b\u3092\u4ea4\u3048\u306a\u304c\u3089\u3001\u30b9\u30c6\u30c3\u30d7\u30d0\u30a4\u30b9\u30c6\u30c3\u30d7\u3067\u5b66\u3093\u3067\u3044\u304d\u307e\u3057\u3087\u3046\u3002<\/p>\n\n\n\n<div class=\"wp-block-sgb-block-simple sgb-box-simple sgb-box-simple--title-normal sgb-box-simple--with-border\"><div style=\"background-color:var(--wp--preset--color--sango-main);color:#FFF\" 
class=\"sgb-box-simple__title\">\u3053\u306e\u8a18\u4e8b\u3092\u8aad\u3093\u3060\u3089\u308f\u304b\u308b\u3053\u3068<\/div><div class=\"sgb-box-simple__body\" style=\"border-color:var(--wp--preset--color--sango-main);background-color:#FFF\">\n<ul class=\"wp-block-list\">\n<li>NLTK\u306e\u6982\u8981\u3068\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306b\u304a\u3051\u308b\u4f4d\u7f6e\u3065\u3051 <\/li>\n\n\n\n<li>NLTK\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u65b9\u6cd5\u3068\u57fa\u672c\u7684\u306a\u4f7f\u3044\u65b9 <\/li>\n\n\n\n<li>\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u306e\u6982\u8981\u3068\u30d3\u30b8\u30cd\u30b9\u6d3b\u7528\u4f8b <\/li>\n\n\n\n<li>NLTK\u3092\u4f7f\u3063\u305f\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u306e\u5b9f\u88c5\u65b9\u6cd5 <\/li>\n\n\n\n<li>\u524d\u51e6\u7406\u306e\u30c6\u30af\u30cb\u30c3\u30af\u3068\u30cd\u30ac\u30dd\u30b8\u5224\u5b9a\u306e\u30ab\u30b9\u30bf\u30de\u30a4\u30ba\u65b9\u6cd5 <\/li>\n\n\n\n<li>\u4ed6\u306e\u611f\u60c5\u5206\u6790\u624b\u6cd5\u3068\u306e\u6bd4\u8f03\u3068\u4f7f\u3044\u5206\u3051\u65b9 <\/li>\n\n\n\n<li>\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u306e\u3055\u3089\u306a\u308b\u5b66\u7fd2\u30b9\u30c6\u30c3\u30d7\u3068\u30ea\u30bd\u30fc\u30b9<\/li>\n<\/ul>\n<\/div><\/div>\n\n\n\n<div class=\"toc\">\n    <div id=\"toc_container\" 
class=\"sgb-toc--bullets js-smooth-scroll\" data-dialog-title=\"Table of Contents\">\n      <p class=\"toc_title\">\u76ee\u6b21 <\/p>\n      <ul class=\"toc_list\">  <li class=\"first\">    <a href=\"#i-0\">NLTK\u3068\u306f\u4f55\u304b\uff1f\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u30e9\u30a4\u30d6\u30e9\u30ea\u306e\u6982\u8981<\/a>    <ul class=\"menu_level_1\">      <li class=\"first\">        <a href=\"#i-1\">NLTK\u304c\u30b5\u30dd\u30fc\u30c8\u3059\u308b\u4e3b\u306a\u6a5f\u80fd<\/a>      <\/li>      <li class=\"last\">        <a href=\"#i-2\">NLTK\u306e\u30e1\u30ea\u30c3\u30c8\u3068\u30e6\u30fc\u30b9\u30b1\u30fc\u30b9<\/a>      <\/li>    <\/ul>  <\/li>  <li>    <a href=\"#i-3\">NLTK\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3068\u57fa\u672c\u7684\u306a\u4f7f\u3044\u65b9<\/a>    <ul class=\"menu_level_1\">      <li class=\"first\">        <a href=\"#i-4\">pip install nltk\u3067\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u624b\u9806<\/a>      <\/li>      <li class=\"last\">        <a href=\"#i-5\">\u983b\u51fa\u306eNLTK\u57fa\u672c\u64cd\u4f5c\u30b3\u30fc\u30c9\u4f8b<\/a>      <\/li>    <\/ul>  <\/li>  <li>    <a href=\"#i-6\">Sentiment Analysis\uff08\u611f\u60c5\u5206\u6790\uff09\u5165\u9580<\/a>    <ul class=\"menu_level_1\">      <li class=\"first\">        <a href=\"#i-7\">\u611f\u60c5\u5206\u6790\u306e\u6982\u8981\u3068\u30d3\u30b8\u30cd\u30b9\u6d3b\u7528\u4f8b<\/a>      <\/li>      <li class=\"last\">        <a href=\"#i-8\">NLTK\u306b\u3088\u308b\u611f\u60c5\u5206\u6790\u306e\u30a2\u30d7\u30ed\u30fc\u30c1<\/a>      <\/li>    <\/ul>  <\/li>  <li>    <a href=\"#i-9\">NLTK\u3067\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u3092\u5b9f\u88c5\u3057\u3066\u307f\u3088\u3046<\/a>    <ul class=\"menu_level_1\">      <li class=\"first\">        <a href=\"#i-10\">VADER Lexicon\u3092\u7528\u3044\u305f\u30cd\u30ac\u30dd\u30b8\u5206\u6790<\/a>      <\/li>      <li>        <a href=\"#i-11\">MovieReview\u30c7\u30fc\u30bf\u3092\u4f7f\u3063\u305f\u5206\u6790\u306e\u6d41\u308c<\/a>      
<\/li>      <li class=\"last\">        <a href=\"#i-12\">\u7c21\u5358\u306a\u30cd\u30ac\u30dd\u30b8\u5224\u5b9a\u30d7\u30ed\u30b0\u30e9\u30e0\u3092\u5b9f\u88c5<\/a>      <\/li>    <\/ul>  <\/li>  <li>    <a href=\"#i-13\">NLTK\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u306eTips\uff06\u767a\u5c55\u7684\u30c8\u30d4\u30c3\u30af<\/a>    <ul class=\"menu_level_1\">      <li class=\"first\">        <a href=\"#i-14\">\u524d\u51e6\u7406\u306e\u30dd\u30a4\u30f3\u30c8\u3068\u30b3\u30fc\u30c9\u30b5\u30f3\u30d7\u30eb<\/a>      <\/li>      <li>        <a href=\"#i-15\">\u30cd\u30ac\u30dd\u30b8\u5224\u5b9a\u30ed\u30b8\u30c3\u30af\u306e\u30ab\u30b9\u30bf\u30de\u30a4\u30ba<\/a>      <\/li>      <li class=\"last\">        <a href=\"#i-16\">\u4ed6\u306e\u611f\u60c5\u5206\u6790\u624b\u6cd5\u3068\u306e\u6bd4\u8f03\u3068\u4f7f\u3044\u5206\u3051<\/a>      <\/li>    <\/ul>  <\/li>  <li class=\"last\">    <a href=\"#i-17\">\u307e\u3068\u3081\uff1aNLTK\u3067\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u3092\u30de\u30b9\u30bf\u30fc\u3057\u3088\u3046<\/a>  <\/li><\/ul>\n      \n    <\/div><\/div><h2 class=\"wp-block-heading\" id=\"i-0\">NLTK\u3068\u306f\u4f55\u304b\uff1f\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u30e9\u30a4\u30d6\u30e9\u30ea\u306e\u6982\u8981<\/h2>\n\n\n\n<p>Python\u3067AI\u3084\u6a5f\u68b0\u5b66\u7fd2\u306b\u53d6\u308a\u7d44\u3080\u4e0a\u3067\u3001\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\uff08NLP\uff09\u306f\u5916\u305b\u306a\u3044\u5206\u91ce\u3067\u3059\u3002\u30c6\u30ad\u30b9\u30c8\u30c7\u30fc\u30bf\u3092\u6271\u3046\u969b\u306b\u306f\u3001\u524d\u51e6\u7406\u3084\u8a00\u8a9e\u7684\u306a\u7279\u5fb4\u91cf\u62bd\u51fa\u306a\u3069\u3001\u5c02\u9580\u7684\u306a\u51e6\u7406\u304c\u5fc5\u8981\u306b\u306a\u308a\u307e\u3059\u3002\u305d\u3093\u306aNLP\u30bf\u30b9\u30af\u3092\u3001Python\u3067\u624b\u8efd\u306b\u5b9f\u73fe\u3057\u3066\u304f\u308c\u308b\u306e\u304c\u3001NLTK\uff08Natural Language 
Toolkit\uff09\u3067\u3059\u3002<\/p>\n\n\n\n<p>NLTK\u306f\u3001\u6559\u80b2\u7528\u30fb\u7814\u7a76\u7528\u306b\u958b\u767a\u3055\u308c\u305f\u30aa\u30fc\u30d7\u30f3\u30bd\u30fc\u30b9\u306ePython\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u30e9\u30a4\u30d6\u30e9\u30ea\u3067\u3059\u3002\u30c6\u30ad\u30b9\u30c8\u306e\u524d\u51e6\u7406\u3001\u54c1\u8a5e\u30bf\u30ae\u30f3\u30b0\u3001\u69cb\u6587\u89e3\u6790\u3001\u610f\u5473\u89e3\u6790\u306a\u3069\u3001\u5e45\u5e83\u3044NLP\u30bf\u30b9\u30af\u306b\u5bfe\u5fdc\u3057\u3066\u3044\u307e\u3059\u3002\u521d\u5b66\u8005\u306b\u3082\u4f7f\u3044\u3084\u3059\u3044\u3088\u3046\u300150\u4ee5\u4e0a\u306e\u30b3\u30fc\u30d1\u30b9\u3068\u8a9e\u5f59\u30ea\u30bd\u30fc\u30b9\u304c\u540c\u68b1\u3055\u308c\u3066\u304a\u308a\u3001\u5145\u5b9f\u3057\u305f\u30c1\u30e5\u30fc\u30c8\u30ea\u30a2\u30eb\u3084\u66f8\u7c4d\u3082\u3042\u308b\u306e\u304c\u7279\u5fb4\u3067\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" id=\"i-1\">NLTK\u304c\u30b5\u30dd\u30fc\u30c8\u3059\u308b\u4e3b\u306a\u6a5f\u80fd<\/h3>\n\n\n\n<p>NLTK\u306f\u591a\u6a5f\u80fd\u306a\u30e9\u30a4\u30d6\u30e9\u30ea\u3067\u3059\u304c\u3001\u4e2d\u3067\u3082\u983b\u7e41\u306b\u4f7f\u308f\u308c\u308b\u306e\u304c\u4ee5\u4e0b\u306e\u6a5f\u80fd\u3067\u3059\u3002<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>Tokenization\uff08\u30c8\u30fc\u30af\u30f3\u5316\uff09: \u30c6\u30ad\u30b9\u30c8\u3092\u5358\u8a9e\u3084\u6587\u7ae0\u306b\u5206\u5272\u3057\u307e\u3059\u3002<\/li>\n\n\n\n<li>POS Tagging\uff08\u54c1\u8a5e\u30bf\u30ae\u30f3\u30b0\uff09: \u5358\u8a9e\u306e\u54c1\u8a5e\u3092\u8b58\u5225\u3057\u307e\u3059\u3002<\/li>\n\n\n\n<li>Named Entity Recognition\uff08\u56fa\u6709\u8868\u73fe\u8a8d\u8b58\uff09: \u4eba\u540d\u3001\u5730\u540d\u3001\u7d44\u7e54\u540d\u306a\u3069\u3092\u62bd\u51fa\u3057\u307e\u3059\u3002<\/li>\n\n\n\n<li>Text Classification\uff08\u30c6\u30ad\u30b9\u30c8\u5206\u985e\uff09: 
\u30c6\u30ad\u30b9\u30c8\u3092\u30ab\u30c6\u30b4\u30ea\u306b\u81ea\u52d5\u5206\u985e\u3057\u307e\u3059\u3002<\/li>\n\n\n\n<li>Sentiment Analysis\uff08\u611f\u60c5\u5206\u6790\uff09: \u30c6\u30ad\u30b9\u30c8\u306e\u611f\u60c5\u3084\u30aa\u30d4\u30cb\u30aa\u30f3\u3092\u5224\u5b9a\u3057\u307e\u3059\u3002<\/li>\n<\/ul>\n\n\n\n<p>\u3053\u308c\u3089\u306e\u6a5f\u80fd\u3092\u7d44\u307f\u5408\u308f\u305b\u308c\u3070\u3001\u30c6\u30ad\u30b9\u30c8\u30c7\u30fc\u30bf\u3092\u81ea\u52d5\u7684\u306b\u6574\u7406\u3057\u3001\u5206\u6790\u3067\u304d\u308b\u3088\u3046\u306b\u306a\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" id=\"i-2\">NLTK\u306e\u30e1\u30ea\u30c3\u30c8\u3068\u30e6\u30fc\u30b9\u30b1\u30fc\u30b9<\/h3>\n\n\n\n<p>NLTK\u306e\u5927\u304d\u306a\u5f37\u307f\u306f\u3001\u5b66\u7fd2\u30ea\u30bd\u30fc\u30b9\u304c\u8c4a\u5bcc\u306a\u3053\u3068\u3002\u30c1\u30e5\u30fc\u30c8\u30ea\u30a2\u30eb\u3092\u9032\u3081\u3066\u3044\u304f\u3060\u3051\u3067\u3001\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306e\u57fa\u672c\u304c\u8eab\u306b\u3064\u304d\u307e\u3059\u3002\u307e\u305f\u3001\u82f1\u8a9e\u3060\u3051\u3067\u306a\u304f\u591a\u8a00\u8a9e\u306b\u5bfe\u5fdc\u3057\u3066\u3044\u308b\u306e\u3082\u9b45\u529b\u3067\u3059\u3002<\/p>\n\n\n\n<p>\u5b9f\u969b\u306e\u30e6\u30fc\u30b9\u30b1\u30fc\u30b9\u3068\u3057\u3066\u306f\u3001\u4ee5\u4e0b\u306e\u3088\u3046\u306a\u3082\u306e\u304c\u6319\u3052\u3089\u308c\u307e\u3059\u3002<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u6587\u66f8\u306e\u81ea\u52d5\u30ab\u30c6\u30b4\u30ea\u5206\u985e: \u30cb\u30e5\u30fc\u30b9\u8a18\u4e8b\u3084\u30e1\u30fc\u30eb\u306a\u3069\u3092\u3001\u30c8\u30d4\u30c3\u30af\u3054\u3068\u306b\u81ea\u52d5\u3067\u632f\u308a\u5206\u3051<\/li>\n\n\n\n<li>\u5546\u54c1\u30ec\u30d3\u30e5\u30fc\u306e\u611f\u60c5\u5206\u6790: 
\u30e6\u30fc\u30b6\u30fc\u306e\u8a55\u4fa1\u3092\u80af\u5b9a\u30fb\u5426\u5b9a\u306b\u5206\u985e\u3057\u3001\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0\u306b\u6d3b\u7528<\/li>\n\n\n\n<li>\u30c1\u30e3\u30c3\u30c8\u30dc\u30c3\u30c8\u306e\u958b\u767a: \u30e6\u30fc\u30b6\u30fc\u306e\u81ea\u7136\u8a00\u8a9e\u5165\u529b\u3092\u89e3\u6790\u3057\u3001\u9069\u5207\u306a\u5fdc\u7b54\u3092\u751f\u6210<\/li>\n<\/ul>\n\n\n\n<p>\u4ed6\u306b\u3082\u3001\u30b9\u30d1\u30e0\u30e1\u30fc\u30eb\u306e\u691c\u77e5\u3001\u793e\u5185\u6587\u66f8\u306e\u6574\u7406\u306a\u3069\u3001\u30c6\u30ad\u30b9\u30c8\u30c7\u30fc\u30bf\u304c\u7d61\u3080\u69d8\u3005\u306a\u5834\u9762\u3067\u6d3b\u8e8d\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<p>NLTK\u3092\u4f7f\u3048\u3070\u3001\u3053\u3093\u306a\u30b7\u30f3\u30d7\u30eb\u306a\u30b3\u30fc\u30c9\u3067\u30c6\u30ad\u30b9\u30c8\u306e\u524d\u51e6\u7406\u304c\u3067\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">from nltk.tokenize import word_tokenize\n\ntext = \"This is a sample sentence, showing off the tokenization.\"\ntokens = word_tokenize(text)\nprint(tokens)<\/pre>\n\n\n\n<p>\u51fa\u529b:<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">['This', 'is', 'a', 'sample', 'sentence', ',', 'showing', 'off', 'the', 'tokenization', 
'.']<\/pre>\n\n\n\n<p>\u672c\u8a18\u4e8b\u3067\u306f\u3001\u521d\u5fc3\u8005\u306e\u305f\u3081\u306bNLTK\u306e\u4f7f\u3044\u65b9\u3092\u4e01\u5be7\u306b\u89e3\u8aac\u3057\u307e\u3059\u3002\u3053\u308c\u304b\u3089Python\u3067\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306b\u6311\u6226\u3057\u305f\u3044\u65b9\u306f\u3001\u305c\u3072NLTK\u304b\u3089\u59cb\u3081\u3066\u307f\u3066\u304f\u3060\u3055\u3044\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\" id=\"i-3\">NLTK\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3068\u57fa\u672c\u7684\u306a\u4f7f\u3044\u65b9<\/h2>\n\n\n\n<p>NLTK\u3092\u4f7f\u3046\u306b\u306f\u3001\u307e\u305aPython\u74b0\u5883\u306b\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3059\u308b\u5fc5\u8981\u304c\u3042\u308a\u307e\u3059\u3002\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u65b9\u6cd5\u306f\u3001\u304a\u4f7f\u3044\u306e\u74b0\u5883\u306b\u3088\u3063\u3066\u7570\u306a\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" id=\"i-4\">pip install 
nltk\u3067\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u624b\u9806<\/h3>\n\n\n\n<p>\u6700\u3082\u4e00\u822c\u7684\u306a\u306e\u306f\u3001pip\u3092\u4f7f\u3063\u305f\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u65b9\u6cd5\u3067\u3059\u3002\u4ee5\u4e0b\u306e\u30b3\u30de\u30f3\u30c9\u3092\u5b9f\u884c\u3057\u3066\u304f\u3060\u3055\u3044\u3002<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">pip install nltk<\/pre>\n\n\n\n<p>Anaconda\u74b0\u5883\u306e\u5834\u5408\u306f\u3001\u4ee5\u4e0b\u306e\u3088\u3046\u306bconda\u30b3\u30de\u30f3\u30c9\u3067\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">conda install -c anaconda nltk<\/pre>\n\n\n\n<p>\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u304c\u5b8c\u4e86\u3057\u305f\u3089\u3001Python\u30a4\u30f3\u30bf\u30fc\u30d7\u30ea\u30bf\u30fc\u3092\u8d77\u52d5\u3057\u3066\u3001\u4ee5\u4e0b\u306e\u3088\u3046\u306bNLTK\u3092\u30a4\u30f3\u30dd\u30fc\u30c8\u3057\u3066\u307f\u307e\u3057\u3087\u3046\u3002<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">import nltk<\/pre>\n\n\n\n<p>\u30a8\u30e9\u30fc\u304c\u51fa\u306a\u3051\u308c\u3070\u3001\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u306f\u6210\u529f\u3067\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" 
id=\"i-5\">\u983b\u51fa\u306eNLTK\u57fa\u672c\u64cd\u4f5c\u30b3\u30fc\u30c9\u4f8b<\/h3>\n\n\n\n<p>NLTK\u3092\u4f7f\u3063\u305f\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306e\u57fa\u672c\u7684\u306a\u6d41\u308c\u306f\u3001\u4ee5\u4e0b\u306e\u3088\u3046\u306b\u306a\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li>\u30c6\u30ad\u30b9\u30c8\u306e\u8aad\u307f\u8fbc\u307f<\/li>\n\n\n\n<li>\u30c8\u30fc\u30af\u30f3\u5316\uff08\u5358\u8a9e\u3084\u6587\u7ae0\u306b\u5206\u5272\uff09<\/li>\n\n\n\n<li>\u54c1\u8a5e\u30bf\u30ae\u30f3\u30b0<\/li>\n\n\n\n<li>\u983b\u5ea6\u5206\u5e03\u306e\u53d6\u5f97<\/li>\n<\/ol>\n\n\n\n<p>\u305d\u308c\u3067\u306f\u3001\u5b9f\u969b\u306b\u30b3\u30fc\u30c9\u3092\u898b\u3066\u3044\u304d\u307e\u3057\u3087\u3046\u3002<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">from nltk.tokenize import word_tokenize, sent_tokenize\nfrom nltk import pos_tag\nfrom nltk.probability import FreqDist\n\n# \u30c6\u30ad\u30b9\u30c8\u306e\u8aad\u307f\u8fbc\u307f\nwith open('sample.txt', 'r') as file:\n    text = file.read()\n\n# \u30c8\u30fc\u30af\u30f3\u5316\nwords = word_tokenize(text)  # \u5358\u8a9e\u306b\u5206\u5272\nsentences = sent_tokenize(text)  # \u6587\u7ae0\u306b\u5206\u5272\n\n# \u54c1\u8a5e\u30bf\u30ae\u30f3\u30b0\ntagged_words = pos_tag(words)\n\n# \u983b\u5ea6\u5206\u5e03\u306e\u53d6\u5f97\nfdist = FreqDist(words)\nprint(fdist.most_common(10))  # 
\u4e0a\u4f4d10\u8a9e\u306e\u51fa\u73fe\u983b\u5ea6\u3092\u8868\u793a<\/pre>\n\n\n\n<p>\u3053\u306e\u30b3\u30fc\u30c9\u4f8b\u3067\u306f\u3001<code>sample.txt<\/code>\u3068\u3044\u3046\u30d5\u30a1\u30a4\u30eb\u304b\u3089\u30c6\u30ad\u30b9\u30c8\u3092\u8aad\u307f\u8fbc\u307f\u3001\u5358\u8a9e\u3068\u6587\u7ae0\u306b\u5206\u5272\u3057\u3066\u3044\u307e\u3059\u3002\u305d\u3057\u3066\u3001\u5358\u8a9e\u306e\u54c1\u8a5e\u3092\u8b58\u5225\u3057\u3001\u5358\u8a9e\u306e\u51fa\u73fe\u983b\u5ea6\u3092\u8a08\u7b97\u3057\u3066\u3044\u307e\u3059\u3002<\/p>\n\n\n\n<p>\u5b9f\u884c\u306b\u306f\u3001\u5225\u9014\u30c6\u30ad\u30b9\u30c8\u30d5\u30a1\u30a4\u30eb\u3092\u7528\u610f\u3059\u308b\u5fc5\u8981\u304c\u3042\u308a\u307e\u3059\u304c\u3001\u3053\u308c\u3060\u3051\u306e\u30b3\u30fc\u30c9\u3067\u3001\u30c6\u30ad\u30b9\u30c8\u30c7\u30fc\u30bf\u306e\u57fa\u672c\u7684\u306a\u524d\u51e6\u7406\u304c\u5b8c\u4e86\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<p>NLTK\u306e\u6a5f\u80fd\u306f\u591a\u5c90\u306b\u308f\u305f\u308a\u307e\u3059\u304c\u3001\u521d\u5b66\u8005\u304c\u7279\u306b\u62bc\u3055\u3048\u3066\u304a\u304d\u305f\u3044\u91cd\u8981\u6a5f\u80fd\u306f\u4ee5\u4e0b\u306e5\u3064\u3067\u3059\u3002<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li>Tokenization\uff08\u30c8\u30fc\u30af\u30f3\u5316\uff09<\/li>\n\n\n\n<li>POS Tagging\uff08\u54c1\u8a5e\u30bf\u30ae\u30f3\u30b0\uff09<\/li>\n\n\n\n<li>Frequency Distributions\uff08\u983b\u5ea6\u5206\u5e03\uff09<\/li>\n\n\n\n<li>Stopwords Removal\uff08\u30b9\u30c8\u30c3\u30d7\u30ef\u30fc\u30c9\u9664\u53bb\uff09<\/li>\n\n\n\n<li>Stemming and 
Lemmatization\uff08\u30b9\u30c6\u30df\u30f3\u30b0\u3068\u898b\u51fa\u3057\u8a9e\u5316\uff09<\/li>\n<\/ol>\n\n\n\n<p>\u3053\u308c\u3089\u306e\u6a5f\u80fd\u3092\u7406\u89e3\u3057\u3001\u4f7f\u3044\u3053\u306a\u305b\u308b\u3088\u3046\u306b\u306a\u308b\u3053\u3068\u304c\u3001NLTK\u3092\u7528\u3044\u305f\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306e\u7b2c\u4e00\u6b69\u3068\u306a\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<p>\u6b21\u7ae0\u3067\u306f\u3001NLTK\u3092\u4f7f\u3063\u305f\u611f\u60c5\u5206\u6790\u306e\u65b9\u6cd5\u306b\u3064\u3044\u3066\u89e3\u8aac\u3057\u307e\u3059\u3002\u57fa\u672c\u64cd\u4f5c\u3092\u7fd2\u5f97\u3057\u305f\u3089\u3001\u305c\u3072\u5fdc\u7528\u4f8b\u306b\u3082\u6311\u6226\u3057\u3066\u307f\u3066\u304f\u3060\u3055\u3044\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\" id=\"i-6\">Sentiment Analysis\uff08\u611f\u60c5\u5206\u6790\uff09\u5165\u9580<\/h2>\n\n\n\n<p>\u30c6\u30ad\u30b9\u30c8\u30c7\u30fc\u30bf\u304b\u3089\u611f\u60c5\u3084\u30aa\u30d4\u30cb\u30aa\u30f3\u3092\u62bd\u51fa\u3057\u3001\u30dd\u30b8\u30c6\u30a3\u30d6\/\u30cd\u30ac\u30c6\u30a3\u30d6\/\u30cb\u30e5\u30fc\u30c8\u30e9\u30eb\u306a\u3069\u306b\u5206\u985e\u3059\u308b\u6280\u8853\u3092\u3001\u611f\u60c5\u5206\u6790\uff08Sentiment Analysis\uff09\u3068\u547c\u3073\u307e\u3059\u3002SNS\u306e\u6295\u7a3f\u3084\u5546\u54c1\u30ec\u30d3\u30e5\u30fc\u306a\u3069\u3092\u5206\u6790\u3059\u308b\u3053\u3068\u3067\u3001\u30e6\u30fc\u30b6\u30fc\u306e\u611f\u60c5\u3092\u7406\u89e3\u3057\u3001\u30d3\u30b8\u30cd\u30b9\u306b\u6d3b\u304b\u3059\u3053\u3068\u304c\u3067\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" id=\"i-7\">\u611f\u60c5\u5206\u6790\u306e\u6982\u8981\u3068\u30d3\u30b8\u30cd\u30b9\u6d3b\u7528\u4f8b<\/h3>\n\n\n\n<p>\u611f\u60c5\u5206\u6790\u306f\u3001\u5927\u304d\u304f\u5206\u3051\u3066\u4ee5\u4e0b\u306e3\u3064\u306e\u624b\u6cd5\u306b\u5206\u985e\u3055\u308c\u307e\u3059\u3002<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li>\u30eb\u30fc\u30eb\u30d9\u30fc\u30b9: 
\u611f\u60c5\u6975\u6027\u8f9e\u66f8\u306a\u3069\u306e\u4e8b\u524d\u5b9a\u7fa9\u3055\u308c\u305f\u30eb\u30fc\u30eb\u3092\u7528\u3044\u308b\u65b9\u6cd5\u3002<\/li>\n\n\n\n<li>\u6a5f\u68b0\u5b66\u7fd2: \u6559\u5e2b\u3042\u308a\u5b66\u7fd2\u306b\u3088\u308a\u3001\u30e9\u30d9\u30eb\u4ed8\u304d\u30c7\u30fc\u30bf\u304b\u3089\u5206\u985e\u5668\u3092\u5b66\u7fd2\u3059\u308b\u65b9\u6cd5\u3002<\/li>\n\n\n\n<li>\u6df1\u5c64\u5b66\u7fd2: \u30cb\u30e5\u30fc\u30e9\u30eb\u30cd\u30c3\u30c8\u30ef\u30fc\u30af\u3092\u7528\u3044\u3066\u3001\u30c6\u30ad\u30b9\u30c8\u306e\u7279\u5fb4\u3092\u81ea\u52d5\u3067\u5b66\u7fd2\u3059\u308b\u65b9\u6cd5\u3002<\/li>\n<\/ol>\n\n\n\n<p>\u30d3\u30b8\u30cd\u30b9\u3067\u306e\u6d3b\u7528\u4f8b\u3068\u3057\u3066\u306f\u3001\u4ee5\u4e0b\u306e\u3088\u3046\u306a\u3082\u306e\u304c\u3042\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>\u30d6\u30e9\u30f3\u30c9\u30a4\u30e1\u30fc\u30b8\u5206\u6790: SNS\u3067\u306e\u30d6\u30e9\u30f3\u30c9\u8a00\u53ca\u3092\u5206\u6790\u3057\u3001\u6d88\u8cbb\u8005\u306e\u611f\u60c5\u3092\u628a\u63e1\u3002<\/li>\n\n\n\n<li>\u5546\u54c1\u30ec\u30d3\u30e5\u30fc\u5206\u6790: E\u30b3\u30de\u30fc\u30b9\u30b5\u30a4\u30c8\u306e\u30ec\u30d3\u30e5\u30fc\u3092\u5206\u6790\u3057\u3001\u5546\u54c1\u306e\u6539\u5584\u70b9\u3092\u767a\u898b\u3002<\/li>\n\n\n\n<li>\u9867\u5ba2\u5bfe\u5fdc\u306e\u6539\u5584: \u554f\u3044\u5408\u308f\u305b\u30e1\u30fc\u30eb\u3084\u30c1\u30e3\u30c3\u30c8\u30ed\u30b0\u3092\u5206\u6790\u3057\u3001\u9867\u5ba2\u6e80\u8db3\u5ea6\u3092\u5411\u4e0a\u3002<\/li>\n\n\n\n<li>\u4e16\u8ad6\u52d5\u5411\u306e\u628a\u63e1: 
\u30cb\u30e5\u30fc\u30b9\u8a18\u4e8b\u3084SNS\u3067\u306e\u53cd\u5fdc\u3092\u5206\u6790\u3057\u3001\u793e\u4f1a\u306e\u95a2\u5fc3\u4e8b\u3092\u7406\u89e3\u3002<\/li>\n<\/ul>\n\n\n\n<p>\u611f\u60c5\u5206\u6790\u306b\u3088\u3063\u3066\u3001\u9867\u5ba2\u306e\u58f0\u3092\u5b9a\u91cf\u7684\u306b\u628a\u63e1\u3057\u3001\u30c7\u30fc\u30bf\u30c9\u30ea\u30d6\u30f3\u306a\u610f\u601d\u6c7a\u5b9a\u3092\u884c\u3046\u3053\u3068\u304c\u3067\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" id=\"i-8\">NLTK\u306b\u3088\u308b\u611f\u60c5\u5206\u6790\u306e\u30a2\u30d7\u30ed\u30fc\u30c1<\/h3>\n\n\n\n<p>NLTK\u3092\u4f7f\u3063\u305f\u611f\u60c5\u5206\u6790\u306e\u57fa\u672c\u7684\u306a\u6d41\u308c\u306f\u3001\u4ee5\u4e0b\u306e\u3088\u3046\u306b\u306a\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li>\u611f\u60c5\u6975\u6027\u8f9e\u66f8\u306e\u6e96\u5099: \u5358\u8a9e\u306e\u611f\u60c5\u6975\u6027\uff08\u30dd\u30b8\u30c6\u30a3\u30d6\/\u30cd\u30ac\u30c6\u30a3\u30d6\uff09\u3092\u5b9a\u7fa9\u3057\u305f\u8f9e\u66f8\u3092\u7528\u610f\u3057\u307e\u3059\u3002NLTK\u306b\u306f\u300cSentiWordNet\u300d\u306a\u3069\u306e\u8f9e\u66f8\u304c\u542b\u307e\u308c\u3066\u3044\u307e\u3059\u3002<\/li>\n\n\n\n<li>\u30c6\u30ad\u30b9\u30c8\u306e\u524d\u51e6\u7406: \u30c8\u30fc\u30af\u30f3\u5316\u3001\u30b9\u30c8\u30c3\u30d7\u30ef\u30fc\u30c9\u9664\u53bb\u3001\u30b9\u30c6\u30df\u30f3\u30b0\u306a\u3069\u3092\u884c\u3044\u307e\u3059\u3002<\/li>\n\n\n\n<li>\u611f\u60c5\u6975\u6027\u30b9\u30b3\u30a2\u306e\u8a08\u7b97: \u611f\u60c5\u6975\u6027\u8f9e\u66f8\u3092\u53c2\u7167\u3057\u3001\u30c6\u30ad\u30b9\u30c8\u5185\u306e\u5358\u8a9e\u306e\u611f\u60c5\u6975\u6027\u30b9\u30b3\u30a2\u3092\u96c6\u8a08\u3057\u307e\u3059\u3002<\/li>\n\n\n\n<li>\u611f\u60c5\u30e9\u30d9\u30eb\u306e\u5224\u5b9a: 
\u30b9\u30b3\u30a2\u306b\u57fa\u3065\u3044\u3066\u3001\u30c6\u30ad\u30b9\u30c8\u5168\u4f53\u306e\u611f\u60c5\u30e9\u30d9\u30eb\uff08\u30dd\u30b8\u30c6\u30a3\u30d6\/\u30cd\u30ac\u30c6\u30a3\u30d6\uff09\u3092\u5224\u5b9a\u3057\u307e\u3059\u3002<\/li>\n<\/ol>\n\n\n\n<p>\u5177\u4f53\u7684\u306b\u306f\u3001\u4ee5\u4e0b\u306e\u3088\u3046\u306a\u65b9\u6cd5\u304c\u3042\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>VADER\uff08Valence Aware Dictionary and sEntiment Reasoner\uff09\u3092\u4f7f\u3063\u305f\u611f\u60c5\u5206\u6790<\/li>\n\n\n\n<li>VADER\u306f\u3001\u30eb\u30fc\u30eb\u30d9\u30fc\u30b9\u306e\u611f\u60c5\u5206\u6790\u5668\u3002<\/li>\n\n\n\n<li>\u5358\u8a9e\u306e\u611f\u60c5\u6975\u6027\u30b9\u30b3\u30a2\u3092\u96c6\u8a08\u3057\u3001\u30c6\u30ad\u30b9\u30c8\u306e\u611f\u60c5\u3092\u5224\u5b9a\u3059\u308b\u3002<\/li>\n\n\n\n<li>Naive Bayes\u3092\u4f7f\u3063\u305f\u611f\u60c5\u5206\u6790<\/li>\n\n\n\n<li>\u6559\u5e2b\u3042\u308a\u6a5f\u68b0\u5b66\u7fd2\u306e\u4e00\u7a2e\u3002<\/li>\n\n\n\n<li>\u4e8b\u524d\u306b\u30e9\u30d9\u30eb\u4ed8\u3051\u3055\u308c\u305f\u30c7\u30fc\u30bf\u30bb\u30c3\u30c8\u3092\u7528\u3044\u3066\u3001\u5206\u985e\u5668\u3092\u5b66\u7fd2\u3055\u305b\u308b\u3002<\/li>\n<\/ul>\n\n\n\n<p>\u6b21\u7ae0\u3067\u306f\u3001\u5b9f\u969b\u306bNLTK\u3092\u4f7f\u3063\u3066\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u3092\u5b9f\u88c5\u3059\u308b\u65b9\u6cd5\u3092\u7d39\u4ecb\u3057\u307e\u3059\u3002\u30b3\u30fc\u30c9\u3092\u4ea4\u3048\u306a\u304c\u3089\u3001\u611f\u60c5\u5206\u6790\u306e\u4ed5\u7d44\u307f\u3092\u8a73\u3057\u304f\u89e3\u8aac\u3057\u3066\u3044\u304d\u307e\u3059\u306e\u3067\u3001\u304a\u697d\u3057\u307f\u306b\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\" 
id=\"i-9\">NLTK\u3067\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u3092\u5b9f\u88c5\u3057\u3066\u307f\u3088\u3046<\/h2>\n\n\n\n<p>\u524d\u7ae0\u3067\u306f\u3001\u611f\u60c5\u5206\u6790\u306e\u6982\u8981\u3068NLTK\u3067\u306e\u30a2\u30d7\u30ed\u30fc\u30c1\u3092\u7d39\u4ecb\u3057\u307e\u3057\u305f\u3002\u672c\u7ae0\u3067\u306f\u3001\u5b9f\u969b\u306bPython\u306e\u30b3\u30fc\u30c9\u3092\u66f8\u304d\u306a\u304c\u3089\u3001NLTK\u3092\u4f7f\u3063\u305f\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u306e\u5b9f\u88c5\u65b9\u6cd5\u3092\u898b\u3066\u3044\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" id=\"i-10\">VADER Lexicon\u3092\u7528\u3044\u305f\u30cd\u30ac\u30dd\u30b8\u5206\u6790<\/h3>\n\n\n\n<p>VADER\u306f\u3001\u30eb\u30fc\u30eb\u30d9\u30fc\u30b9\u306e\u611f\u60c5\u5206\u6790\u5668\u3067\u3001\u5358\u8a9e\u306e\u611f\u60c5\u6975\u6027\u30b9\u30b3\u30a2\u3092\u96c6\u8a08\u3057\u3001\u30c6\u30ad\u30b9\u30c8\u306e\u611f\u60c5\u3092\u5224\u5b9a\u3057\u307e\u3059\u3002\u4ee5\u4e0b\u306e\u624b\u9806\u3067\u3001VADER\u3092\u4f7f\u3063\u305f\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u3092\u5b9f\u88c5\u3067\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li>VADER\u306e\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<\/li>\n<\/ol>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">   pip install vaderSentiment<\/pre>\n\n\n\n<ol class=\"wp-block-list\" start=\"2\">\n<li>SentimentIntensityAnalyzer\u306e\u30a4\u30f3\u30b9\u30bf\u30f3\u30b9\u5316<\/li>\n<\/ol>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">   from vaderSentiment.vaderSentiment import SentimentIntensityAnalyzer\n\n   analyzer = 
SentimentIntensityAnalyzer()<\/pre>\n\n\n\n<ol class=\"wp-block-list\" start=\"3\">\n<li><code>polarity_scores()<\/code>\u30e1\u30bd\u30c3\u30c9\u3067\u30c6\u30ad\u30b9\u30c8\u306e\u611f\u60c5\u6975\u6027\u3092\u8a08\u7b97<\/li>\n<\/ol>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">   text = \"This is a great movie, but the ending was disappointing.\"\n   scores = analyzer.polarity_scores(text)\n   print(scores)<\/pre>\n\n\n\n<p>\u51fa\u529b\u7d50\u679c:<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">   {'neg': 0.09, 'neu': 0.638, 'pos': 0.272, 'compound': 0.4404}<\/pre>\n\n\n\n<ul class=\"wp-block-list\">\n<li><code>neg<\/code>: \u30cd\u30ac\u30c6\u30a3\u30d6\u306a\u611f\u60c5\u306e\u5272\u5408<\/li>\n\n\n\n<li><code>neu<\/code>: \u30cb\u30e5\u30fc\u30c8\u30e9\u30eb\u306a\u611f\u60c5\u306e\u5272\u5408<\/li>\n\n\n\n<li><code>pos<\/code>: \u30dd\u30b8\u30c6\u30a3\u30d6\u306a\u611f\u60c5\u306e\u5272\u5408<\/li>\n\n\n\n<li><code>compound<\/code>: -1\u304b\u30891\u307e\u3067\u306e\u898f\u683c\u5316\u3055\u308c\u305f\u30b9\u30b3\u30a2\uff08-1\u306b\u8fd1\u3044\u307b\u3069\u30cd\u30ac\u30c6\u30a3\u30d6\u30011\u306b\u8fd1\u3044\u307b\u3069\u30dd\u30b8\u30c6\u30a3\u30d6\uff09<\/li>\n<\/ul>\n\n\n\n<p>\u4ee5\u4e0a\u306e\u3088\u3046\u306b\u3001\u308f\u305a\u304b\u6570\u884c\u306e\u30b3\u30fc\u30c9\u3067\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u3092\u5b9f\u884c\u3067\u304d\u308b\u306e\u304c\u3001VADER\u306e\u5927\u304d\u306a\u5229\u70b9\u3067\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" 
id=\"i-11\">MovieReview\u30c7\u30fc\u30bf\u3092\u4f7f\u3063\u305f\u5206\u6790\u306e\u6d41\u308c<\/h3>\n\n\n\n<p>\u6b21\u306b\u3001\u5b9f\u969b\u306e\u6620\u753b\u30ec\u30d3\u30e5\u30fc\u306e\u30c7\u30fc\u30bf\u3092\u4f7f\u3063\u3066\u3001\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u306e\u6d41\u308c\u3092\u898b\u3066\u3044\u304d\u307e\u3057\u3087\u3046\u3002\u3053\u3053\u3067\u306f\u3001Cornell\u5927\u5b66\u304c\u516c\u958b\u3057\u3066\u3044\u308b<a href=\"http:\/\/www.cs.cornell.edu\/people\/pabo\/movie-review-data\/\">Movie Review Data<\/a>\u3092\u4f7f\u7528\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">import os\nfrom nltk.corpus import movie_reviews\n\n# Movie Review\u30c7\u30fc\u30bf\u306e\u30ed\u30fc\u30c9\nreviews = []\nfor category in movie_reviews.categories():\n    for fileid in movie_reviews.fileids(category):\n        review_text = movie_reviews.raw(fileid)\n        reviews.append((review_text, category))\n\n# VADER\u306b\u3088\u308b\u30cd\u30ac\u30dd\u30b8\u5206\u6790\nanalyzer = SentimentIntensityAnalyzer()\ncorrect = 0\nfor review_text, category in reviews:\n    scores = analyzer.polarity_scores(review_text)\n    if scores['compound'] &gt; 0 and category == 'pos':\n        correct += 1\n    elif scores['compound'] &lt;= 0 and category == 'neg':\n        correct += 1\n\naccuracy = correct \/ len(reviews)\nprint(f\"Accuracy: {accuracy:.2f}\")<\/pre>\n\n\n\n<p>\u51fa\u529b\u7d50\u679c:<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">Accuracy: 0.71<\/pre>\n\n\n\n<p>\u3053\u306e\u4f8b\u3067\u306f\u3001Movie 
Review\u30c7\u30fc\u30bf\u3092\u30ed\u30fc\u30c9\u3057\u3001\u5404\u30ec\u30d3\u30e5\u30fc\u3092VADER\u3067\u5206\u6790\u3057\u3066\u3044\u307e\u3059\u3002<code>compound<\/code>\u30b9\u30b3\u30a2\u304c0\u3088\u308a\u5927\u304d\u3044\u5834\u5408\u306f\u30dd\u30b8\u30c6\u30a3\u30d6\u30010\u4ee5\u4e0b\u306e\u5834\u5408\u306f\u30cd\u30ac\u30c6\u30a3\u30d6\u3068\u5224\u5b9a\u3057\u3001\u6b63\u89e3\u7387\uff08Accuracy\uff09\u3092\u8a08\u7b97\u3057\u3066\u3044\u307e\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" id=\"i-12\">\u7c21\u5358\u306a\u30cd\u30ac\u30dd\u30b8\u5224\u5b9a\u30d7\u30ed\u30b0\u30e9\u30e0\u3092\u5b9f\u88c5<\/h3>\n\n\n\n<p>\u6700\u5f8c\u306b\u3001\u30e6\u30fc\u30b6\u30fc\u304c\u5165\u529b\u3057\u305f\u30c6\u30ad\u30b9\u30c8\u306e\u30cd\u30ac\u30dd\u30b8\u3092\u5224\u5b9a\u3059\u308b\u7c21\u5358\u306a\u30d7\u30ed\u30b0\u30e9\u30e0\u3092\u5b9f\u88c5\u3057\u3066\u307f\u307e\u3057\u3087\u3046\u3002<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">from vaderSentiment.vaderSentiment import SentimentIntensityAnalyzer\n\ndef analyze_sentiment(text):\n    analyzer = SentimentIntensityAnalyzer()\n    scores = analyzer.polarity_scores(text)\n    if scores['compound'] &gt; 0:\n        return \"Positive\"\n    elif scores['compound'] &lt; 0:\n        return \"Negative\"\n    else:\n        return \"Neutral\"\n\nwhile True:\n    user_input = input(\"Enter a sentence (or 'q' to quit): \")\n    if user_input == 'q':\n        break\n    sentiment = analyze_sentiment(user_input)\n    print(f\"Sentiment: 
{sentiment}\\n\")<\/pre>\n\n\n\n<p>\u3053\u306e\u30d7\u30ed\u30b0\u30e9\u30e0\u3067\u306f\u3001\u30e6\u30fc\u30b6\u30fc\u304c\u5165\u529b\u3057\u305f\u6587\u7ae0\u3092VADER\u3067\u5206\u6790\u3057\u3001<code>compound<\/code>\u30b9\u30b3\u30a2\u306b\u57fa\u3065\u3044\u3066\u30dd\u30b8\u30c6\u30a3\u30d6\u3001\u30cd\u30ac\u30c6\u30a3\u30d6\u3001\u30cb\u30e5\u30fc\u30c8\u30e9\u30eb\u306e\u3044\u305a\u308c\u304b\u3092\u5224\u5b9a\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<p>\u5b9f\u884c\u4f8b:<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">Enter a sentence (or 'q' to quit): This movie was fantastic!\nSentiment: Positive\n\nEnter a sentence (or 'q' to quit): I didn't like the food at that restaurant.\nSentiment: Negative\n\nEnter a sentence (or 'q' to quit): The weather is cloudy today.\nSentiment: Neutral\n\nEnter a sentence (or 'q' to quit): q<\/pre>\n\n\n\n<p>\u4ee5\u4e0a\u3001NLTK\u3068VADER\u3092\u4f7f\u3063\u305f\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u306e\u5b9f\u88c5\u65b9\u6cd5\u3092\u7d39\u4ecb\u3057\u307e\u3057\u305f\u3002\u6b21\u7ae0\u3067\u306f\u3001\u3088\u308a\u767a\u5c55\u7684\u306a\u30c8\u30d4\u30c3\u30af\u3068\u3057\u3066\u3001\u524d\u51e6\u7406\u306e\u30c6\u30af\u30cb\u30c3\u30af\u3084\u30cd\u30ac\u30dd\u30b8\u5224\u5b9a\u306e\u30ab\u30b9\u30bf\u30de\u30a4\u30ba\u65b9\u6cd5\u306a\u3069\u3092\u89e3\u8aac\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\" 
id=\"i-13\">NLTK\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u306eTips\uff06\u767a\u5c55\u7684\u30c8\u30d4\u30c3\u30af<\/h2>\n\n\n\n<p>\u524d\u7ae0\u3067\u306f\u3001VADER\u3092\u4f7f\u3063\u305f\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u306e\u5b9f\u88c5\u65b9\u6cd5\u3092\u7d39\u4ecb\u3057\u307e\u3057\u305f\u3002\u672c\u7ae0\u3067\u306f\u3001\u3088\u308a\u7cbe\u5ea6\u306e\u9ad8\u3044\u5206\u6790\u3092\u884c\u3046\u305f\u3081\u306e\u524d\u51e6\u7406\u306e\u30dd\u30a4\u30f3\u30c8\u3068\u3001\u30cd\u30ac\u30dd\u30b8\u5224\u5b9a\u30ed\u30b8\u30c3\u30af\u306e\u30ab\u30b9\u30bf\u30de\u30a4\u30ba\u65b9\u6cd5\u3092\u89e3\u8aac\u3057\u307e\u3059\u3002\u307e\u305f\u3001\u4ed6\u306e\u611f\u60c5\u5206\u6790\u624b\u6cd5\u3068\u306e\u6bd4\u8f03\u3082\u884c\u3044\u307e\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" id=\"i-14\">\u524d\u51e6\u7406\u306e\u30dd\u30a4\u30f3\u30c8\u3068\u30b3\u30fc\u30c9\u30b5\u30f3\u30d7\u30eb<\/h3>\n\n\n\n<p>\u30c6\u30ad\u30b9\u30c8\u30c7\u30fc\u30bf\u3092\u5206\u6790\u3059\u308b\u969b\u306f\u3001\u524d\u51e6\u7406\u304c\u91cd\u8981\u3067\u3059\u3002\u4ee5\u4e0b\u306f\u3001NLTK\u3092\u4f7f\u3063\u305f\u524d\u51e6\u7406\u306e\u4e3b\u306a\u30dd\u30a4\u30f3\u30c8\u3067\u3059\u3002<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li>\u30c6\u30ad\u30b9\u30c8\u306e\u30af\u30ea\u30fc\u30cb\u30f3\u30b0\n<ul class=\"wp-block-list\">\n<li>\u4f59\u5206\u306a\u6587\u5b57\uff08HTML\u30bf\u30b0\u3001\u7279\u6b8a\u6587\u5b57\u306a\u3069\uff09\u306e\u9664\u53bb<\/li>\n\n\n\n<li>\u5927\u6587\u5b57\u30fb\u5c0f\u6587\u5b57\u306e\u7d71\u4e00<\/li>\n\n\n\n<li>\u30b9\u30da\u30eb\u30c1\u30a7\u30c3\u30af\u3068\u4fee\u6b63<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>\u30c8\u30fc\u30af\u30f3\u5316\n<ul 
class=\"wp-block-list\">\n<li>\u6587\u7ae0\u3092\u5358\u8a9e\u3084\u6587\u5b57\u306b\u5206\u5272\u3059\u308b<\/li>\n\n\n\n<li>\u6b63\u898f\u8868\u73fe\u3084\u7279\u5b9a\u306e\u533a\u5207\u308a\u6587\u5b57\u3092\u4f7f\u7528<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>\u30b9\u30c8\u30c3\u30d7\u30ef\u30fc\u30c9\u9664\u53bb\n<ul class=\"wp-block-list\">\n<li>\u201cthe\u201d, \u201cand\u201d, \u201cis\u201d\u306a\u3069\u3001\u983b\u51fa\u3059\u308b\u304c\u611f\u60c5\u5224\u5b9a\u306b\u5bc4\u4e0e\u3057\u306a\u3044\u5358\u8a9e\u3092\u9664\u53bb\u3059\u308b<\/li>\n\n\n\n<li>NLTK\u306e<code>stopwords<\/code>\u30e2\u30b8\u30e5\u30fc\u30eb\u3092\u4f7f\u7528<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>\u30b9\u30c6\u30df\u30f3\u30b0\u30fb\u30ec\u30f3\u30de\u5316\n<ul class=\"wp-block-list\">\n<li>\u5358\u8a9e\u3092\u539f\u5f62\u3084\u8a9e\u5e79\u306b\u7d71\u4e00\u3059\u308b<\/li>\n\n\n\n<li>\u4f8b: \u201crunning\u201d, \u201cran\u201d, \u201cruns\u201d \u2192 \u201crun\u201d<\/li>\n\n\n\n<li>NLTK\u306e<code>PorterStemmer<\/code>\u3084<code>WordNetLemmatizer<\/code>\u3092\u4f7f\u7528<\/li>\n<\/ul>\n<\/li>\n<\/ol>\n\n\n\n<p>\u4ee5\u4e0b\u306f\u3001\u3053\u308c\u3089\u306e\u524d\u51e6\u7406\u3092\u5b9f\u88c5\u3057\u305fPython\u30b3\u30fc\u30c9\u306e\u30b5\u30f3\u30d7\u30eb\u3067\u3059\u3002<\/p>\n\n\n\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"generic\" data-enlighter-theme=\"\" data-enlighter-highlight=\"\" data-enlighter-linenumbers=\"\" data-enlighter-lineoffset=\"\" data-enlighter-title=\"\" data-enlighter-group=\"\">import re\nfrom nltk.corpus import stopwords\nfrom nltk.stem import PorterStemmer, WordNetLemmatizer\n\ndef preprocess_text(text):\n    # \u30c6\u30ad\u30b9\u30c8\u306e\u30af\u30ea\u30fc\u30cb\u30f3\u30b0\n    text = re.sub(r'&lt;.*?&gt;', '', text)  # HTML\u30bf\u30b0\u306e\u9664\u53bb\n    text = re.sub(r'[^a-zA-Z]', ' ', text)  # \u82f1\u5b57\u4ee5\u5916\u306e\u6587\u5b57\u3092\u30b9\u30da\u30fc\u30b9\u306b\u7f6e\u63db\n    text = text.lower()  # 
\u5c0f\u6587\u5b57\u306b\u7d71\u4e00\n\n    # \u30c8\u30fc\u30af\u30f3\u5316\n    tokens = text.split()\n\n    # \u30b9\u30c8\u30c3\u30d7\u30ef\u30fc\u30c9\u9664\u53bb\n    stop_words = set(stopwords.words('english'))\n    tokens = [token for token in tokens if token not in stop_words]\n\n    # \u30b9\u30c6\u30df\u30f3\u30b0\u30fb\u30ec\u30f3\u30de\u5316\n    stemmer = PorterStemmer()\n    lemmatizer = WordNetLemmatizer()\n    tokens = [stemmer.stem(token) for token in tokens]\n    tokens = [lemmatizer.lemmatize(token) for token in tokens]\n\n    return tokens<\/pre>\n\n\n\n<p>\u3053\u306e\u95a2\u6570\u3067\u306f\u3001\u6b63\u898f\u8868\u73fe\u3092\u4f7f\u3063\u3066\u30c6\u30ad\u30b9\u30c8\u3092\u30af\u30ea\u30fc\u30cb\u30f3\u30b0\u3057\u3001\u30c8\u30fc\u30af\u30f3\u5316\u3001\u30b9\u30c8\u30c3\u30d7\u30ef\u30fc\u30c9\u9664\u53bb\u3001\u30b9\u30c6\u30df\u30f3\u30b0\u30fb\u30ec\u30f3\u30de\u5316\u3092\u884c\u3063\u3066\u3044\u307e\u3059\u3002\u524d\u51e6\u7406\u6e08\u307f\u306e\u30c8\u30fc\u30af\u30f3\u306e\u30ea\u30b9\u30c8\u304c\u8fd4\u3055\u308c\u307e\u3059\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" id=\"i-15\">\u30cd\u30ac\u30dd\u30b8\u5224\u5b9a\u30ed\u30b8\u30c3\u30af\u306e\u30ab\u30b9\u30bf\u30de\u30a4\u30ba<\/h3>\n\n\n\n<p>VADER\u306e\u30c7\u30d5\u30a9\u30eb\u30c8\u306e\u5224\u5b9a\u30ed\u30b8\u30c3\u30af\u3067\u306f\u3001\u3046\u307e\u304f\u5224\u5b9a\u3067\u304d\u306a\u3044\u30b1\u30fc\u30b9\u304c\u3042\u308a\u307e\u3059\u3002\u4ee5\u4e0b\u306e\u3088\u3046\u306a\u30ab\u30b9\u30bf\u30de\u30a4\u30ba\u3092\u884c\u3046\u3053\u3068\u3067\u3001\u7cbe\u5ea6\u3092\u5411\u4e0a\u3055\u305b\u308b\u3053\u3068\u304c\u3067\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li>\u5358\u8a9e\u306e\u611f\u60c5\u6975\u6027\u8f9e\u66f8\u306e\u62e1\u5f35\n<ul 
class=\"wp-block-list\">\n<li>VADER\u306e\u8f9e\u66f8\u306b\u3001\u30c9\u30e1\u30a4\u30f3\u56fa\u6709\u306e\u5358\u8a9e\u3068\u6975\u6027\u30b9\u30b3\u30a2\u3092\u8ffd\u52a0\u3059\u308b<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>\u5426\u5b9a\u8a9e\u306e\u51e6\u7406\n<ul class=\"wp-block-list\">\n<li>\u201cnot\u201d\u3084\u201cnever\u201d\u306a\u3069\u3001\u5f8c\u7d9a\u3059\u308b\u5358\u8a9e\u306e\u6975\u6027\u3092\u53cd\u8ee2\u3055\u305b\u308b\u8a9e\u306e\u51e6\u7406\u3092\u6539\u826f\u3059\u308b<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>\u5f37\u8abf\u8a9e\u306e\u51e6\u7406\n<ul class=\"wp-block-list\">\n<li>\u201cvery\u201d\u3084\u201cextremely\u201d\u306a\u3069\u3001\u5f8c\u7d9a\u3059\u308b\u5358\u8a9e\u306e\u6975\u6027\u3092\u5f37\u3081\u308b\u8a9e\u306e\u51e6\u7406\u3092\u8ffd\u52a0\u3059\u308b<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>\u6587\u8108\u3092\u8003\u616e\u3057\u305f\u6975\u6027\u30b9\u30b3\u30a2\u306e\u8abf\u6574\n<ul class=\"wp-block-list\">\n<li>\u524d\u5f8c\u306e\u5358\u8a9e\u3084\u6587\u7ae0\u5168\u4f53\u306e\u6587\u8108\u3092\u8003\u616e\u3057\u3066\u3001\u6975\u6027\u30b9\u30b3\u30a2\u3092\u8abf\u6574\u3059\u308b<\/li>\n<\/ul>\n<\/li>\n<\/ol>\n\n\n\n<p>\u3053\u308c\u3089\u306e\u30ab\u30b9\u30bf\u30de\u30a4\u30ba\u3092\u884c\u3046\u306b\u306f\u3001VADER\u306e\u30bd\u30fc\u30b9\u30b3\u30fc\u30c9\u3092\u4fee\u6b63\u3059\u308b\u5fc5\u8981\u304c\u3042\u308a\u307e\u3059\u3002\u8a73\u7d30\u306f\u3001VADER\u306e\u30c9\u30ad\u30e5\u30e1\u30f3\u30c8\u3092\u53c2\u7167\u3057\u3066\u304f\u3060\u3055\u3044\u3002<\/p>\n\n\n\n<h3 class=\"wp-block-heading\" id=\"i-16\">\u4ed6\u306e\u611f\u60c5\u5206\u6790\u624b\u6cd5\u3068\u306e\u6bd4\u8f03\u3068\u4f7f\u3044\u5206\u3051<\/h3>\n\n\n\n<p>VADER\u306f\u3001\u30eb\u30fc\u30eb\u30d9\u30fc\u30b9\u306e\u611f\u60c5\u5206\u6790\u624b\u6cd5\u3067\u3059\u304c\u3001\u4ed6\u306b\u3082\u69d8\u3005\u306a\u624b\u6cd5\u304c\u3042\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<ul 
class=\"wp-block-list\">\n<li>\u6a5f\u68b0\u5b66\u7fd2\u30e2\u30c7\u30eb<\/li>\n\n\n\n<li>\u30ca\u30a4\u30fc\u30d6\u30d9\u30a4\u30ba\u3001SVM\u3001\u30ed\u30b8\u30b9\u30c6\u30a3\u30c3\u30af\u56de\u5e30\u306a\u3069<\/li>\n\n\n\n<li>\u30e9\u30d9\u30eb\u4ed8\u304d\u30c7\u30fc\u30bf\u304b\u3089\u3001\u30c6\u30ad\u30b9\u30c8\u306e\u7279\u5fb4\u91cf\u3068\u611f\u60c5\u30e9\u30d9\u30eb\u306e\u95a2\u4fc2\u3092\u5b66\u7fd2\u3059\u308b<\/li>\n\n\n\n<li>\u30cb\u30e5\u30fc\u30e9\u30eb\u30cd\u30c3\u30c8\u30ef\u30fc\u30af<\/li>\n\n\n\n<li>CNN\u3001RNN\u3001LSTM\u306a\u3069<\/li>\n\n\n\n<li>\u30c6\u30ad\u30b9\u30c8\u306e\u7279\u5fb4\u3092\u81ea\u52d5\u3067\u62bd\u51fa\u3057\u3001\u611f\u60c5\u30e9\u30d9\u30eb\u3092\u4e88\u6e2c\u3059\u308b<\/li>\n\n\n\n<li>\u30a2\u30f3\u30b5\u30f3\u30d6\u30eb\u5b66\u7fd2<\/li>\n\n\n\n<li>\u8907\u6570\u306e\u624b\u6cd5\u3092\u7d44\u307f\u5408\u308f\u305b\u3066\u3001\u7cbe\u5ea6\u3092\u5411\u4e0a\u3055\u305b\u308b<\/li>\n<\/ul>\n\n\n\n<p>\u6a5f\u68b0\u5b66\u7fd2\u3084\u30cb\u30e5\u30fc\u30e9\u30eb\u30cd\u30c3\u30c8\u30ef\u30fc\u30af\u3092\u4f7f\u3046\u5834\u5408\u306f\u3001\u5927\u91cf\u306e\u30e9\u30d9\u30eb\u4ed8\u304d\u30c7\u30fc\u30bf\u304c\u5fc5\u8981\u3067\u3059\u3002\u4e00\u65b9\u3001VADER\u306e\u3088\u3046\u306a\u30eb\u30fc\u30eb\u30d9\u30fc\u30b9\u306e\u624b\u6cd5\u306f\u3001\u30e9\u30d9\u30eb\u4ed8\u304d\u30c7\u30fc\u30bf\u304c\u306a\u304f\u3066\u3082\u4f7f\u3048\u308b\u306e\u304c\u5229\u70b9\u3067\u3059\u3002<\/p>\n\n\n\n<p>\u5206\u6790\u5bfe\u8c61\u306e\u30c6\u30ad\u30b9\u30c8\u306e\u7279\u6027\u3084\u3001\u5229\u7528\u53ef\u80fd\u306a\u30ea\u30bd\u30fc\u30b9\u3001\u6c42\u3081\u308b\u7cbe\u5ea6\u306a\u3069\u3092\u8003\u616e\u3057\u3066\u3001\u9069\u5207\u306a\u624b\u6cd5\u3092\u9078\u3076\u3053\u3068\u304c\u91cd\u8981\u3067\u3059\u3002<\/p>\n\n\n\n<p>\u4ee5\u4e0a\u3001NLTK\u3092\u4f7f\u3063\u305f\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u306e\u524d\u51e6\u7406\u3068\u30ab\u30b9\u30bf\u30de\u30a4\u30ba\u3001\u4ed6\u306e\u611f\u60c5\u5206\u6790\
u624b\u6cd5\u3068\u306e\u6bd4\u8f03\u306b\u3064\u3044\u3066\u89e3\u8aac\u3057\u307e\u3057\u305f\u3002\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u3084\u6a5f\u68b0\u5b66\u7fd2\u306e\u77e5\u8b58\u3092\u6df1\u3081\u306a\u304c\u3089\u3001\u611f\u60c5\u5206\u6790\u306e\u7cbe\u5ea6\u5411\u4e0a\u306b\u53d6\u308a\u7d44\u3093\u3067\u3044\u304d\u307e\u3057\u3087\u3046\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\" id=\"i-17\">\u307e\u3068\u3081\uff1aNLTK\u3067\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u3092\u30de\u30b9\u30bf\u30fc\u3057\u3088\u3046<\/h2>\n\n\n\n<p>\u672c\u8a18\u4e8b\u3067\u306f\u3001NLTK\u3092\u4f7f\u3063\u305f\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u306e\u57fa\u790e\u304b\u3089\u5fdc\u7528\u307e\u3067\u3092\u89e3\u8aac\u3057\u3066\u304d\u307e\u3057\u305f\u3002Python\u306e\u30b3\u30fc\u30c9\u3092\u5b9f\u969b\u306b\u66f8\u304d\u306a\u304c\u3089\u3001\u30cd\u30ac\u30dd\u30b8\u5206\u6790\u306e\u5b9f\u88c5\u65b9\u6cd5\u3092\u5b66\u3073\u307e\u3057\u305f\u3002\u307e\u305f\u3001\u524d\u51e6\u7406\u306e\u30c6\u30af\u30cb\u30c3\u30af\u3084\u30cd\u30ac\u30dd\u30b8\u5224\u5b9a\u306e\u30ab\u30b9\u30bf\u30de\u30a4\u30ba\u65b9\u6cd5\u3001\u4ed6\u306e\u611f\u60c5\u5206\u6790\u624b\u6cd5\u3068\u306e\u6bd4\u8f03\u3082\u884c\u3044\u307e\u3057\u305f\u3002<\/p>\n\n\n\n<p>NLTK\u306f\u3001\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306e\u305f\u3081\u306e\u5305\u62ec\u7684\u306a\u30e9\u30a4\u30d6\u30e9\u30ea\u3067\u3001\u8c4a\u5bcc\u306a\u30b3\u30fc\u30d1\u30b9\u3068\u7d44\u307f\u8fbc\u307f\u306e\u30ea\u30bd\u30fc\u30b9\u3092\u63d0\u4f9b\u3057\u3066\u3044\u307e\u3059\u3002\u6559\u80b2\u7528\u306b\u6700\u9069\u306a\u8a2d\u8a08\u304c\u306a\u3055\u308c\u3066\u304a\u308a\u3001Python\u3068\u306e\u89aa\u548c\u6027\u3082\u9ad8\u3044\u3067\u3059\u3002\u30aa\u30fc\u30d7\u30f3\u30bd\u30fc\u30b9\u3067\u6d3b\u767a\u306a\u30b3\u30df\u30e5\u30cb\u30c6\u30a3\u306b\u652f\u3048\u3089\u308c\u3066\u3044\u308b\u306e\u3082\u5927\u304d\u306a\u5229\u70b9\u3067\u3059\u3002<\/p>\n\n\n\n<p>\u30bb\u30f3
\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u306f\u3001\u30bd\u30fc\u30b7\u30e3\u30eb\u30e1\u30c7\u30a3\u30a2\u5206\u6790\u3001\u5546\u54c1\u30ec\u30d3\u30e5\u30fc\u5206\u6790\u3001\u6620\u753b\u30fb\u66f8\u7c4d\u306e\u8a55\u4fa1\u5206\u6790\u306a\u3069\u3001\u69d8\u3005\u306a\u5206\u91ce\u3067\u6d3b\u7528\u3055\u308c\u3066\u3044\u307e\u3059\u3002\u9867\u5ba2\u306e\u611f\u60c5\u3092\u7406\u89e3\u3057\u3001\u30d3\u30b8\u30cd\u30b9\u306e\u610f\u601d\u6c7a\u5b9a\u306b\u5f79\u7acb\u3066\u308b\u3053\u3068\u304c\u3067\u304d\u307e\u3059\u3002\u91d1\u878d\u5e02\u5834\u306e\u5206\u6790\u306b\u3082\u5fdc\u7528\u3055\u308c\u3001\u30cb\u30e5\u30fc\u30b9\u3084\u6295\u8cc7\u5bb6\u306e\u611f\u60c5\u304c\u5e02\u5834\u306b\u4e0e\u3048\u308b\u5f71\u97ff\u3092\u628a\u63e1\u3059\u308b\u3053\u3068\u304c\u3067\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<p>\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306b\u306f\u3001\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u4ee5\u5916\u306b\u3082\u3001\u6a5f\u68b0\u7ffb\u8a33\u3001\u60c5\u5831\u691c\u7d22\u3001\u8981\u7d04\u751f\u6210\u3001\u30c1\u30e3\u30c3\u30c8\u30dc\u30c3\u30c8\u306a\u3069\u3001\u69d8\u3005\u306a\u5fdc\u7528\u5206\u91ce\u304c\u3042\u308a\u307e\u3059\u3002NLTK\u3092\u5b66\u3076\u3053\u3068\u306f\u3001\u3053\u308c\u3089\u306e\u5206\u91ce\u3078\u306e\u7b2c\u4e00\u6b69\u3068\u306a\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<p>NLTK\u3068\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u306e\u5b66\u7fd2\u3092\u6df1\u3081\u308b\u305f\u3081\u306b\u3001\u4ee5\u4e0b\u306e\u3088\u3046\u306a\u30b9\u30c6\u30c3\u30d7\u3092\u63a8\u5968\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li>NLTK\u306e\u516c\u5f0f\u30c9\u30ad\u30e5\u30e1\u30f3\u30c8\u3068\u30c1\u30e5\u30fc\u30c8\u30ea\u30a2\u30eb\u3092\u8aad\u3080\n<ul class=\"wp-block-list\">\n<li><a 
href=\"https:\/\/www.nltk.org\/\">https:\/\/www.nltk.org\/<\/a><\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>Python\u306b\u3088\u308b\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u5165\u9580\u306e\u66f8\u7c4d\u3092\u8aad\u3080\n<ul class=\"wp-block-list\">\n<li>\u201cNatural Language Processing with Python\u201d (Steven Bird, Ewan Klein, Edward Loper)<\/li>\n\n\n\n<li>\u201cPython Natural Language Processing\u201d (Jalaj Thanaki)<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>\u30aa\u30f3\u30e9\u30a4\u30f3\u30b3\u30fc\u30b9\u3092\u53d7\u8b1b\u3059\u308b\n<ul class=\"wp-block-list\">\n<li>\u201cNatural Language Processing with Python\u201d (Udemy)<\/li>\n\n\n\n<li>\u201cNatural Language Processing Specialization\u201d (Coursera)<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306e\u7814\u7a76\u8ad6\u6587\u3092\u8aad\u3080\n<ul class=\"wp-block-list\">\n<li>ACL (Association for Computational Linguistics) Anthology\u306a\u3069<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li>\u5b9f\u969b\u306e\u30c7\u30fc\u30bf\u3092\u4f7f\u3063\u3066\u3001\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u306e\u30d7\u30ed\u30b8\u30a7\u30af\u30c8\u306b\u53d6\u308a\u7d44\u3080\n<ul 
class=\"wp-block-list\">\n<li>Twitter\u306e\u30c4\u30a4\u30fc\u30c8\u3001Amazon\u5546\u54c1\u30ec\u30d3\u30e5\u30fc\u3001IMDb\u306e\u6620\u753b\u30ec\u30d3\u30e5\u30fc\u306a\u3069<\/li>\n<\/ul>\n<\/li>\n<\/ol>\n\n\n\n<p>\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306e\u5206\u91ce\u306f\u3001\u6025\u901f\u306b\u767a\u5c55\u3057\u3066\u3044\u307e\u3059\u3002NLTK\u3092\u51fa\u767a\u70b9\u306b\u3001\u6700\u65b0\u306e\u7814\u7a76\u52d5\u5411\u306b\u3082\u6ce8\u76ee\u3057\u306a\u304c\u3089\u3001\u5b66\u7fd2\u3092\u7d9a\u3051\u3066\u3044\u304d\u307e\u3057\u3087\u3046\u3002\u6a5f\u68b0\u5b66\u7fd2\u3084\u30c7\u30a3\u30fc\u30d7\u30e9\u30fc\u30cb\u30f3\u30b0\u306e\u77e5\u8b58\u3092\u6df1\u3081\u308b\u3053\u3068\u3067\u3001\u3088\u308a\u9ad8\u5ea6\u306a\u611f\u60c5\u5206\u6790\u30e2\u30c7\u30eb\u3092\u69cb\u7bc9\u3059\u308b\u3053\u3068\u304c\u3067\u304d\u308b\u3067\u3057\u3087\u3046\u3002<\/p>\n\n\n\n<p>\u7686\u3055\u3093\u306e\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u30de\u30b9\u30bf\u30fc\u3078\u306e\u65c5\u3092\u5fdc\u63f4\u3057\u3066\u3044\u307e\u3059\uff01<\/p>\n","protected":false},"excerpt":{"rendered":"<p>Python\u3067AI\u3084\u6a5f\u68b0\u5b66\u7fd2\u306b\u53d6\u308a\u7d44\u3080\u4e0a\u3067\u3001\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u306f\u907f\u3051\u3066\u901a\u308c\u306a\u3044\u5206\u91ce\u3067\u3059\u3002\u4e2d\u3067\u3082\u3001\u30c6\u30ad\u30b9\u30c8\u30c7\u30fc\u30bf\u304b\u3089\u611f\u60c5\u3092\u62bd\u51fa\u3059\u308b\u30bb\u30f3\u30c1\u30e1\u30f3\u30c8\u5206\u6790\u306f\u3001\u30d3\u30b8\u30cd\u30b9\u3067\u306e\u6d3b\u7528\u5834\u9762\u304c\u591a\u304f\u3001\u6ce8\u76ee\u3092\u96c6\u3081\u3066\u3044\u307e\u3059\u3002\u672c\u8a18\u4e8b\u3067\u306f\u3001Python\u306e\u81ea\u7136 &#8230; 
<\/p>\n","protected":false},"author":1,"featured_media":614,"comment_status":"closed","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[4],"tags":[],"class_list":{"0":"post-612","1":"post","2":"type-post","3":"status-publish","4":"format-standard","5":"has-post-thumbnail","7":"category-python"},"_links":{"self":[{"href":"https:\/\/chocottopro.com\/index.php?rest_route=\/wp\/v2\/posts\/612","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/chocottopro.com\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/chocottopro.com\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/chocottopro.com\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/chocottopro.com\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=612"}],"version-history":[{"count":2,"href":"https:\/\/chocottopro.com\/index.php?rest_route=\/wp\/v2\/posts\/612\/revisions"}],"predecessor-version":[{"id":615,"href":"https:\/\/chocottopro.com\/index.php?rest_route=\/wp\/v2\/posts\/612\/revisions\/615"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/chocottopro.com\/index.php?rest_route=\/wp\/v2\/media\/614"}],"wp:attachment":[{"href":"https:\/\/chocottopro.com\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=612"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/chocottopro.com\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=612"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/chocottopro.com\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=612"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}