{"id":3075,"date":"2022-04-15T15:28:50","date_gmt":"2022-04-15T06:28:50","guid":{"rendered":"https:\/\/aiacademy.jp\/media\/?p=3075"},"modified":"2024-01-19T14:08:18","modified_gmt":"2024-01-19T05:08:18","slug":"%e3%80%90%e8%87%aa%e7%84%b6%e8%a8%80%e8%aa%9e%e5%87%a6%e7%90%86%e3%80%91tf-idf%e3%81%a8%e3%81%af","status":"publish","type":"post","link":"https:\/\/aiacademy.jp\/media\/?p=3075","title":{"rendered":"\u3010\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u3011TF-IDF\u3068\u306f"},"content":{"rendered":"\n<div class=\"toc\">    <div id=\"toc_container\" class=\"sgb-toc--no-bullets js-smooth-scroll\" data-dialog-title=\"Table of Contents\">\n      <p class=\"toc_title\">\u76ee\u6b21 <\/p>\n      <ul class=\"toc_list\">  <li class=\"first\">    <span><\/span>    <ul class=\"menu_level_1\">      <li class=\"first last\">        <a href=\"#i-0\"> TF-IDF\u3068\u306f<\/a>      <\/li>    <\/ul>  <\/li>  <li class=\"last\">    <a href=\"#i-1\">\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u3092\u5b66\u3076\u306b\u306f<\/a>  <\/li><\/ul>\n      \n    <\/div><\/div><div class=\"toc\"><p><\/p>\n<\/div><h2 class=\"wp-block-heading\" id=\"i-0\"> TF-IDF\u3068\u306f<\/h2>\n\n\n\n<p>TF-IDF\uff08tf-idf; term frequency \u2013 inverse document frequency\uff09\u3068\u306f\u3001<strong>\u6587\u66f8\u4e2d\u306b\u542b\u307e\u308c\u308b\u5358\u8a9e\u306e\u91cd\u8981\u5ea6\u3092\u8a55\u4fa1\u3059\u308b\u624b\u6cd5\u306e1\u3064\u3067\u3001\u5358\u8a9e\u306e\u91cd\u8981\u5ea6\u3092\u7b97\u51fa\u3057\u305f\u3044\u5834\u5408\u306b\u7528\u3044\u3089\u308c\u307e\u3059\u3002<\/strong><\/p>\n\n\n\n<p>Python\u3067\u306fscikit-learn\u306e<a href=\"https:\/\/scikit-learn.org\/stable\/modules\/generated\/sklearn.feature_extraction.text.TfidfVectorizer.html\" rel=\"nofollow noopener\" target=\"_blank\">TfidfVectorizer<\/a>\u306a\u3069\u3092\u7528\u3044\u308b\u3053\u3068\u3067\u3001\u8a08\u7b97\u51fa\u6765\u307e\u3059\u3002<\/p>\n\n\n\n<p><\/p>\n\n\n\n<p><a 
href=\"https:\/\/aiacademy.jp\/media\/?p=3068\">\u95a2\u9023\uff1aBag of Words\u3068\u306f<\/a><\/p>\n\n\n\n<p><a href=\"https:\/\/aiacademy.jp\/media\/?p=1916\">\u95a2\u9023\uff1a&nbsp;scikit-learn\uff08sklearn\uff09\u3068\u306f\uff1f<\/a><\/p>\n\n\n\n<p><a href=\"https:\/\/aiacademy.jp\/texts\/#natural\" title=\"\u95a2\u9023\uff1a\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7de8\">\u95a2\u9023\uff1a\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7de8<\/a><\/p>\n\n\n\n<p><\/p>\n\n\n\n<h1 class=\"wp-block-heading\" id=\"i-1\">\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u3092\u5b66\u3076\u306b\u306f<\/h1>\n\n\n\n<p>\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u3092\u5b66\u3076\u306b\u9650\u3089\u305a\u3001\u6a5f\u68b0\u5b66\u7fd2\u6280\u8853\u3092\u5b66\u3076\u4e0a\u3067\u304a\u3059\u3059\u3081\u306a\u306e\u306f\u3001\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2\u306b\u3044\u3064\u3067\u3082\u8cea\u554f\u3067\u304d\u308b\u74b0\u5883\u3067\u5b66\u3076\u3053\u3068\u3067\u3059\u3002<\/p>\n\n\n\n<p><a href=\"https:\/\/aiacademy.jp\/bootcamp\">AI Academy Bootcamp<\/a>\u306a\u3089\u3001<a rel=\"noreferrer noopener\" href=\"https:\/\/aiacademy.jp\/bootcamp\" 
target=\"_blank\">\uff16\u30f6\u670835,000\u5186\u306b\u3066\u30c1\u30e3\u30c3\u30c8\u3067\u8cea\u554f\u3057\u653e\u984c\u306e\u74b0\u5883\u3067\u3001\u6a5f\u68b0\u5b66\u7fd2\u3084\u30c7\u30fc\u30bf\u5206\u6790\u304c\u5b66\u3079\u308b\u30b5\u30fc\u30d3\u30b9<\/a>\u3092\u63d0\u4f9b\u3057\u3066\u304a\u308a\u307e\u3059\u3002<br>\u6570\u5341\u540d\u5728\u7c4d\u3057\u3066\u3044\u308b\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3084\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2\u306b\u8cea\u554f\u3057\u653e\u984c\u306e\u74b0\u5883\u3067\u30c7\u30fc\u30bf\u5206\u6790\u3001\u7d71\u8a08\u3001\u6a5f\u68b0\u5b66\u7fd2\u3001SQL\u7b49\u304c\u5b66\u3079\u307e\u3059\u3002AI\u4eba\u6750\u306b\u5fc5\u8981\u306a\u30b9\u30ad\u30eb\u3092\u52b9\u7387\u3088\u304f\u4f53\u7cfb\u7684\u306b\u8eab\u306b\u4ed8\u3051\u305f\u3044\u65b9\u306f\u662f\u975e\u3054\u691c\u8a0e\u304f\u3060\u3055\u3044\u3002<\/p>\n\n\n\n<figure class=\"wp-block-image\"><a href=\"https:\/\/aiacademy.jp\/bootcamp\"><img loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"341\" src=\"https:\/\/aiacademy.jp\/media\/wp-content\/uploads\/2021\/12\/bootcamp_ad_72ppi-1024x341.png\" alt=\"\" class=\"wp-image-691\" srcset=\"https:\/\/aiacademy.jp\/media\/wp-content\/uploads\/2021\/12\/bootcamp_ad_72ppi-1024x341.png 1024w, https:\/\/aiacademy.jp\/media\/wp-content\/uploads\/2021\/12\/bootcamp_ad_72ppi-300x100.png 300w, https:\/\/aiacademy.jp\/media\/wp-content\/uploads\/2021\/12\/bootcamp_ad_72ppi-768x256.png 768w, https:\/\/aiacademy.jp\/media\/wp-content\/uploads\/2021\/12\/bootcamp_ad_72ppi-940x313.png 940w, https:\/\/aiacademy.jp\/media\/wp-content\/uploads\/2021\/12\/bootcamp_ad_72ppi.png 1200w\" sizes=\"auto, (max-width: 1024px) 100vw, 1024px\"><\/a><\/figure>\n","protected":false},"excerpt":{"rendered":"<p>\u76ee\u6b21 TF-IDF\u3068\u306f \u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u3092\u5b66\u3076\u306b\u306f TF-IDF\u3068\u306f TF-IDF\uff08tf-idf; term frequency \u2013 inverse document 
frequency\uff09\u3068\u306f\u3001\u6587\u66f8\u4e2d\u306b\u542b\u307e\u308c\u308b\u5358\u8a9e\u306e\u91cd\u8981\u5ea6\u3092 &#8230; <\/p>\n","protected":false},"author":1,"featured_media":3077,"comment_status":"closed","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[85,154,137],"tags":[],"class_list":{"0":"post-3075","1":"post","2":"type-post","3":"status-publish","4":"format-standard","5":"has-post-thumbnail","7":"category-python","8":"category-154","9":"category-137"},"_links":{"self":[{"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=\/wp\/v2\/posts\/3075","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=3075"}],"version-history":[{"count":3,"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=\/wp\/v2\/posts\/3075\/revisions"}],"predecessor-version":[{"id":3988,"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=\/wp\/v2\/posts\/3075\/revisions\/3988"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=\/wp\/v2\/media\/3077"}],"wp:attachment":[{"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=3075"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=3075"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/aiacademy.jp\/media\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=3075"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}