{"id":701,"date":"2024-03-21T12:02:46","date_gmt":"2024-03-21T03:02:46","guid":{"rendered":"https:\/\/elosove.com\/?p=701"},"modified":"2024-04-10T17:12:11","modified_gmt":"2024-04-10T08:12:11","slug":"silero-vad%e3%81%ae%e4%bd%bf%e3%81%84%e6%96%b9-%e9%9f%b3%e5%a3%b0%e5%8c%ba%e9%96%93%e8%aa%8d%e8%ad%98","status":"publish","type":"post","link":"https:\/\/elosove.com\/?p=701","title":{"rendered":"Silero VAD\u306e\u4f7f\u3044\u65b9 | \u97f3\u58f0\u533a\u9593\u8a8d\u8b58"},"content":{"rendered":"\n<p class=\"wp-block-paragraph\">whisper\u3084rinna\u306a\u3069\u306e\u91cd\u3044\u97f3\u58f0\u8a8d\u8b58\u51e6\u7406\u3092\u3059\u308b\u524d\u306b\u3001\u30b5\u30a6\u30f3\u30c9\u30d5\u30a1\u30a4\u30eb\u5185\u3067\u767a\u8a71\u90e8\u5206\u306e\u307f\u3092\u629c\u304d\u53d6\u308b\u8efd\u3044\u51e6\u7406\u3092\u631f\u307f\u305f\u3044\u6642\u304c\u3042\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">\u8abf\u3079\u305f\u6642\u70b9\u3067\u3059\u3050\u306b\u5b9f\u88c5\u51fa\u6765\u305d\u3046\u306a\u96f0\u56f2\u6c17\u306e\u3082\u306e\u306f\u4e0b\u8a18\u306e5\u3064\u3050\u3089\u3044\u3002<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li><a href=\"https:\/\/qiita.com\/oozzZZZZ\/items\/4685648b2a674c375703\">N cross\u6cd5 (python) | Qiita<\/a> <\/li>\n\n\n\n<li><a href=\"https:\/\/qiita.com\/ikuo0\/items\/0d5798db824f3df074af\">\u97f3\u58f0\u6709\u52b9\u533a\u9593\u3068\u30e2\u30fc\u30e9\u306e\u691c\u51fa (Python) | Qiita<\/a> <\/li>\n\n\n\n<li><a href=\"https:\/\/github.com\/wiseman\/py-webrtcvad\">py-webrtcvad | github<\/a> <\/li>\n\n\n\n<li><a href=\"https:\/\/github.com\/ina-foss\/inaSpeechSegmenter\">inaSpeechSegmenter | github<\/a> <\/li>\n\n\n\n<li><a href=\"https:\/\/github.com\/snakers4\/silero-vad\">silero-vad  | github<\/a> <\/li>\n<\/ul>\n\n\n\n<p class=\"wp-block-paragraph\">\u4eca\u56de\u306f\u624b\u6301\u3061\u306e\u97f3\u58f0\u30d5\u30a1\u30a4\u30eb\u3068\u76f8\u6027\u304c\u826f\u304b\u3063\u305fSilero 
VAD\u3092\u4f7f\u3063\u3066\u307f\u305f\u306e\u3067\u3059\u304c\u3001\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u5185\u5bb9\u4ee5\u5916\u306e\u65e5\u672c\u8a9e\u8a18\u4e8b\u304c\u5c11\u306a\u304b\u3063\u305f\u306e\u3067\u4f7f\u3044\u65b9\u306b\u3064\u3044\u3066\u66f8\u3044\u3066\u307f\u307e\u3057\u305f\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">\u60f3\u5b9a\u74b0\u5883\u306fWindows\u3067\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\"><\/p>\n\n\n\n<div id=\"ez-toc-container\" class=\"ez-toc-v2_0_71 counter-hierarchy ez-toc-counter ez-toc-grey ez-toc-container-direction\">\n<div class=\"ez-toc-title-container\">\n<p class=\"ez-toc-title\" style=\"cursor:inherit\">Table of Contents<\/p>\n<span class=\"ez-toc-title-toggle\"><a href=\"#\" class=\"ez-toc-pull-right ez-toc-btn ez-toc-btn-xs ez-toc-btn-default ez-toc-toggle\" aria-label=\"Toggle Table of Content\"><span class=\"ez-toc-js-icon-con\"><span class=\"\"><span class=\"eztoc-hide\" style=\"display:none;\">Toggle<\/span><span class=\"ez-toc-icon-toggle-span\"><svg style=\"fill: #999;color:#999\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\" class=\"list-377408\" width=\"20px\" height=\"20px\" viewBox=\"0 0 24 24\" fill=\"none\"><path d=\"M6 6H4v2h2V6zm14 0H8v2h12V6zM4 11h2v2H4v-2zm16 0H8v2h12v-2zM4 16h2v2H4v-2zm16 0H8v2h12v-2z\" fill=\"currentColor\"><\/path><\/svg><svg style=\"fill: #999;color:#999\" class=\"arrow-unsorted-368013\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"10px\" height=\"10px\" viewBox=\"0 0 24 24\" version=\"1.2\" baseProfile=\"tiny\"><path d=\"M18.2 9.3l-6.2-6.3-6.2 6.3c-.2.2-.3.4-.3.7s.1.5.3.7c.2.2.4.3.7.3h11c.3 0 .5-.1.7-.3.2-.2.3-.5.3-.7s-.1-.5-.3-.7zM5.8 14.7l6.2 6.3 6.2-6.3c.2-.2.3-.5.3-.7s-.1-.5-.3-.7c-.2-.2-.4-.3-.7-.3h-11c-.3 0-.5.1-.7.3-.2.2-.3.5-.3.7s.1.5.3.7z\"\/><\/svg><\/span><\/span><\/span><\/a><\/span><\/div>\n<nav><ul class='ez-toc-list ez-toc-list-level-1 ' ><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-1\" 
href=\"https:\/\/elosove.com\/?p=701\/#%E3%82%A4%E3%83%B3%E3%82%B9%E3%83%88%E3%83%BC%E3%83%AB\" title=\"\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\">\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-2'><a class=\"ez-toc-link ez-toc-heading-2\" href=\"https:\/\/elosove.com\/?p=701\/#utils_vadpy%E3%81%AE%E4%BD%BF%E3%81%84%E6%96%B9\" title=\"utils_vad.py\u306e\u4f7f\u3044\u65b9\">utils_vad.py\u306e\u4f7f\u3044\u65b9<\/a><ul class='ez-toc-list-level-3' ><li class='ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-3\" href=\"https:\/\/elosove.com\/?p=701\/#%E3%83%A2%E3%83%87%E3%83%AB%E3%81%AE%E3%83%AD%E3%83%BC%E3%83%89\" title=\"\u30e2\u30c7\u30eb\u306e\u30ed\u30fc\u30c9\">\u30e2\u30c7\u30eb\u306e\u30ed\u30fc\u30c9<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-4\" href=\"https:\/\/elosove.com\/?p=701\/#%E3%83%95%E3%82%A1%E3%82%A4%E3%83%AB%E3%81%AE%E8%AA%AD%E3%81%BF%E8%BE%BC%E3%81%BF\" title=\"\u30d5\u30a1\u30a4\u30eb\u306e\u8aad\u307f\u8fbc\u307f\">\u30d5\u30a1\u30a4\u30eb\u306e\u8aad\u307f\u8fbc\u307f<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-5\" href=\"https:\/\/elosove.com\/?p=701\/#%E6%A4%9C%E5%87%BA\" title=\"\u691c\u51fa\">\u691c\u51fa<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-6\" href=\"https:\/\/elosove.com\/?p=701\/#%E6%A4%9C%E5%87%BA%E3%81%AE%E9%80%B2%E6%8D%97%E8%A1%A8%E7%A4%BA\" title=\"\u691c\u51fa\u306e\u9032\u6357\u8868\u793a\">\u691c\u51fa\u306e\u9032\u6357\u8868\u793a<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-7\" href=\"https:\/\/elosove.com\/?p=701\/#%E6%A4%9C%E5%87%BA%E5%8C%BA%E9%96%93%E3%81%AE%E4%BF%9D%E5%AD%98\" title=\"\u691c\u51fa\u533a\u9593\u306e\u4fdd\u5b58\">\u691c\u51fa\u533a\u9593\u306e\u4fdd\u5b58<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link 
ez-toc-heading-8\" href=\"https:\/\/elosove.com\/?p=701\/#%E7%99%BA%E8%A9%B1%E5%8C%BA%E9%96%93%E3%81%AE%E5%8F%AF%E8%A6%96%E5%8C%96\" title=\"\u767a\u8a71\u533a\u9593\u306e\u53ef\u8996\u5316\">\u767a\u8a71\u533a\u9593\u306e\u53ef\u8996\u5316<\/a><\/li><li class='ez-toc-page-1 ez-toc-heading-level-3'><a class=\"ez-toc-link ez-toc-heading-9\" href=\"https:\/\/elosove.com\/?p=701\/#stream%E5%87%A6%E7%90%86\" title=\"stream\u51e6\u7406\">stream\u51e6\u7406<\/a><\/li><\/ul><\/li><\/ul><\/nav><\/div>\n<h2 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"%E3%82%A4%E3%83%B3%E3%82%B9%E3%83%88%E3%83%BC%E3%83%AB\"><\/span>\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<span class=\"ez-toc-section-end\"><\/span><\/h2>\n\n\n\n<p class=\"wp-block-paragraph\"><a href=\"https:\/\/github.com\/snakers4\/silero-vad\/wiki\/Examples-and-Dependencies#dependencies\">\u516c\u5f0f\u306b\u5f93\u3044<\/a>\u30e9\u30a4\u30d6\u30e9\u30ea\u3092\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>pytorch &gt;= 1.12.0  | \u4eca\u56de\u306f2.2.1+cu118\u3092\u4f7f\u7528<\/li>\n\n\n\n<li>torchaudio &gt;= 0.9.0  | \u4eca\u56de\u306f2.2.1+cu118\u3092\u4f7f\u7528<\/li>\n<\/ul>\n\n\n\n<p class=\"wp-block-paragraph\">\u30e2\u30c7\u30eb\u306e\u30c0\u30a6\u30f3\u30ed\u30fc\u30c9\u306fpython\u30b3\u30fc\u30c9\u3067\u5b9f\u884c\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">(\u624b\u52d5\u3067\u76f4\u63a5\u30e2\u30c7\u30eb\u3092DL\u3059\u308b\u5834\u5408\u306f<a href=\"https:\/\/github.com\/snakers4\/silero-vad\/tree\/master\/files\">\u3053\u3053\u304b\u3089<\/a>\u3002)<\/p>\n\n\n\n<div class=\"wp-block-kevinbatdorf-code-block-pro\" data-code-block-pro-font-family=\"Code-Pro-JetBrains-Mono\" style=\"font-size:.875rem;font-family:Code-Pro-JetBrains-Mono,ui-monospace,SFMono-Regular,Menlo,Monaco,Consolas,monospace;line-height:1.25rem;--cbp-tab-width:2;tab-size:var(--cbp-tab-width, 2)\"><span style=\"display:block;padding:16px 0 0 
16px;margin-bottom:-1px;width:100%;text-align:left;background-color:#1E1E1E\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"54\" height=\"14\" viewBox=\"0 0 54 14\"><g fill=\"none\" fill-rule=\"evenodd\" transform=\"translate(1 1)\"><circle cx=\"6\" cy=\"6\" r=\"6\" fill=\"#FF5F56\" stroke=\"#E0443E\" stroke-width=\".5\"><\/circle><circle cx=\"26\" cy=\"6\" r=\"6\" fill=\"#FFBD2E\" stroke=\"#DEA123\" stroke-width=\".5\"><\/circle><circle cx=\"46\" cy=\"6\" r=\"6\" fill=\"#27C93F\" stroke=\"#1AAB29\" stroke-width=\".5\"><\/circle><\/g><\/svg><\/span><span role=\"button\" tabindex=\"0\" data-code=\"import torch\n# download example\ntorch.hub.download_url_to_file('https:\/\/models.silero.ai\/vad_models\/en.wav', 'en_example.wav')\" style=\"color:#D4D4D4;display:none\" aria-label=\"Copy\" class=\"code-block-pro-copy-button\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" style=\"width:24px;height:24px\" fill=\"none\" viewBox=\"0 0 24 24\" stroke=\"currentColor\" stroke-width=\"2\"><path class=\"with-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2m-6 9l2 2 4-4\"><\/path><path class=\"without-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2\"><\/path><\/svg><\/span><pre class=\"shiki dark-plus\" style=\"background-color: #1E1E1E\" tabindex=\"0\"><code><span class=\"line\"><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> torch<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># download example<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">torch.hub.download_url_to_file(<\/span><span style=\"color: #CE9178\">&#39;https:\/\/models.silero.ai\/vad_models\/en.wav&#39;<\/span><span style=\"color: #D4D4D4\">, <\/span><span 
style=\"color: #CE9178\">&#39;en_example.wav&#39;<\/span><span style=\"color: #D4D4D4\">)<\/span><\/span><\/code><\/pre><\/div>\n\n\n\n<p class=\"wp-block-paragraph\">\u4e0a\u8a18\u3092\u5b9f\u884c\u3059\u308b\u3068\u4e0b\u8a18\u306e\u30d5\u30a9\u30eb\u30c0\u306b2\u3064\u306e\u30e2\u30c7\u30eb\u304c\u30c0\u30a6\u30f3\u30ed\u30fc\u30c9\u3055\u308c\u307e\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">&#8220;C:\\Users\\\u81ea\u5206\\.cache\\torch\\hub\\snakers4_silero-vad_master\\files&#8221;<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>jit\u30e2\u30c7\u30eb : silero_vad.jit<\/li>\n\n\n\n<li>ONNX\u30e2\u30c7\u30eb : silero_vad.onnx<\/li>\n<\/ul>\n\n\n\n<p class=\"wp-block-paragraph\">\u30e2\u30c7\u30eb\u306e\u9055\u3044\u306f<a href=\"https:\/\/github.com\/snakers4\/silero-vad\/wiki\/Performance-Metrics#silero-vad-performance-metrics\">\u516c\u5f0f<\/a>\u306b\u3088\u308b\u3068\u3001ONNX\u30e2\u30c7\u30eb\u306e\u65b9\u304c\u30d5\u30a1\u30a4\u30eb\u304c\u91cd\u3044\u5206\u51e6\u7406\u304c4-5\u500d\u901f\u3044\u53ef\u80fd\u6027\u304c\u3042\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">\u3069\u3061\u3089\u306e\u30e2\u30c7\u30eb\u3082CPU1\u30b9\u30ec\u30c3\u30c9\u3067\u52d5\u4f5c\u3055\u305b\u308b\u30d1\u30d5\u30a9\u30fc\u30de\u30f3\u30b9\u306b\u6700\u9069\u5316\u3055\u308c\u3066\u3044\u3066\u65e2\u306b\u91cf\u5b50\u5316\u6e08\u307f\u3067\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">\u4eca\u56de\u306f\u8efd\u3055\u91cd\u8996\u3067jit\u30e2\u30c7\u30eb\u3092\u4f7f\u7528\u3057\u3066\u3044\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">\u3000<\/p>\n\n\n\n<h2 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"utils_vadpy%E3%81%AE%E4%BD%BF%E3%81%84%E6%96%B9\"><\/span>utils_vad.py\u306e\u4f7f\u3044\u65b9<span class=\"ez-toc-section-end\"><\/span><\/h2>\n\n\n\n<p 
class=\"wp-block-paragraph\">\u516c\u5f0f\u901a\u308a\u30c0\u30a6\u30f3\u30ed\u30fc\u30c9\u3059\u308b\u3068\u4e0b\u8a18\u306e\u30d5\u30a9\u30eb\u30c0\u306b\u4e00\u5f0f\u30b3\u30fc\u30c9\u304c\u4fdd\u5b58\u3055\u308c\u3066\u3044\u307e\u3059\u3002<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li>&#8220;C:\\Users\\\u81ea\u5206\\.cache\\torch\\hub\\snakers4_silero-vad_master&#8221;<\/li>\n<\/ul>\n\n\n\n<p class=\"wp-block-paragraph\">\u624b\u52d5\u3067\u30e2\u30c7\u30eb\u3092\u30c0\u30a6\u30f3\u30ed\u30fc\u30c9\u3057\u305f\u5834\u5408\u306f\u4e0b\u8a18\u304b\u3089utils_vad.py\u3092\u6301\u3063\u3066\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<ul class=\"wp-block-list\">\n<li><a href=\"https:\/\/github.com\/snakers4\/silero-vad\/tree\/master\">utils_vad.py<\/a><\/li>\n<\/ul>\n\n\n\n<p class=\"wp-block-paragraph\">\u4ee5\u964d\u306f\u5b9f\u884c\u30d5\u30a1\u30a4\u30eb\u3067utils_vad\u3092\u8aad\u307f\u8fbc\u3093\u3067\u4f7f\u7528\u3059\u308b\u3053\u3068\u3092\u60f3\u5b9a\u3057\u3066\u3044\u307e\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">\u3000<\/p>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"%E3%83%A2%E3%83%87%E3%83%AB%E3%81%AE%E3%83%AD%E3%83%BC%E3%83%89\"><\/span>\u30e2\u30c7\u30eb\u306e\u30ed\u30fc\u30c9<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<div class=\"wp-block-kevinbatdorf-code-block-pro\" data-code-block-pro-font-family=\"Code-Pro-JetBrains-Mono\" style=\"font-size:.875rem;font-family:Code-Pro-JetBrains-Mono,ui-monospace,SFMono-Regular,Menlo,Monaco,Consolas,monospace;line-height:1.25rem;--cbp-tab-width:2;tab-size:var(--cbp-tab-width, 2)\"><span style=\"display:block;padding:16px 0 0 16px;margin-bottom:-1px;width:100%;text-align:left;background-color:#1E1E1E\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"54\" height=\"14\" viewBox=\"0 0 54 14\"><g fill=\"none\" fill-rule=\"evenodd\" transform=\"translate(1 1)\"><circle cx=\"6\" cy=\"6\" r=\"6\" fill=\"#FF5F56\" stroke=\"#E0443E\" 
stroke-width=\".5\"><\/circle><circle cx=\"26\" cy=\"6\" r=\"6\" fill=\"#FFBD2E\" stroke=\"#DEA123\" stroke-width=\".5\"><\/circle><circle cx=\"46\" cy=\"6\" r=\"6\" fill=\"#27C93F\" stroke=\"#1AAB29\" stroke-width=\".5\"><\/circle><\/g><\/svg><\/span><span role=\"button\" tabindex=\"0\" data-code=\"import torch\ntorch.set_num_threads(1)\nfrom utils_vad import init_jit_model\n\n# jit\u30e2\u30c7\u30eb\u306e\u30ed\u30fc\u30c9\nmodel = init_jit_model(os.path.join('&lt;pass to download model&gt;', 'silero_vad.jit'))\" style=\"color:#D4D4D4;display:none\" aria-label=\"Copy\" class=\"code-block-pro-copy-button\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" style=\"width:24px;height:24px\" fill=\"none\" viewBox=\"0 0 24 24\" stroke=\"currentColor\" stroke-width=\"2\"><path class=\"with-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2m-6 9l2 2 4-4\"><\/path><path class=\"without-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2\"><\/path><\/svg><\/span><pre class=\"shiki dark-plus\" style=\"background-color: #1E1E1E\" tabindex=\"0\"><code><span class=\"line\"><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> torch<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">torch.set_num_threads(<\/span><span style=\"color: #B5CEA8\">1<\/span><span style=\"color: #D4D4D4\">)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #C586C0\">from<\/span><span style=\"color: #D4D4D4\"> utils_vad <\/span><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> init_jit_model<\/span><\/span>\n<span class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># 
jit\u30e2\u30c7\u30eb\u306e\u30ed\u30fc\u30c9<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">model = init_jit_model(os.path.join(<\/span><span style=\"color: #CE9178\">&#39;&lt;pass to download model&gt;&#39;<\/span><span style=\"color: #D4D4D4\">, <\/span><span style=\"color: #CE9178\">&#39;silero_vad.jit&#39;<\/span><span style=\"color: #D4D4D4\">))<\/span><\/span><\/code><\/pre><\/div>\n\n\n\n<p class=\"wp-block-paragraph\">\u3000<\/p>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"%E3%83%95%E3%82%A1%E3%82%A4%E3%83%AB%E3%81%AE%E8%AA%AD%E3%81%BF%E8%BE%BC%E3%81%BF\"><\/span>\u30d5\u30a1\u30a4\u30eb\u306e\u8aad\u307f\u8fbc\u307f<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<div class=\"wp-block-kevinbatdorf-code-block-pro\" data-code-block-pro-font-family=\"Code-Pro-JetBrains-Mono\" style=\"font-size:.875rem;font-family:Code-Pro-JetBrains-Mono,ui-monospace,SFMono-Regular,Menlo,Monaco,Consolas,monospace;line-height:1.25rem;--cbp-tab-width:2;tab-size:var(--cbp-tab-width, 2)\"><span style=\"display:block;padding:16px 0 0 16px;margin-bottom:-1px;width:100%;text-align:left;background-color:#1E1E1E\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"54\" height=\"14\" viewBox=\"0 0 54 14\"><g fill=\"none\" fill-rule=\"evenodd\" transform=\"translate(1 1)\"><circle cx=\"6\" cy=\"6\" r=\"6\" fill=\"#FF5F56\" stroke=\"#E0443E\" stroke-width=\".5\"><\/circle><circle cx=\"26\" cy=\"6\" r=\"6\" fill=\"#FFBD2E\" stroke=\"#DEA123\" stroke-width=\".5\"><\/circle><circle cx=\"46\" cy=\"6\" r=\"6\" fill=\"#27C93F\" stroke=\"#1AAB29\" stroke-width=\".5\"><\/circle><\/g><\/svg><\/span><span role=\"button\" tabindex=\"0\" data-code=\"import torch\ntorch.set_num_threads(1)\nfrom utils_vad import read_audio\n\nSAMPLING_RATE = 16000\nwav = read_audio('test.wav', sampling_rate=SAMPLING_RATE)\" style=\"color:#D4D4D4;display:none\" aria-label=\"Copy\" class=\"code-block-pro-copy-button\"><svg 
xmlns=\"http:\/\/www.w3.org\/2000\/svg\" style=\"width:24px;height:24px\" fill=\"none\" viewBox=\"0 0 24 24\" stroke=\"currentColor\" stroke-width=\"2\"><path class=\"with-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2m-6 9l2 2 4-4\"><\/path><path class=\"without-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2\"><\/path><\/svg><\/span><pre class=\"shiki dark-plus\" style=\"background-color: #1E1E1E\" tabindex=\"0\"><code><span class=\"line\"><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> torch<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">torch.set_num_threads(<\/span><span style=\"color: #B5CEA8\">1<\/span><span style=\"color: #D4D4D4\">)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #C586C0\">from<\/span><span style=\"color: #D4D4D4\"> utils_vad <\/span><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> read_audio<\/span><\/span>\n<span class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">SAMPLING_RATE = <\/span><span style=\"color: #B5CEA8\">16000<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">wav = read_audio(<\/span><span style=\"color: #CE9178\">&#39;test.wav&#39;<\/span><span style=\"color: #D4D4D4\">, <\/span><span style=\"color: #9CDCFE\">sampling_rate<\/span><span style=\"color: #D4D4D4\">=SAMPLING_RATE)<\/span><\/span><\/code><\/pre><\/div>\n\n\n\n<p class=\"wp-block-paragraph\">\u5909\u6570wav\u306ftorch.Tensor\u578b\u3067\u3059\u3002<\/p>\n\n\n\n<p 
class=\"wp-block-paragraph\">\u5165\u529b\u30d5\u30a1\u30a4\u30eb\u306e\u30b5\u30f3\u30d7\u30ea\u30f3\u30b0\u30ec\u30fc\u30c8\u306f8kHz\u304b16kHz\u306e\u307f\u306a\u306e\u306744.1kHz\u306e\u5834\u5408\u306fffmpeg\u306a\u3069\u3067\u30b5\u30f3\u30d7\u30ea\u30f3\u30b0\u30ec\u30fc\u30c8\u3092\u4e0b\u3052\u3066\u304b\u3089\u5165\u308c\u308b\u5fc5\u8981\u304c\u3042\u308a\u307e\u3059\u3002<\/p>\n\n\n\n<div class=\"wp-block-kevinbatdorf-code-block-pro\" data-code-block-pro-font-family=\"Code-Pro-JetBrains-Mono\" style=\"font-size:.875rem;font-family:Code-Pro-JetBrains-Mono,ui-monospace,SFMono-Regular,Menlo,Monaco,Consolas,monospace;line-height:1.25rem;--cbp-tab-width:2;tab-size:var(--cbp-tab-width, 2)\"><span style=\"display:block;padding:16px 0 0 16px;margin-bottom:-1px;width:100%;text-align:left;background-color:#1E1E1E\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"54\" height=\"14\" viewBox=\"0 0 54 14\"><g fill=\"none\" fill-rule=\"evenodd\" transform=\"translate(1 1)\"><circle cx=\"6\" cy=\"6\" r=\"6\" fill=\"#FF5F56\" stroke=\"#E0443E\" stroke-width=\".5\"><\/circle><circle cx=\"26\" cy=\"6\" r=\"6\" fill=\"#FFBD2E\" stroke=\"#DEA123\" stroke-width=\".5\"><\/circle><circle cx=\"46\" cy=\"6\" r=\"6\" fill=\"#27C93F\" stroke=\"#1AAB29\" stroke-width=\".5\"><\/circle><\/g><\/svg><\/span><span role=\"button\" tabindex=\"0\" data-code=\"# cmd \u30b5\u30f3\u30d7\u30ea\u30f3\u30b0\u30ec\u30fc\u30c8\u5909\u66f4\u30b5\u30f3\u30d7\u30eb\u30b3\u30de\u30f3\u30c9\nffmpeg -i test.wav -ar 16000 output.wav\" style=\"color:#D4D4D4;display:none\" aria-label=\"Copy\" class=\"code-block-pro-copy-button\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" style=\"width:24px;height:24px\" fill=\"none\" viewBox=\"0 0 24 24\" stroke=\"currentColor\" stroke-width=\"2\"><path class=\"with-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2m-6 9l2 2 
4-4\"><\/path><path class=\"without-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2\"><\/path><\/svg><\/span><pre class=\"shiki dark-plus\" style=\"background-color: #1E1E1E\" tabindex=\"0\"><code><span class=\"line\"><span style=\"color: #6A9955\"># cmd \u30b5\u30f3\u30d7\u30ea\u30f3\u30b0\u30ec\u30fc\u30c8\u5909\u66f4\u30b5\u30f3\u30d7\u30eb\u30b3\u30de\u30f3\u30c9<\/span><\/span>\n<span class=\"line\"><span style=\"color: #DCDCAA\">ffmpeg<\/span><span style=\"color: #D4D4D4\"> <\/span><span style=\"color: #569CD6\">-i<\/span><span style=\"color: #D4D4D4\"> <\/span><span style=\"color: #CE9178\">test.wav<\/span><span style=\"color: #D4D4D4\"> <\/span><span style=\"color: #569CD6\">-ar<\/span><span style=\"color: #D4D4D4\"> <\/span><span style=\"color: #B5CEA8\">16000<\/span><span style=\"color: #D4D4D4\"> <\/span><span style=\"color: #CE9178\">output.wav<\/span><\/span><\/code><\/pre><\/div>\n\n\n\n<p class=\"wp-block-paragraph\">\u3000<\/p>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"%E6%A4%9C%E5%87%BA\"><\/span>\u691c\u51fa<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<div class=\"wp-block-kevinbatdorf-code-block-pro\" data-code-block-pro-font-family=\"Code-Pro-JetBrains-Mono\" style=\"font-size:.875rem;font-family:Code-Pro-JetBrains-Mono,ui-monospace,SFMono-Regular,Menlo,Monaco,Consolas,monospace;line-height:1.25rem;--cbp-tab-width:2;tab-size:var(--cbp-tab-width, 2)\"><span style=\"display:block;padding:16px 0 0 16px;margin-bottom:-1px;width:100%;text-align:left;background-color:#1E1E1E\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"54\" height=\"14\" viewBox=\"0 0 54 14\"><g fill=\"none\" fill-rule=\"evenodd\" transform=\"translate(1 1)\"><circle cx=\"6\" cy=\"6\" r=\"6\" fill=\"#FF5F56\" stroke=\"#E0443E\" stroke-width=\".5\"><\/circle><circle cx=\"26\" cy=\"6\" 
r=\"6\" fill=\"#FFBD2E\" stroke=\"#DEA123\" stroke-width=\".5\"><\/circle><circle cx=\"46\" cy=\"6\" r=\"6\" fill=\"#27C93F\" stroke=\"#1AAB29\" stroke-width=\".5\"><\/circle><\/g><\/svg><\/span><span role=\"button\" tabindex=\"0\" data-code=\"import torch\ntorch.set_num_threads(1)\nfrom utils_vad import get_speech_timestamps\n\nSAMPLING_RATE = 16000\n# \u5909\u6570model\u306finit_jit_model\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b\n# \u5909\u6570wav\u306fread_audio\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b\nspeech_timestamps = get_speech_timestamps(wav, model, sampling_rate=SAMPLING_RATE, return_seconds=True)\" style=\"color:#D4D4D4;display:none\" aria-label=\"Copy\" class=\"code-block-pro-copy-button\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" style=\"width:24px;height:24px\" fill=\"none\" viewBox=\"0 0 24 24\" stroke=\"currentColor\" stroke-width=\"2\"><path class=\"with-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2m-6 9l2 2 4-4\"><\/path><path class=\"without-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2\"><\/path><\/svg><\/span><pre class=\"shiki dark-plus\" style=\"background-color: #1E1E1E\" tabindex=\"0\"><code><span class=\"line\"><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> torch<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">torch.set_num_threads(<\/span><span style=\"color: #B5CEA8\">1<\/span><span style=\"color: #D4D4D4\">)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #C586C0\">from<\/span><span style=\"color: #D4D4D4\"> utils_vad <\/span><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> 
get_speech_timestamps<\/span><\/span>\n<span class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">SAMPLING_RATE = <\/span><span style=\"color: #B5CEA8\">16000<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u5909\u6570model\u306finit_jit_model\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u5909\u6570wav\u306fread_audio\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">speech_timestamps = get_speech_timestamps(wav, model, <\/span><span style=\"color: #9CDCFE\">sampling_rate<\/span><span style=\"color: #D4D4D4\">=SAMPLING_RATE, <\/span><span style=\"color: #9CDCFE\">return_seconds<\/span><span style=\"color: #D4D4D4\">=<\/span><span style=\"color: #569CD6\">True<\/span><span style=\"color: #D4D4D4\">)<\/span><\/span><\/code><\/pre><\/div>\n\n\n\n<p class=\"wp-block-paragraph\">\u51e6\u7406\u304c\u7d42\u308f\u308b\u3068\u5909\u6570speech_timestamps\u306b\u767a\u8a71\u3057\u305f\u30d5\u30a1\u30a4\u30eb\u5185\u3067\u306e\u79d2\u6570\u304c\u4fdd\u5b58\u3055\u308c\u307e\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">\u30d5\u30a9\u30fc\u30de\u30c3\u30c8\u306f\u4e0b\u8a18\u306e\u3088\u3046\u306a\u611f\u3058\u3067\u3001start\u3068end\u30ad\u30fc\u3092\u6301\u3064\u8f9e\u66f8\u8981\u7d20\u306e\u30ea\u30b9\u30c8\u914d\u5217\u304c\u8fd4\u3063\u3066\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">[{&#8216;start&#8217;: 1, &#8216;end&#8217;: 2}, {&#8216;start&#8217;: 5, &#8216;end&#8217;: 8}&#8230;]<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">\u3000<\/p>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"%E6%A4%9C%E5%87%BA%E3%81%AE%E9%80%B2%E6%8D%97%E8%A1%A8%E7%A4%BA\"><\/span>\u691c\u51fa\u306e\u9032\u6357\u8868\u793a<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<div 
class=\"wp-block-kevinbatdorf-code-block-pro\" data-code-block-pro-font-family=\"Code-Pro-JetBrains-Mono\" style=\"font-size:.875rem;font-family:Code-Pro-JetBrains-Mono,ui-monospace,SFMono-Regular,Menlo,Monaco,Consolas,monospace;line-height:1.25rem;--cbp-tab-width:2;tab-size:var(--cbp-tab-width, 2)\"><span style=\"display:block;padding:16px 0 0 16px;margin-bottom:-1px;width:100%;text-align:left;background-color:#1E1E1E\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"54\" height=\"14\" viewBox=\"0 0 54 14\"><g fill=\"none\" fill-rule=\"evenodd\" transform=\"translate(1 1)\"><circle cx=\"6\" cy=\"6\" r=\"6\" fill=\"#FF5F56\" stroke=\"#E0443E\" stroke-width=\".5\"><\/circle><circle cx=\"26\" cy=\"6\" r=\"6\" fill=\"#FFBD2E\" stroke=\"#DEA123\" stroke-width=\".5\"><\/circle><circle cx=\"46\" cy=\"6\" r=\"6\" fill=\"#27C93F\" stroke=\"#1AAB29\" stroke-width=\".5\"><\/circle><\/g><\/svg><\/span><span role=\"button\" tabindex=\"0\" data-code=\"import torch\ntorch.set_num_threads(1)\nfrom utils_vad import get_speech_timestamps\nfrom tqdm import tqdm\n\nSAMPLING_RATE = 16000\npbar = None\n\ndef my_progress_update(progress):\n    # tqdm\u3092\u4f7f\u308f\u306a\u3044\u5834\u5408\u306f\u5358\u306bprogress\u5024\u3092\u8868\u793a\n    # print(f&quot;Progress: {progress}%&quot;)\n    \n    # tqdm\u3092\u4f7f\u3046\u5834\u5408\n    if (pbar is None):\n      pbar = tqdm()\n    pbar.update(progress - pbar.n)\n    \n# \u5909\u6570model\u306finit_jit_model\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b\n# \u5909\u6570wav\u306fread_audio\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b\nspeech_timestamps = get_speech_timestamps(  wav, model,\n                                            sampling_rate=SAMPLING_RATE,\n                                            progress_tracking_callback=my_progress_update)\" style=\"color:#D4D4D4;display:none\" aria-label=\"Copy\" class=\"code-block-pro-copy-button\"><svg 
xmlns=\"http:\/\/www.w3.org\/2000\/svg\" style=\"width:24px;height:24px\" fill=\"none\" viewBox=\"0 0 24 24\" stroke=\"currentColor\" stroke-width=\"2\"><path class=\"with-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2m-6 9l2 2 4-4\"><\/path><path class=\"without-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2\"><\/path><\/svg><\/span><pre class=\"shiki dark-plus\" style=\"background-color: #1E1E1E\" tabindex=\"0\"><code><span class=\"line\"><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> torch<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">torch.set_num_threads(<\/span><span style=\"color: #B5CEA8\">1<\/span><span style=\"color: #D4D4D4\">)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #C586C0\">from<\/span><span style=\"color: #D4D4D4\"> utils_vad <\/span><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> get_speech_timestamps<\/span><\/span>\n<span class=\"line\"><span style=\"color: #C586C0\">from<\/span><span style=\"color: #D4D4D4\"> tqdm <\/span><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> tqdm<\/span><\/span>\n<span class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">SAMPLING_RATE = <\/span><span style=\"color: #B5CEA8\">16000<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">pbar = <\/span><span style=\"color: #569CD6\">None<\/span><\/span>\n<span class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #569CD6\">def<\/span><span style=\"color: #D4D4D4\"> <\/span><span style=\"color: #DCDCAA\">my_progress_update<\/span><span style=\"color: #D4D4D4\">(<\/span><span style=\"color: 
#9CDCFE\">progress<\/span><span style=\"color: #D4D4D4\">):<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">    <\/span><span style=\"color: #6A9955\"># tqdm\u3092\u4f7f\u308f\u306a\u3044\u5834\u5408\u306f\u5358\u306bprogress\u5024\u3092\u8868\u793a<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">    <\/span><span style=\"color: #6A9955\"># print(f&quot;Progress: {progress}%&quot;)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">    <\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">    <\/span><span style=\"color: #6A9955\"># tqdm\u3092\u4f7f\u3046\u5834\u5408<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">    <\/span><span style=\"color: #C586C0\">if<\/span><span style=\"color: #D4D4D4\"> (pbar <\/span><span style=\"color: #569CD6\">is<\/span><span style=\"color: #D4D4D4\"> <\/span><span style=\"color: #569CD6\">None<\/span><span style=\"color: #D4D4D4\">):<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">      pbar = tqdm()<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">    pbar.update(progress - pbar.n)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">    <\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u5909\u6570model\u306finit_jit_model\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u5909\u6570wav\u306fread_audio\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">speech_timestamps = get_speech_timestamps(  wav, model,<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">                                            <\/span><span style=\"color: #9CDCFE\">sampling_rate<\/span><span style=\"color: #D4D4D4\">=SAMPLING_RATE,<\/span><\/span>\n<span class=\"line\"><span 
style=\"color: #D4D4D4\">                                            <\/span><span style=\"color: #9CDCFE\">progress_tracking_callback<\/span><span style=\"color: #D4D4D4\">=my_progress_update)<\/span><\/span><\/code><\/pre><\/div>\n\n\n\n<p class=\"wp-block-paragraph\">get_speech_timestamps\u30e1\u30bd\u30c3\u30c9\u306eprogress_tracking_callback\u306b\u95a2\u6570\u3092\u5165\u308c\u308b\u3068\u30b3\u30fc\u30eb\u30d0\u30c3\u30af\u3057\u3066\u304f\u308c\u308b\u306e\u3067\u9032\u6357\u7387\u3092\u53d6\u5f97\u51fa\u6765\u307e\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">\u3000<\/p>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"%E6%A4%9C%E5%87%BA%E5%8C%BA%E9%96%93%E3%81%AE%E4%BF%9D%E5%AD%98\"><\/span>\u691c\u51fa\u533a\u9593\u306e\u4fdd\u5b58<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<p class=\"wp-block-paragraph\">\u4fdd\u5b58\u6642\u306f\u30bf\u30a4\u30e0\u30b9\u30bf\u30f3\u30d7\u3092\u79d2\u6570\u3067\u306f\u306a\u304f\u30b5\u30f3\u30d7\u30eb\u3067\u53d6\u5f97(return_seconds=True\u3092\u6d88\u3059)<\/p>\n\n\n\n<div class=\"wp-block-kevinbatdorf-code-block-pro\" data-code-block-pro-font-family=\"Code-Pro-JetBrains-Mono\" style=\"font-size:.875rem;font-family:Code-Pro-JetBrains-Mono,ui-monospace,SFMono-Regular,Menlo,Monaco,Consolas,monospace;line-height:1.25rem;--cbp-tab-width:2;tab-size:var(--cbp-tab-width, 2)\"><span style=\"display:block;padding:16px 0 0 16px;margin-bottom:-1px;width:100%;text-align:left;background-color:#1E1E1E\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"54\" height=\"14\" viewBox=\"0 0 54 14\"><g fill=\"none\" fill-rule=\"evenodd\" transform=\"translate(1 1)\"><circle cx=\"6\" cy=\"6\" r=\"6\" fill=\"#FF5F56\" stroke=\"#E0443E\" stroke-width=\".5\"><\/circle><circle cx=\"26\" cy=\"6\" r=\"6\" fill=\"#FFBD2E\" stroke=\"#DEA123\" stroke-width=\".5\"><\/circle><circle cx=\"46\" cy=\"6\" r=\"6\" fill=\"#27C93F\" stroke=\"#1AAB29\" stroke-width=\".5\"><\/circle><\/g><\/svg><\/span><span 
role=\"button\" tabindex=\"0\" data-code=\"import torch\ntorch.set_num_threads(1)\nfrom utils_vad import (get_speech_timestamps, collect_chunks, drop_chunks)\n\nSAMPLING_RATE = 16000\n# \u5909\u6570model\u306finit_jit_model\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b\n# \u5909\u6570wav\u306fread_audio\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b\nspeech_timestamps = get_speech_timestamps(wav, model, sampling_rate=SAMPLING_RATE)\n\n####################################\n# \u767a\u8a71\u533a\u9593\u3092\u307e\u3068\u3081\u3066\u4e00\u3064\u306e\u30d5\u30a1\u30a4\u30eb\u306b\u3059\u308b\n####################################\nsave_data = collect_chunks(speech_timestamps ,wav)\nsave_audio('save.wav', save_data)\n\n####################################\n# \u767a\u8a71\u533a\u9593\u3092\u4e00\u3064\u3065\u3064\u5225\u306e\u30d5\u30a1\u30a4\u30eb\u306b\u3059\u308b\n####################################\nfor idx, time_stamp in enumerate(speech_timestamps):\n  chunk = collect_chunks(time_stamp, wav)\n  save_audio(str(idx)+'_save.wav', chunk)\n\n####################################\n# \u767a\u8a71\u533a\u9593\u3092\u524a\u9664\u3057\u305f\u30d5\u30a1\u30a4\u30eb\u3092\uff11\u3064\u306b\u307e\u3068\u3081\u308b\n####################################\ndelete_data = drop_chunks(speech_timestamps ,wav)\nsave_audio('save.wav', delete_data)\" style=\"color:#D4D4D4;display:none\" aria-label=\"Copy\" class=\"code-block-pro-copy-button\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" style=\"width:24px;height:24px\" fill=\"none\" viewBox=\"0 0 24 24\" stroke=\"currentColor\" stroke-width=\"2\"><path class=\"with-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2m-6 9l2 2 4-4\"><\/path><path class=\"without-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 
002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2\"><\/path><\/svg><\/span><pre class=\"shiki dark-plus\" style=\"background-color: #1E1E1E\" tabindex=\"0\"><code><span class=\"line\"><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> torch<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">torch.set_num_threads(<\/span><span style=\"color: #B5CEA8\">1<\/span><span style=\"color: #D4D4D4\">)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #C586C0\">from<\/span><span style=\"color: #D4D4D4\"> utils_vad <\/span><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> (get_speech_timestamps, collect_chunks, drop_chunks)<\/span><\/span>\n<span class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">SAMPLING_RATE = <\/span><span style=\"color: #B5CEA8\">16000<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u5909\u6570model\u306finit_jit_model\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u5909\u6570wav\u306fread_audio\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">speech_timestamps = get_speech_timestamps(wav, model, <\/span><span style=\"color: #9CDCFE\">sampling_rate<\/span><span style=\"color: #D4D4D4\">=SAMPLING_RATE)<\/span><\/span>\n<span class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\">####################################<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u767a\u8a71\u533a\u9593\u3092\u307e\u3068\u3081\u3066\u4e00\u3064\u306e\u30d5\u30a1\u30a4\u30eb\u306b\u3059\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\">####################################<\/span><\/span>\n<span class=\"line\"><span style=\"color: 
#D4D4D4\">save_data = collect_chunks(speech_timestamps ,wav)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">save_audio(<\/span><span style=\"color: #CE9178\">&#39;save.wav&#39;<\/span><span style=\"color: #D4D4D4\">, save_data)<\/span><\/span>\n<span class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\">####################################<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u767a\u8a71\u533a\u9593\u3092\u4e00\u3064\u3065\u3064\u5225\u306e\u30d5\u30a1\u30a4\u30eb\u306b\u3059\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\">####################################<\/span><\/span>\n<span class=\"line\"><span style=\"color: #C586C0\">for<\/span><span style=\"color: #D4D4D4\"> idx, time_stamp <\/span><span style=\"color: #C586C0\">in<\/span><span style=\"color: #D4D4D4\"> <\/span><span style=\"color: #DCDCAA\">enumerate<\/span><span style=\"color: #D4D4D4\">(speech_timestamps):<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">  chunk = collect_chunks(time_stamp, wav)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">  save_audio(<\/span><span style=\"color: #4EC9B0\">str<\/span><span style=\"color: #D4D4D4\">(idx)+<\/span><span style=\"color: #CE9178\">&#39;_save.wav&#39;<\/span><span style=\"color: #D4D4D4\">, chunk)<\/span><\/span>\n<span class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\">####################################<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u767a\u8a71\u533a\u9593\u3092\u524a\u9664\u3057\u305f\u30d5\u30a1\u30a4\u30eb\u3092\uff11\u3064\u306b\u307e\u3068\u3081\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\">####################################<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">delete_data = drop_chunks(speech_timestamps ,wav)<\/span><\/span>\n<span class=\"line\"><span style=\"color: 
#D4D4D4\">save_audio(<\/span><span style=\"color: #CE9178\">&#39;save.wav&#39;<\/span><span style=\"color: #D4D4D4\">, delete_data)<\/span><\/span><\/code><\/pre><\/div>\n\n\n\n<p class=\"wp-block-paragraph\">\u3000<\/p>\n\n\n\n<h3 class=\"wp-block-heading\"><span class=\"ez-toc-section\" id=\"%E7%99%BA%E8%A9%B1%E5%8C%BA%E9%96%93%E3%81%AE%E5%8F%AF%E8%A6%96%E5%8C%96\"><\/span>\u767a\u8a71\u533a\u9593\u306e\u53ef\u8996\u5316<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<p class=\"wp-block-paragraph\">pandas\u3068matplotlib\u306e\u30e9\u30a4\u30d6\u30e9\u30ea\u304c\u30a4\u30f3\u30b9\u30c8\u30fc\u30eb\u3055\u308c\u3066\u3044\u308b\u5834\u5408\u3001\u767a\u8a71\u533a\u9593\u306e\u78ba\u7387\u3092\u30b0\u30e9\u30d5\u8868\u793a\u51fa\u6765\u307e\u3059\u3002<\/p>\n\n\n\n<div class=\"wp-block-kevinbatdorf-code-block-pro\" data-code-block-pro-font-family=\"Code-Pro-JetBrains-Mono\" style=\"font-size:.875rem;font-family:Code-Pro-JetBrains-Mono,ui-monospace,SFMono-Regular,Menlo,Monaco,Consolas,monospace;line-height:1.25rem;--cbp-tab-width:2;tab-size:var(--cbp-tab-width, 2)\"><span style=\"display:block;padding:16px 0 0 16px;margin-bottom:-1px;width:100%;text-align:left;background-color:#1E1E1E\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"54\" height=\"14\" viewBox=\"0 0 54 14\"><g fill=\"none\" fill-rule=\"evenodd\" transform=\"translate(1 1)\"><circle cx=\"6\" cy=\"6\" r=\"6\" fill=\"#FF5F56\" stroke=\"#E0443E\" stroke-width=\".5\"><\/circle><circle cx=\"26\" cy=\"6\" r=\"6\" fill=\"#FFBD2E\" stroke=\"#DEA123\" stroke-width=\".5\"><\/circle><circle cx=\"46\" cy=\"6\" r=\"6\" fill=\"#27C93F\" stroke=\"#1AAB29\" stroke-width=\".5\"><\/circle><\/g><\/svg><\/span><span role=\"button\" tabindex=\"0\" data-code=\"import torch\ntorch.set_num_threads(1)\nfrom utils_vad import (get_speech_timestamps)\nimport matplotlib.pyplot as plt\n\nSAMPLING_RATE = 16000\n# 
\u5909\u6570model\u306finit_jit_model\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b\n# \u5909\u6570wav\u306fread_audio\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b\nspeech_timestamps = get_speech_timestamps(wav, model,\n                                          sampling_rate=SAMPLING_RATE,\n                                          visualize_probs=True)\n\nplt.show()\" style=\"color:#D4D4D4;display:none\" aria-label=\"Copy\" class=\"code-block-pro-copy-button\"><svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" style=\"width:24px;height:24px\" fill=\"none\" viewBox=\"0 0 24 24\" stroke=\"currentColor\" stroke-width=\"2\"><path class=\"with-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2m-6 9l2 2 4-4\"><\/path><path class=\"without-check\" stroke-linecap=\"round\" stroke-linejoin=\"round\" d=\"M9 5H7a2 2 0 00-2 2v12a2 2 0 002 2h10a2 2 0 002-2V7a2 2 0 00-2-2h-2M9 5a2 2 0 002 2h2a2 2 0 002-2M9 5a2 2 0 012-2h2a2 2 0 012 2\"><\/path><\/svg><\/span><pre class=\"shiki dark-plus\" style=\"background-color: #1E1E1E\" tabindex=\"0\"><code><span class=\"line\"><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> torch<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">torch.set_num_threads(<\/span><span style=\"color: #B5CEA8\">1<\/span><span style=\"color: #D4D4D4\">)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #C586C0\">from<\/span><span style=\"color: #D4D4D4\"> utils_vad <\/span><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> (get_speech_timestamps)<\/span><\/span>\n<span class=\"line\"><span style=\"color: #C586C0\">import<\/span><span style=\"color: #D4D4D4\"> matplotlib.pyplot <\/span><span style=\"color: #C586C0\">as<\/span><span style=\"color: #D4D4D4\"> plt<\/span><\/span>\n<span 
class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">SAMPLING_RATE = <\/span><span style=\"color: #B5CEA8\">16000<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u5909\u6570model\u306finit_jit_model\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #6A9955\"># \u5909\u6570wav\u306fread_audio\u30e1\u30bd\u30c3\u30c9\u3067\u53d6\u5f97\u6e08\u307f\u3068\u3059\u308b<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">speech_timestamps = get_speech_timestamps(wav, model,<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">                                          <\/span><span style=\"color: #9CDCFE\">sampling_rate<\/span><span style=\"color: #D4D4D4\">=SAMPLING_RATE,<\/span><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">                                          <\/span><span style=\"color: #9CDCFE\">visualize_probs<\/span><span style=\"color: #D4D4D4\">=<\/span><span style=\"color: #569CD6\">True<\/span><span style=\"color: #D4D4D4\">)<\/span><\/span>\n<span class=\"line\"><\/span>\n<span class=\"line\"><span style=\"color: #D4D4D4\">plt.show()<\/span><\/span><\/code><\/pre><\/div>\n\n\n\n<p class=\"wp-block-paragraph\">\u30b5\u30f3\u30d7\u30eb\u30b0\u30e9\u30d5<\/p>\n\n\n\n<figure class=\"wp-block-image size-full\"><img loading=\"lazy\" decoding=\"async\" width=\"800\" height=\"408\" src=\"https:\/\/elosove.com\/wp-content\/uploads\/2024\/03\/vad-graph.png\" alt=\"\" class=\"wp-image-703\" srcset=\"https:\/\/elosove.com\/wp-content\/uploads\/2024\/03\/vad-graph.png 800w, https:\/\/elosove.com\/wp-content\/uploads\/2024\/03\/vad-graph-300x153.png 300w, https:\/\/elosove.com\/wp-content\/uploads\/2024\/03\/vad-graph-768x392.png 768w\" sizes=\"auto, (max-width: 800px) 100vw, 800px\" \/><\/figure>\n\n\n\n<p class=\"wp-block-paragraph\">\u3000<\/p>\n\n\n\n<h3 class=\"wp-block-heading\"><span 
class=\"ez-toc-section\" id=\"stream%E5%87%A6%E7%90%86\"><\/span>stream\u51e6\u7406<span class=\"ez-toc-section-end\"><\/span><\/h3>\n\n\n\n<p class=\"wp-block-paragraph\">\u516c\u5f0f\u306eStream imitation example\u306e\u6700\u521d\u306e\u30b3\u30fc\u30c9\u3001&#8221;## using VADIterator class&#8221;\u306f0.032 sec (= 512\/16000)\u6bce\u306b\u767a\u8a71\u533a\u9593\u306e\u5224\u5b9a\u3092\u3057\u3066\u3044\u304d\u307e\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\">&#8220;## just probabilities&#8221;\u306e\u30b3\u30fc\u30c9\u306f0.032 sec\u6bce\u306b\u767a\u8a71\u78ba\u7387\u3092\u8fd4\u3057\u307e\u3059\u3002<\/p>\n\n\n\n<p class=\"wp-block-paragraph\"><\/p>\n","protected":false},"excerpt":{"rendered":"<p>whisper\u3084rinna\u306a\u3069\u306e\u91cd\u3044\u97f3\u58f0\u8a8d\u8b58\u51e6\u7406\u3092\u3059\u308b\u524d\u306b\u3001\u30b5\u30a6\u30f3\u30c9\u30d5\u30a1\u30a4\u30eb\u5185\u3067\u767a\u8a71\u90e8\u5206\u306e\u307f\u3092\u629c\u304d\u53d6\u308b\u8efd\u3044\u51e6\u7406\u3092\u631f\u307f\u305f\u3044\u6642\u304c\u3042\u308a\u307e\u3059\u3002 \u8abf\u3079\u305f\u6642\u70b9\u3067\u3059\u3050\u306b\u5b9f\u88c5\u51fa\u6765\u305d\u3046\u306a\u96f0\u56f2\u6c17\u306e\u3082\u306e\u306f\u4e0b\u8a18\u306e5\u3064\u3050\u3089\u3044\u3002 \u4eca\u56de\u306f\u624b\u6301\u3061\u306e\u97f3\u58f0 
[&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":708,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[4],"tags":[27,28],"class_list":["post-701","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-tech","tag-silerovad","tag-28"],"_links":{"self":[{"href":"https:\/\/elosove.com\/index.php?rest_route=\/wp\/v2\/posts\/701","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/elosove.com\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/elosove.com\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/elosove.com\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/elosove.com\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=701"}],"version-history":[{"count":7,"href":"https:\/\/elosove.com\/index.php?rest_route=\/wp\/v2\/posts\/701\/revisions"}],"predecessor-version":[{"id":880,"href":"https:\/\/elosove.com\/index.php?rest_route=\/wp\/v2\/posts\/701\/revisions\/880"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/elosove.com\/index.php?rest_route=\/wp\/v2\/media\/708"}],"wp:attachment":[{"href":"https:\/\/elosove.com\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=701"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/elosove.com\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=701"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/elosove.com\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=701"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}