<!--
test_espnet_home / index.html
ms180's picture
Initial commit
9caf213 verified
-->
<!doctype html>
<html lang="en-US">
<head>
<meta charset="utf-8" />
<meta name="viewport" content="width=device-width,initial-scale=1" />
<meta name="generator" content="VuePress 2.0.0-rc.9" />
<style>
  /*
   * Inline background rules, declared ahead of the external stylesheet link.
   * --c-bg holds the page background color for the active color scheme.
   */
  :root { --c-bg: #fff; }

  /* Applies when <html> carries the "dark" class. */
  html.dark { --c-bg: #22272e; }

  html, body { background-color: var(--c-bg); }
</style>
<script>
  // Decide the color scheme while <head> is still being parsed:
  //   1. a choice saved under 'vuepress-color-scheme' ('dark' or 'light') wins;
  //   2. otherwise fall back to the (prefers-color-scheme: dark) media query.
  // When dark applies, the "dark" class is added to <html>.
  const userMode = (() => {
    try {
      return localStorage.getItem('vuepress-color-scheme')
    } catch (error) {
      // Accessing localStorage can throw SecurityError when storage is blocked
      // (browser privacy settings, sandboxed frames). Treat that as
      // "no saved choice" so the system preference below is still honored.
      return null
    }
  })()
  const systemDarkMode =
    window.matchMedia &&
    window.matchMedia('(prefers-color-scheme: dark)').matches
  if (userMode === 'dark' || (userMode !== 'light' && systemDarkMode)) {
    document.documentElement.classList.add('dark')
  }
</script>
<!--
  Page identity metadata. The title and description were previously a single
  space, leaving the page without a usable title or description.
  NOTE(review): this file is VuePress build output; presumably the lasting fix is
  to set `title` / `description` in the site config so rebuilds keep them. Confirm.
-->
<link rel="manifest" href="/manifest.webmanifest">
<meta name="application-name" content="Example">
<meta name="apple-mobile-web-app-title" content="Example">
<meta name="apple-mobile-web-app-status-bar-style" content="black">
<meta name="msapplication-TileColor" content="#3eaf7c">
<meta name="theme-color" content="#3eaf7c">
<title>ESPnet</title>
<meta name="description" content="ESPnet: end-to-end speech processing toolkit.">
<link rel="preload" href="/assets/style-SNWc1iKP.css" as="style"><link rel="stylesheet" href="/assets/style-SNWc1iKP.css">
<link rel="modulepreload" href="/assets/app-DTS6SjJz.js"><link rel="modulepreload" href="/assets/index.html-DGcx4T0I.js">
<link rel="prefetch" href="/assets/DataPreparation_CMU_11492_692_Spring2023(Assignment0).html-CJ8-yKXK.js" as="script"><link rel="prefetch" href="/assets/SpeechEnhancement_CMU_11492_692_Spring2023(Assignment7).html-BDY4p1H1.js" as="script"><link rel="prefetch" href="/assets/SpokenLanguageUnderstanding_CMU_11492_692_Spring2023(Assignment6).html-DDjiuGQB.js" as="script"><link rel="prefetch" href="/assets/TextToSpeech_CMU_11492_692_Spring2023(Assignment8).html-DnIftUJK.js" as="script"><link rel="prefetch" href="/assets/espnet2_new_task_tutorial_CMU_11751_18781_Fall2022.html-D9GsoT-_.js" as="script"><link rel="prefetch" href="/assets/espnet2_recipe_tutorial_CMU_11751_18781_Fall2022.html-DobzmqH0.js" as="script"><link rel="prefetch" href="/assets/espnet2_tutorial_2021_CMU_11751_18781.html-BY6Z52B4.js" as="script"><link rel="prefetch" href="/assets/asr_cli.html-BA-xBrC-.js" as="script"><link rel="prefetch" href="/assets/asr_library.html-rEQwKTMV.js" as="script"><link rel="prefetch" href="/assets/espnet2_asr_realtime_demo.html-BnK1Wovv.js" as="script"><link rel="prefetch" href="/assets/espnet2_asr_transfer_learning_demo.html-DJeSoTyY.js" as="script"><link rel="prefetch" href="/assets/espnet2_streaming_asr_demo.html-Yx-OX8AZ.js" as="script"><link rel="prefetch" href="/assets/espnet_se_demonstration_for_waspaa_2021.html--JdDNbEo.js" as="script"><link rel="prefetch" href="/assets/se_demo.html-DY-mv2y8.js" as="script"><link rel="prefetch" href="/assets/onnx_conversion_demo.html-D56NEMop.js" as="script"><link rel="prefetch" href="/assets/pretrained.html-JpE__EKJ.js" as="script"><link rel="prefetch" href="/assets/espnet2_2pass_slu_demo.html-BmvJ92Ni.js" as="script"><link rel="prefetch" href="/assets/st_demo.html-WLzB4ZGO.js" as="script"><link rel="prefetch" href="/assets/espnet2_tts_realtime_demo.html-BdxLBr1c.js" as="script"><link rel="prefetch" href="/assets/tts_cli.html-BfB21gs4.js" as="script"><link rel="prefetch" href="/assets/tts_realtime_demo.html-BKOGq7as.js" 
as="script"><link rel="prefetch" href="/assets/finetune_owsm.html-ICOQYZj2.js" as="script"><link rel="prefetch" href="/assets/finetune_with_lora.html-3NfoQDOl.js" as="script"><link rel="prefetch" href="/assets/train.html-BQ-t2Cs4.js" as="script"><link rel="prefetch" href="/assets/tacotron2.html-Ds1AKES7.js" as="script"><link rel="prefetch" href="/assets/404.html-DN7291h8.js" as="script"><link rel="prefetch" href="/assets/NpmBadge-rh9tvaXX.js" as="script">
</head>
<body>
<div id="app"><!--[--><div class="theme-container no-sidebar"><!--[--><header class="navbar"><div class="toggle-sidebar-button" title="toggle sidebar" aria-expanded="false" role="button" tabindex="0"><div class="icon" aria-hidden="true"><span></span><span></span><span></span></div></div><span><a class="route-link" href="/"><img class="logo" src="/images/espnet_logo1.png" alt=" "><span class="site-name can-hide" aria-hidden="true"> </span></a></span><div class="navbar-items-wrapper" style=""><!--[--><!--]--><nav class="navbar-items can-hide" aria-label="site navigation"><!--[--><div class="navbar-item"><a class="external-link" href="https://github.com/espnet/espnet" rel="noopener noreferrer" target="_blank" aria-label="Github"><!--[--><!--[--><!--]--> Github <span><svg class="external-link-icon" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false" x="0px" y="0px" viewBox="0 0 100 100" width="15" height="15"><path fill="currentColor" d="M18.8,85.1h56l0,0c2.2,0,4-1.8,4-4v-32h-8v28h-48v-48h28v-8h-32l0,0c-2.2,0-4,1.8-4,4v56C14.8,83.3,16.6,85.1,18.8,85.1z"></path><polygon fill="currentColor" points="45.7,48.7 51.3,54.3 77.2,28.5 77.2,37.2 85.2,37.2 85.2,14.9 62.8,14.9 62.8,22.9 71.5,22.9"></polygon></svg><span class="external-link-icon-sr-only">open in new window</span></span><!--[--><!--]--><!--]--></a></div><div class="navbar-item"><a class="external-link" href="https://huggingface.co/espnet" rel="noopener noreferrer" target="_blank" aria-label="HuggingFace"><!--[--><!--[--><!--]--> HuggingFace <span><svg class="external-link-icon" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false" x="0px" y="0px" viewBox="0 0 100 100" width="15" height="15"><path fill="currentColor" d="M18.8,85.1h56l0,0c2.2,0,4-1.8,4-4v-32h-8v28h-48v-48h28v-8h-32l0,0c-2.2,0-4,1.8-4,4v56C14.8,83.3,16.6,85.1,18.8,85.1z"></path><polygon fill="currentColor" points="45.7,48.7 51.3,54.3 77.2,28.5 77.2,37.2 85.2,37.2 85.2,14.9 62.8,14.9 62.8,22.9 
71.5,22.9"></polygon></svg><span class="external-link-icon-sr-only">open in new window</span></span><!--[--><!--]--><!--]--></a></div><div class="navbar-item"><a class="external-link" href="https://espnet.github.io/espnet" rel="noopener noreferrer" target="_blank" aria-label="Docs"><!--[--><!--[--><!--]--> Docs <span><svg class="external-link-icon" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false" x="0px" y="0px" viewBox="0 0 100 100" width="15" height="15"><path fill="currentColor" d="M18.8,85.1h56l0,0c2.2,0,4-1.8,4-4v-32h-8v28h-48v-48h28v-8h-32l0,0c-2.2,0-4,1.8-4,4v56C14.8,83.3,16.6,85.1,18.8,85.1z"></path><polygon fill="currentColor" points="45.7,48.7 51.3,54.3 77.2,28.5 77.2,37.2 85.2,37.2 85.2,14.9 62.8,14.9 62.8,22.9 71.5,22.9"></polygon></svg><span class="external-link-icon-sr-only">open in new window</span></span><!--[--><!--]--><!--]--></a></div><div class="navbar-item"><div class="navbar-dropdown-wrapper"><button class="navbar-dropdown-title" type="button" aria-label="espnet2"><span class="title">espnet2</span><span class="arrow down"></span></button><button class="navbar-dropdown-title-mobile" type="button" aria-label="espnet2"><span class="title">espnet2</span><span class="right arrow"></span></button><ul style="display:none;" class="navbar-dropdown"><!--[--><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>TTS</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/tts/tts_cli.html" aria-label="Text-to-Speech (Recipe)"><!--[--><!--[--><!--]--> Text-to-Speech (Recipe) <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/tts/tts_realtime_demo.html" aria-label="ESPnet real time E2E-TTS demonstration"><!--[--><!--[--><!--]--> ESPnet real time E2E-TTS demonstration <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" 
href="/espnet2/tts/espnet2_tts_realtime_demo.html" aria-label="ESPnet2-TTS realtime demonstration"><!--[--><!--[--><!--]--> ESPnet2-TTS realtime demonstration <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>SE</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/se/se_demo.html" aria-label="ESPnet Speech Enhancement Demonstration"><!--[--><!--[--><!--]--> ESPnet Speech Enhancement Demonstration <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/se/espnet_se_demonstration_for_waspaa_2021.html" aria-label="ESPnet Speech Enhancement Demonstration"><!--[--><!--[--><!--]--> ESPnet Speech Enhancement Demonstration <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>SLU</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/slu/espnet2_2pass_slu_demo.html" aria-label="ESPNET 2 pass SLU Demonstration"><!--[--><!--[--><!--]--> ESPNET 2 pass SLU Demonstration <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>ASR</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/asr/asr_cli.html" aria-label="Speech Recognition (Recipe)"><!--[--><!--[--><!--]--> Speech Recognition (Recipe) <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/asr/espnet2_asr_realtime_demo.html" aria-label="ESPnet2-ASR realtime demonstration"><!--[--><!--[--><!--]--> ESPnet2-ASR realtime demonstration <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a 
class="route-link" href="/espnet2/asr/asr_library.html" aria-label="Speech Recognition (Library)"><!--[--><!--[--><!--]--> Speech Recognition (Library) <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/asr/espnet2_asr_transfer_learning_demo.html" aria-label="Use transfer learning for ASR in ESPnet2"><!--[--><!--[--><!--]--> Use transfer learning for ASR in ESPnet2 <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/asr/espnet2_streaming_asr_demo.html" aria-label="ESPnet2 real streaming Transformer demonstration"><!--[--><!--[--><!--]--> ESPnet2 real streaming Transformer demonstration <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>OTHERS</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/others/onnx_conversion_demo.html" aria-label="espnet_onnx demonstration"><!--[--><!--[--><!--]--> espnet_onnx demonstration <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/others/pretrained.html" aria-label="Pretrained Model"><!--[--><!--[--><!--]--> Pretrained Model <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>ST</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/st/st_demo.html" aria-label="ESPnet Speech Translation Demonstration"><!--[--><!--[--><!--]--> ESPnet Speech Translation Demonstration <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><!--]--></ul></div></div><div class="navbar-item"><div class="navbar-dropdown-wrapper"><button class="navbar-dropdown-title" type="button" aria-label="espnetez"><span class="title">espnetez</span><span 
class="arrow down"></span></button><button class="navbar-dropdown-title-mobile" type="button" aria-label="espnetez"><span class="title">espnetez</span><span class="right arrow"></span></button><ul style="display:none;" class="navbar-dropdown"><!--[--><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>TTS</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnetez/tts/tacotron2.html" aria-label="TTS demo for ESPnet-Easy!"><!--[--><!--[--><!--]--> TTS demo for ESPnet-Easy! <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>ASR</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnetez/asr/finetune_with_lora.html" aria-label="Finetune Model with ESPnet-Easy"><!--[--><!--[--><!--]--> Finetune Model with ESPnet-Easy <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnetez/asr/train.html" aria-label="Sample demo for ESPnet-Easy!"><!--[--><!--[--><!--]--> Sample demo for ESPnet-Easy! 
<!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnetez/asr/finetune_owsm.html" aria-label="OWSM finetuning with custom dataset"><!--[--><!--[--><!--]--> OWSM finetuning with custom dataset <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><!--]--></ul></div></div><div class="navbar-item"><div class="navbar-dropdown-wrapper"><button class="navbar-dropdown-title" type="button" aria-label="tutorials"><span class="title">tutorials</span><span class="arrow down"></span></button><button class="navbar-dropdown-title-mobile" type="button" aria-label="tutorials"><span class="title">tutorials</span><span class="right arrow"></span></button><ul style="display:none;" class="navbar-dropdown"><!--[--><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/espnet2_tutorial_2021_CMU_11751_18781.html" aria-label="CMU 11751/18781 2021: ESPnet Tutorial"><!--[--><!--[--><!--]--> CMU 11751/18781 2021: ESPnet Tutorial <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/SpokenLanguageUnderstanding_CMU_11492_692_Spring2023(Assignment6).html" aria-label="CMU 11492/11692 Spring 2023: Spoken Language Understanding"><!--[--><!--[--><!--]--> CMU 11492/11692 Spring 2023: Spoken Language Understanding <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/SpeechEnhancement_CMU_11492_692_Spring2023(Assignment7).html" aria-label="CMU 11492/11692 Spring 2023: Speech Enhancement"><!--[--><!--[--><!--]--> CMU 11492/11692 Spring 2023: Speech Enhancement <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/DataPreparation_CMU_11492_692_Spring2023(Assignment0).html" aria-label="CMU 11492/11692 Spring 2023: Data preparation"><!--[--><!--[--><!--]--> CMU 11492/11692 Spring 2023: Data preparation <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a 
class="route-link" href="/tutorials/espnet2_new_task_tutorial_CMU_11751_18781_Fall2022.html" aria-label="CMU 11751/18781 Fall 2022: ESPnet Tutorial2 (New task)"><!--[--><!--[--><!--]--> CMU 11751/18781 Fall 2022: ESPnet Tutorial2 (New task) <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/espnet2_recipe_tutorial_CMU_11751_18781_Fall2022.html" aria-label="CMU 11751/18781 Fall 2022: ESPnet Tutorial"><!--[--><!--[--><!--]--> CMU 11751/18781 Fall 2022: ESPnet Tutorial <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/TextToSpeech_CMU_11492_692_Spring2023(Assignment8).html" aria-label="CMU 11492/11692 Spring 2023: Text to Speech"><!--[--><!--[--><!--]--> CMU 11492/11692 Spring 2023: Text to Speech <!--[--><!--]--><!--]--></a></li><!--]--></ul></div></div><!--]--></nav><!--[--><!--]--><button class="toggle-color-mode-button" title="toggle color mode"><svg style="" class="icon" focusable="false" viewBox="0 0 32 32"><path d="M16 12.005a4 4 0 1 1-4 4a4.005 4.005 0 0 1 4-4m0-2a6 6 0 1 0 6 6a6 6 0 0 0-6-6z" fill="currentColor"></path><path d="M5.394 6.813l1.414-1.415l3.506 3.506L8.9 10.318z" fill="currentColor"></path><path d="M2 15.005h5v2H2z" fill="currentColor"></path><path d="M5.394 25.197L8.9 21.691l1.414 1.415l-3.506 3.505z" fill="currentColor"></path><path d="M15 25.005h2v5h-2z" fill="currentColor"></path><path d="M21.687 23.106l1.414-1.415l3.506 3.506l-1.414 1.414z" fill="currentColor"></path><path d="M25 15.005h5v2h-5z" fill="currentColor"></path><path d="M21.687 8.904l3.506-3.506l1.414 1.415l-3.506 3.505z" fill="currentColor"></path><path d="M15 2.005h2v5h-2z" fill="currentColor"></path></svg><svg style="display:none;" class="icon" focusable="false" viewBox="0 0 32 32"><path d="M13.502 5.414a15.075 15.075 0 0 0 11.594 18.194a11.113 11.113 0 0 1-7.975 3.39c-.138 0-.278.005-.418 0a11.094 11.094 0 0 1-3.2-21.584M14.98 3a1.002 1.002 0 0 0-.175.016a13.096 13.096 
0 0 0 1.825 25.981c.164.006.328 0 .49 0a13.072 13.072 0 0 0 10.703-5.555a1.01 1.01 0 0 0-.783-1.565A13.08 13.08 0 0 1 15.89 4.38A1.015 1.015 0 0 0 14.98 3z" fill="currentColor"></path></svg></button><form class="search-box" role="search"><input type="search" placeholder="Search" autocomplete="off" spellcheck="false" value><!----></form></div></header><!--]--><div class="sidebar-mask"></div><!--[--><aside class="sidebar"><nav class="navbar-items" aria-label="site navigation"><!--[--><div class="navbar-item"><a class="external-link" href="https://github.com/espnet/espnet" rel="noopener noreferrer" target="_blank" aria-label="Github"><!--[--><!--[--><!--]--> Github <span><svg class="external-link-icon" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false" x="0px" y="0px" viewBox="0 0 100 100" width="15" height="15"><path fill="currentColor" d="M18.8,85.1h56l0,0c2.2,0,4-1.8,4-4v-32h-8v28h-48v-48h28v-8h-32l0,0c-2.2,0-4,1.8-4,4v56C14.8,83.3,16.6,85.1,18.8,85.1z"></path><polygon fill="currentColor" points="45.7,48.7 51.3,54.3 77.2,28.5 77.2,37.2 85.2,37.2 85.2,14.9 62.8,14.9 62.8,22.9 71.5,22.9"></polygon></svg><span class="external-link-icon-sr-only">open in new window</span></span><!--[--><!--]--><!--]--></a></div><div class="navbar-item"><a class="external-link" href="https://huggingface.co/espnet" rel="noopener noreferrer" target="_blank" aria-label="HuggingFace"><!--[--><!--[--><!--]--> HuggingFace <span><svg class="external-link-icon" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false" x="0px" y="0px" viewBox="0 0 100 100" width="15" height="15"><path fill="currentColor" d="M18.8,85.1h56l0,0c2.2,0,4-1.8,4-4v-32h-8v28h-48v-48h28v-8h-32l0,0c-2.2,0-4,1.8-4,4v56C14.8,83.3,16.6,85.1,18.8,85.1z"></path><polygon fill="currentColor" points="45.7,48.7 51.3,54.3 77.2,28.5 77.2,37.2 85.2,37.2 85.2,14.9 62.8,14.9 62.8,22.9 71.5,22.9"></polygon></svg><span class="external-link-icon-sr-only">open in new 
window</span></span><!--[--><!--]--><!--]--></a></div><div class="navbar-item"><a class="external-link" href="https://espnet.github.io/espnet" rel="noopener noreferrer" target="_blank" aria-label="Docs"><!--[--><!--[--><!--]--> Docs <span><svg class="external-link-icon" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false" x="0px" y="0px" viewBox="0 0 100 100" width="15" height="15"><path fill="currentColor" d="M18.8,85.1h56l0,0c2.2,0,4-1.8,4-4v-32h-8v28h-48v-48h28v-8h-32l0,0c-2.2,0-4,1.8-4,4v56C14.8,83.3,16.6,85.1,18.8,85.1z"></path><polygon fill="currentColor" points="45.7,48.7 51.3,54.3 77.2,28.5 77.2,37.2 85.2,37.2 85.2,14.9 62.8,14.9 62.8,22.9 71.5,22.9"></polygon></svg><span class="external-link-icon-sr-only">open in new window</span></span><!--[--><!--]--><!--]--></a></div><div class="navbar-item"><div class="navbar-dropdown-wrapper"><button class="navbar-dropdown-title" type="button" aria-label="espnet2"><span class="title">espnet2</span><span class="arrow down"></span></button><button class="navbar-dropdown-title-mobile" type="button" aria-label="espnet2"><span class="title">espnet2</span><span class="right arrow"></span></button><ul style="display:none;" class="navbar-dropdown"><!--[--><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>TTS</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/tts/tts_cli.html" aria-label="Text-to-Speech (Recipe)"><!--[--><!--[--><!--]--> Text-to-Speech (Recipe) <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/tts/tts_realtime_demo.html" aria-label="ESPnet real time E2E-TTS demonstration"><!--[--><!--[--><!--]--> ESPnet real time E2E-TTS demonstration <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/tts/espnet2_tts_realtime_demo.html" aria-label="ESPnet2-TTS realtime 
demonstration"><!--[--><!--[--><!--]--> ESPnet2-TTS realtime demonstration <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>SE</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/se/se_demo.html" aria-label="ESPnet Speech Enhancement Demonstration"><!--[--><!--[--><!--]--> ESPnet Speech Enhancement Demonstration <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/se/espnet_se_demonstration_for_waspaa_2021.html" aria-label="ESPnet Speech Enhancement Demonstration"><!--[--><!--[--><!--]--> ESPnet Speech Enhancement Demonstration <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>SLU</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/slu/espnet2_2pass_slu_demo.html" aria-label="ESPNET 2 pass SLU Demonstration"><!--[--><!--[--><!--]--> ESPNET 2 pass SLU Demonstration <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>ASR</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/asr/asr_cli.html" aria-label="Speech Recognition (Recipe)"><!--[--><!--[--><!--]--> Speech Recognition (Recipe) <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/asr/espnet2_asr_realtime_demo.html" aria-label="ESPnet2-ASR realtime demonstration"><!--[--><!--[--><!--]--> ESPnet2-ASR realtime demonstration <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/asr/asr_library.html" aria-label="Speech Recognition 
(Library)"><!--[--><!--[--><!--]--> Speech Recognition (Library) <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/asr/espnet2_asr_transfer_learning_demo.html" aria-label="Use transfer learning for ASR in ESPnet2"><!--[--><!--[--><!--]--> Use transfer learning for ASR in ESPnet2 <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/asr/espnet2_streaming_asr_demo.html" aria-label="ESPnet2 real streaming Transformer demonstration"><!--[--><!--[--><!--]--> ESPnet2 real streaming Transformer demonstration <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>OTHERS</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/others/onnx_conversion_demo.html" aria-label="espnet_onnx demonstration"><!--[--><!--[--><!--]--> espnet_onnx demonstration <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/others/pretrained.html" aria-label="Pretrained Model"><!--[--><!--[--><!--]--> Pretrained Model <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>ST</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnet2/st/st_demo.html" aria-label="ESPnet Speech Translation Demonstration"><!--[--><!--[--><!--]--> ESPnet Speech Translation Demonstration <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><!--]--></ul></div></div><div class="navbar-item"><div class="navbar-dropdown-wrapper"><button class="navbar-dropdown-title" type="button" aria-label="espnetez"><span class="title">espnetez</span><span class="arrow down"></span></button><button class="navbar-dropdown-title-mobile" type="button" 
aria-label="espnetez"><span class="title">espnetez</span><span class="right arrow"></span></button><ul style="display:none;" class="navbar-dropdown"><!--[--><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>TTS</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnetez/tts/tacotron2.html" aria-label="TTS demo for ESPnet-Easy!"><!--[--><!--[--><!--]--> TTS demo for ESPnet-Easy! <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><li class="navbar-dropdown-item"><!--[--><h4 class="navbar-dropdown-subtitle"><span>ASR</span></h4><ul class="navbar-dropdown-subitem-wrapper"><!--[--><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnetez/asr/finetune_with_lora.html" aria-label="Finetune Model with ESPnet-Easy"><!--[--><!--[--><!--]--> Finetune Model with ESPnet-Easy <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnetez/asr/train.html" aria-label="Sample demo for ESPnet-Easy!"><!--[--><!--[--><!--]--> Sample demo for ESPnet-Easy! 
<!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-subitem"><a class="route-link" href="/espnetez/asr/finetune_owsm.html" aria-label="OWSM finetuning with custom dataset"><!--[--><!--[--><!--]--> OWSM finetuning with custom dataset <!--[--><!--]--><!--]--></a></li><!--]--></ul><!--]--></li><!--]--></ul></div></div><div class="navbar-item"><div class="navbar-dropdown-wrapper"><button class="navbar-dropdown-title" type="button" aria-label="tutorials"><span class="title">tutorials</span><span class="arrow down"></span></button><button class="navbar-dropdown-title-mobile" type="button" aria-label="tutorials"><span class="title">tutorials</span><span class="right arrow"></span></button><ul style="display:none;" class="navbar-dropdown"><!--[--><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/espnet2_tutorial_2021_CMU_11751_18781.html" aria-label="CMU 11751/18781 2021: ESPnet Tutorial"><!--[--><!--[--><!--]--> CMU 11751/18781 2021: ESPnet Tutorial <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/SpokenLanguageUnderstanding_CMU_11492_692_Spring2023(Assignment6).html" aria-label="CMU 11492/11692 Spring 2023: Spoken Language Understanding"><!--[--><!--[--><!--]--> CMU 11492/11692 Spring 2023: Spoken Language Understanding <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/SpeechEnhancement_CMU_11492_692_Spring2023(Assignment7).html" aria-label="CMU 11492/11692 Spring 2023: Speech Enhancement"><!--[--><!--[--><!--]--> CMU 11492/11692 Spring 2023: Speech Enhancement <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/DataPreparation_CMU_11492_692_Spring2023(Assignment0).html" aria-label="CMU 11492/11692 Spring 2023: Data preparation"><!--[--><!--[--><!--]--> CMU 11492/11692 Spring 2023: Data preparation <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a 
class="route-link" href="/tutorials/espnet2_new_task_tutorial_CMU_11751_18781_Fall2022.html" aria-label="CMU 11751/18781 Fall 2022: ESPnet Tutorial2 (New task)"><!--[--><!--[--><!--]--> CMU 11751/18781 Fall 2022: ESPnet Tutorial2 (New task) <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/espnet2_recipe_tutorial_CMU_11751_18781_Fall2022.html" aria-label="CMU 11751/18781 Fall 2022: ESPnet Tutorial"><!--[--><!--[--><!--]--> CMU 11751/18781 Fall 2022: ESPnet Tutorial <!--[--><!--]--><!--]--></a></li><li class="navbar-dropdown-item"><a class="route-link" href="/tutorials/TextToSpeech_CMU_11492_692_Spring2023(Assignment8).html" aria-label="CMU 11492/11692 Spring 2023: Text to Speech"><!--[--><!--[--><!--]--> CMU 11492/11692 Spring 2023: Text to Speech <!--[--><!--]--><!--]--></a></li><!--]--></ul></div></div><!--]--></nav><!--[--><!--]--><!----><!--[--><!--]--></aside><!--]--><!--[--><main class="home"><header class="hero"><!----><h1 id="main-title"> </h1><p class="description"> </p><!----></header><!----><div class="theme-default-content"><div><p style="text-align:center;"><a href="https://vuepress.vuejs.org/" target="_blank" rel="noopener noreferrer"><img width="600" src="/images/espnet_logo1.png" alt="logo"></a></p><h3 id="install" tabindex="-1"><a class="header-anchor" href="#install"><span>Install</span></a></h3><p>If you intend to do full experiments, including DNN training, then see Installation.</p><p>If you just need the Python module only:</p><div class="language-bash line-numbers-mode" data-ext="sh" data-title="sh"><pre class="shiki dark-plus" style="background-color:#1E1E1E;color:#D4D4D4;" tabindex="0"><code><span class="line"><span style="color:#6A9955;"># We recommend you install PyTorch before installing espnet following https://pytorch.org/get-started/locally/</span></span>
<span class="line"><span style="color:#DCDCAA;">pip</span><span style="color:#CE9178;"> install</span><span style="color:#CE9178;"> espnet</span></span>
<span class="line"><span style="color:#6A9955;"># To install the latest</span></span>
<span class="line"><span style="color:#6A9955;"># pip install git+https://github.com/espnet/espnet</span></span>
<span class="line"><span style="color:#6A9955;"># To install additional packages</span></span>
<span class="line"><span style="color:#6A9955;"># pip install &quot;espnet[all]&quot;</span></span>
<span class="line"></span></code></pre><div class="line-numbers" aria-hidden="true"><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div><div class="line-number"></div></div></div><h3 id="citation" tabindex="-1"><a class="header-anchor" href="#citation"><span>Citation</span></a></h3><p>You can find the citation <a href="https://github.com/espnet/espnet?tab=readme-ov-file#citations" target="_blank" rel="noopener noreferrer">here<span><svg class="external-link-icon" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false" x="0px" y="0px" viewBox="0 0 100 100" width="15" height="15"><path fill="currentColor" d="M18.8,85.1h56l0,0c2.2,0,4-1.8,4-4v-32h-8v28h-48v-48h28v-8h-32l0,0c-2.2,0-4,1.8-4,4v56C14.8,83.3,16.6,85.1,18.8,85.1z"></path><polygon fill="currentColor" points="45.7,48.7 51.3,54.3 77.2,28.5 77.2,37.2 85.2,37.2 85.2,14.9 62.8,14.9 62.8,22.9 71.5,22.9"></polygon></svg><span class="external-link-icon-sr-only">open in new window</span></span></a></p></div></div><!--[--><div class="footer">MIT Licensed | Copyright © 2024-present ESPnet Community</div><!--]--></main><!--]--></div><!--[--><!----><!--]--><!--]--></div>
<!-- Application entry point. Module scripts are deferred by default, so no defer attribute is needed. -->
<script type="module" src="/assets/app-DTS6SjJz.js"></script>
</body>
</html>