@@ -205,7 +205,7 @@ <h1 class="title is-1 publication-title">Fun-ASR: End-to-End Speech Recognition
205205
206206 < div class ="column has-text-centered ">
207207 < div class ="publication-links ">
208- <!-- GitHub Repository -->
208+ <!-- GitHub Repository -->
209209 < span class ="link-block ">
210210 < a href ="https://github.com/FunAudioLLM/Fun-ASR " target ="_blank "
211211 class ="external-link button is-normal is-rounded is-dark ">
@@ -269,54 +269,80 @@ <h2 class="title is-3">Abstract</h2>
269269<!-- Image carousel -->
270270< section class ="hero is-small ">
271271 < div class ="hero-body ">
272- <!-- <div class="container" style="max-width: 50%;"> -->
273- < div class ="container ">
272+ < div class ="container ">
274273 < div class ="columns is-centered ">
275- < div class ="column is-10 ">
276- < div id ="results-carousel " class ="carousel results-carousel ">
277- < div class ="item ">
278- <!-- TODO: Replace with your research result images -->
279- < img src ="static/images/FunAudio_img.png " alt ="Architecture " loading ="lazy " style ="width:100% "/>
280- <!-- Fun-ASR整体架构图 -->
281- < h2 class ="subtitle has-text-centered ">
282- Fun-ASR Architecture Overview
283- </ h2 >
284- </ div >
285- < div class ="item ">
286- < img src ="static/images/compare.png " alt ="comparer " loading ="lazy " style ="width:100% "/> />
287- <!-- Fun-ASR整体架构图 -->
288- < h2 class ="subtitle has-text-centered ">
289- Fun-ASR Performance Comparison with Other Models
290- </ h2 >
291- </ div >
292- < div class ="item ">
293- <!-- Your image here -->
294- < img src ="static/images/encoder-pretrain.png " alt ="encoder-pretrain " loading ="lazy " style ="width:70% "/> />
295- < h2 class ="subtitle has-text-centered ">
296- Pre-training Pipeline for Audio Encoder
297- </ h2 >
274+ < div class ="column is-10 ">
275+ < div id ="architecture-carousel " class ="carousel results-carousel ">
276+ < div class ="item ">
277+ <!-- Slide 1: architecture overview figure -->
278+ < img src ="static/images/FunAudio_img.png " alt ="Architecture " loading ="lazy " style ="width:100% "/>
279+ < h2 class ="subtitle has-text-centered ">
280+ Fun-ASR Architecture Overview
281+ </ h2 >
282+ </ div >
283+ < div class ="item ">
284+ <!-- Slide 2: audio encoder pre-training pipeline figure (rendered at 70% width) -->
285+ < img src ="static/images/encoder-pretrain.png " alt ="encoder-pretrain " loading ="lazy " style ="width:70% "/>
286+ < h2 class ="subtitle has-text-centered ">
287+ Pre-training Pipeline for Audio Encoder
288+ </ h2 >
289+ </ div >
290+ < div class ="item ">
291+ <!-- Slide 3: FunRL framework figure -->
292+ < img src ="static/images/rl_framework.png " alt ="rl_framework " loading ="lazy " style ="width:100% "/>
293+ < h2 class ="subtitle has-text-centered ">
294+ The FunRL Framework
295+ </ h2 >
296+ </ div >
297+ < div class ="item ">
298+ <!-- Slide 4: time consumption figure (fixed 800px height, full width) -->
299+ < img src ="static/images/rl_time.png " alt ="rl_time " loading ="lazy " style ="height:800px; width:100% "/>
300+ < h2 class ="subtitle has-text-centered ">
301+ Time Consumption Analysis
302+ </ h2 >
303+ </ div >
304+ </ div >
298305 </ div >
299- < div class ="item ">
300- <!-- Your image here -->
301- < img src ="static/images/rl_framework.png " alt ="rl_framework " loading ="lazy " style ="width:100% "/> />
302- < h2 class ="subtitle has-text-centered ">
303- The FunRL Framework
304- </ h2 >
305- </ div >
306- < div class ="item ">
307- <!-- Your image here -->
308- < img src ="static/images/rl_time.png " alt ="rl_time " loading ="lazy " style ="height:800px; width:100% "/> />
309- < h2 class ="subtitle has-text-centered ">
310- Time Consumption Analysis
311- </ h2 >
312- </ div >
306+ </ div >
313307 </ div >
308+ </ section >
309+
310+
311+ < section class ="hero is-small ">
312+ < div class ="hero-body ">
313+ < div class ="container ">
314+ < div class ="columns is-centered ">
315+ < div class ="column is-10 ">
316+ < div id ="comparison-carousel " class ="carousel results-carousel ">
317+ < div class ="item ">
318+ <!-- Slide 1: performance comparison figure; this carousel has its own id, distinct from the architecture carousel -->
319+ < img src ="static/images/compare.png " alt ="compare " loading ="lazy " style ="width:100% "/>
320+ < h2 class ="subtitle has-text-centered ">
321+ Performance Comparison in Different Scenarios
322+ </ h2 >
323+ </ div >
324+ < div class ="item ">
325+ <!-- Slide 2: continuation of the comparison. NOTE(review): reuses compare.png from slide 1; confirm the intended image file -->
326+ < img src ="static/images/compare.png " alt ="compare_1 " loading ="lazy " style ="height:800px; width:100% "/>
327+ < h2 class ="subtitle has-text-centered ">
328+ Performance Comparison in Different Scenarios (Contd.)
329+ </ h2 >
330+ </ div >
331+ </ div >
332+ </ div >
333+ </ div >
314334 </ div >
315- </ div >
316- </ div >
317- </ div >
318335</ section >
319- <!-- End image carousel -->
336+
337+
338+
339+
340+
341+
342+
343+
344+
345+
320346
321347< section class ="section ">
322348 < div class ="container is-max-desktop ">
@@ -1517,6 +1543,7 @@ <h4 class="table-title">Multilingual ASR Performance (WER/CER %)</h4>
15171543
15181544
15191545
1546+
15201547
15211548
15221549<!--BibTex citation -->
0 commit comments