<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:atom="http://www.w3.org/2005/Atom" xmlns:media="http://search.yahoo.com/mrss/" xmlns:feedpress="https://feed.press/xmlns" xmlns:podcast="https://podcastindex.org/namespace/1.0" version="2.0">
  <channel>
    <feedpress:locale>en</feedpress:locale>
    <atom:link rel="hub" href="https://feedpress.superfeedr.com/"/>
    <atom:link href="https://feedpress.me/wx-yyzt" rel="self" type="application/rss+xml"/>
    <atom:icon>https://localhost:3000/favicon.ico</atom:icon>
    <title>语音杂谈</title>
    <description>公众号“语音杂谈”更新 - 使用 Huginn 制作</description>
    <link>https://localhost:3000</link>
    <lastBuildDate>Sun, 03 May 2026 20:19:39 -0700</lastBuildDate>
    <pubDate>Sun, 03 May 2026 20:19:39 -0700</pubDate>
    <ttl>60</ttl>
    <item>
      <title>MeanAudio：单步生成！100 倍加速！首个 MeanFlow 文本转音频模型重磅开源</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzI4OTQyNzA0Ng%3D%3D&amp;mid=2247544976&amp;idx=2&amp;sn=9be632d0d04c1d2747e4e5e8bce5dbaf</link>
      <pubDate>Mon, 13 Apr 2026 03:00:45 -0700</pubDate>
      <guid isPermaLink="false">633087</guid>
    </item>
    <item>
      <title>语音/音频处理学术速递[4.13]</title>
      <description><![CDATA[cs.SD语音14篇，eess.AS音频处理8篇]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzI4OTQyNzA0Ng%3D%3D&amp;mid=2247544976&amp;idx=3&amp;sn=aadf8a8d0daa937374abf382f95ac949</link>
      <pubDate>Mon, 13 Apr 2026 03:00:45 -0700</pubDate>
      <guid isPermaLink="false">633086</guid>
    </item>
    <item>
      <title>【征稿启事】第十五届中文口语语言处理国际研讨会 (ISCSLP 2026) 邀您相聚马来西亚槟城！</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzI4OTQyNzA0Ng%3D%3D&amp;mid=2247544976&amp;idx=1&amp;sn=dc1d49eec285190f0da066086a7d3969</link>
      <pubDate>Mon, 13 Apr 2026 03:00:44 -0700</pubDate>
      <guid isPermaLink="false">633073</guid>
    </item>
    <item>
      <title>语音/音频处理学术速递[3.30]</title>
      <description><![CDATA[cs.SD语音9篇，eess.AS音频处理7篇]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzI4OTQyNzA0Ng%3D%3D&amp;mid=2247544680&amp;idx=3&amp;sn=481e008444f526046928f2e85b3151c9</link>
      <pubDate>Mon, 30 Mar 2026 03:08:39 -0700</pubDate>
      <guid isPermaLink="false">630630</guid>
    </item>
    <item>
      <title>Suno 5.5 发布 允许用户克隆声音演唱 AI 生成歌曲</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzI4OTQyNzA0Ng%3D%3D&amp;mid=2247544680&amp;idx=2&amp;sn=1284d747138a494153c7b44722c8f1dc</link>
      <pubDate>Mon, 30 Mar 2026 03:08:39 -0700</pubDate>
      <guid isPermaLink="false">630628</guid>
    </item>
    <item>
      <title>ICASSP 2026｜MeanVC：基于平均流的轻量级流式零样本语音转换</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzI4OTQyNzA0Ng%3D%3D&amp;mid=2247544680&amp;idx=1&amp;sn=be550df1d0c4764a623a4e5619f39e72</link>
      <pubDate>Mon, 30 Mar 2026 03:08:38 -0700</pubDate>
      <guid isPermaLink="false">630627</guid>
    </item>
    <item>
      <title>基于WeNet的关键词识别WeKws - WeNet keyword spotting-3-其他模型构造</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496939&amp;idx=4&amp;sn=4c3d2acbdfdc05231161c62acf39168a</link>
      <pubDate>Fri, 29 Jul 2022 19:00:39 -0700</pubDate>
      <guid isPermaLink="false">629374</guid>
    </item>
    <item>
      <title>基于WeNet的关键词识别WeKws - WeNet keyword spotting-2-TCN模型forward</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496939&amp;idx=3&amp;sn=5413692e8dbce0dac27cf24ffdebcc23</link>
      <pubDate>Fri, 29 Jul 2022 19:00:39 -0700</pubDate>
      <guid isPermaLink="false">629373</guid>
    </item>
    <item>
      <title>基于WeNet的关键词识别WeKws - WeNet keyword spotting-1-TCN模型构造</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496939&amp;idx=2&amp;sn=ca269d2d65c22a3fe7d09bb940224870</link>
      <pubDate>Fri, 29 Jul 2022 19:00:39 -0700</pubDate>
      <guid isPermaLink="false">629372</guid>
    </item>
    <item>
      <title>INTERSPEECH 2022论文解读｜Paraformer: 高识别率、高计算效率的单轮非自回归端到端语音识别模型</title>
      <description><![CDATA[Paraformer 模型在工业在数据上取得了与自回归模型类似的识别效果，计算效率提升 10 倍以上。]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496939&amp;idx=1&amp;sn=5aedc86899d5064fcb27583bf5c00180</link>
      <pubDate>Fri, 29 Jul 2022 19:00:38 -0700</pubDate>
      <guid isPermaLink="false">629362</guid>
    </item>
    <item>
      <title>极速上手新一代 Kaldi 服务端框架 sherpa</title>
      <description><![CDATA[本文介绍如何极速（而非快速）上手新一代 Kaldi 服务端框架 sherpa。]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496610&amp;idx=2&amp;sn=702413199010b8b2fff18c109b6eacbf</link>
      <pubDate>Wed, 20 Jul 2022 03:30:47 -0700</pubDate>
      <guid isPermaLink="false">629361</guid>
    </item>
    <item>
      <title>端到端语音识别应用基于前缀树的热词技术</title>
      <description><![CDATA[在深度学习火爆的今天，大规模数据下训练的大规模模型在线上任务中日益常见。随着大模型效果的提升，随之带来了一些]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496610&amp;idx=1&amp;sn=f61290bb301a4cae89ccf0e40462b301</link>
      <pubDate>Wed, 20 Jul 2022 03:30:46 -0700</pubDate>
      <guid isPermaLink="false">629360</guid>
    </item>
    <item>
      <title>论文分享|腾讯音乐天琴实验室两篇论文入选国际会议INTERSPEECH</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496482&amp;idx=2&amp;sn=8251ff59810cd7db14a5d62ee06edff0</link>
      <pubDate>Sat, 16 Jul 2022 03:30:47 -0700</pubDate>
      <guid isPermaLink="false">629359</guid>
    </item>
    <item>
      <title>IEEE TPAMI | 火山语音提出多源迁移高斯回归模型，效果超越多个SOTA方法</title>
      <description><![CDATA[该研究成果已被人工智能领域顶级国际期刊 IEEE TPAMI 接收。]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496482&amp;idx=1&amp;sn=b7c7abc9be451939e252f3ca4f46f2dd</link>
      <pubDate>Sat, 16 Jul 2022 03:30:46 -0700</pubDate>
      <guid isPermaLink="false">629358</guid>
    </item>
    <item>
      <title>论文推介：语音指令识别中的最小序列混淆错误准则</title>
      <description><![CDATA[作为语音识别领域的一项典型任务，语音指令识别（Speech Command Recognition，SCR）]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496436&amp;idx=2&amp;sn=4c37d9c3083c1b4f606acc6491028fd4</link>
      <pubDate>Thu, 14 Jul 2022 03:31:23 -0700</pubDate>
      <guid isPermaLink="false">629357</guid>
    </item>
    <item>
      <title>【语音之家】AI产业沙龙—智能语音技术在美团的应用实践</title>
      <description><![CDATA[直播时间：2022年7月15日 18:00 - 20:05]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496436&amp;idx=1&amp;sn=40ec5d167c75a93276ca51afe2e2de73</link>
      <pubDate>Thu, 14 Jul 2022 03:31:23 -0700</pubDate>
      <guid isPermaLink="false">629338</guid>
    </item>
    <item>
      <title>字节跳动 AI Lab 总监李航：语言模型的过去、现在和未来</title>
      <description><![CDATA[在未来几年，神经语言模型尤其是预训练的语言模型仍将是 NLP 最有力的工具。]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496373&amp;idx=2&amp;sn=281711deeff01720fb00eaf50344fd8f</link>
      <pubDate>Tue, 12 Jul 2022 03:31:40 -0700</pubDate>
      <guid isPermaLink="false">629337</guid>
    </item>
    <item>
      <title>新一代 Kaldi 中基于量化的蒸馏实验</title>
      <description><![CDATA[Dan哥的新型蒸馏方法]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496373&amp;idx=1&amp;sn=83341a63d8450889c0439a6b92644625</link>
      <pubDate>Tue, 12 Jul 2022 03:31:40 -0700</pubDate>
      <guid isPermaLink="false">629336</guid>
    </item>
    <item>
      <title>AIWIN 2022丨文本语音驱动数字人表情口型竞赛</title>
      <description><![CDATA[文本语音驱动数字人表情口型竞赛，一起探秘数字人。]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496327&amp;idx=2&amp;sn=d9320e99fe006766b6ecb6582c6d0e2c</link>
      <pubDate>Sat, 09 Jul 2022 04:02:16 -0700</pubDate>
      <guid isPermaLink="false">629334</guid>
    </item>
    <item>
      <title>论文分享丨NPU-ASLP实验室将携14篇论文参加语音旗舰会议INTERSPEECH2022</title>
      <description><![CDATA[作为语音相关研究领域的旗舰国际会议，INTERSPEECH2022（Annual Conference of]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496327&amp;idx=1&amp;sn=3934c9f011515101c700ae336e417155</link>
      <pubDate>Sat, 09 Jul 2022 04:02:16 -0700</pubDate>
      <guid isPermaLink="false">629333</guid>
    </item>
    <item>
      <title>论文分享丨基于随机循环一致性准则的语音信息分解工作获 Odyssey 最佳学生论文奖</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496241&amp;idx=2&amp;sn=8c9ed0a13aff52be3df983c4f32fee02</link>
      <pubDate>Thu, 07 Jul 2022 04:01:33 -0700</pubDate>
      <guid isPermaLink="false">629332</guid>
    </item>
    <item>
      <title>如何基于新一代 Kaldi 框架快速搭建服务端 ASR 系统</title>
      <description><![CDATA[如何基于新一代 Kaldi 框架快速搭建一个服务端的 ASR 系统]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496241&amp;idx=1&amp;sn=d412722ba58c56014d54f0a621bb03ac</link>
      <pubDate>Thu, 07 Jul 2022 04:01:33 -0700</pubDate>
      <guid isPermaLink="false">629314</guid>
    </item>
    <item>
      <title>论文分享 | THUHCSI人机语音交互实验室论文入选多媒体领域顶级国际会议ACM MM</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496194&amp;idx=3&amp;sn=38a26a9d6e56624f4f635ab5c86300d6</link>
      <pubDate>Tue, 05 Jul 2022 04:00:26 -0700</pubDate>
      <guid isPermaLink="false">629312</guid>
    </item>
    <item>
      <title>全球首个《AI对话系统分级定义》发布，这下语音助手有了强弱之分</title>
      <description><![CDATA[L0 ~ L5，AI对话系统领域有了自己的分级规范。]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496194&amp;idx=2&amp;sn=99c348c4b93aba26bfae2e1c2a605d60</link>
      <pubDate>Tue, 05 Jul 2022 04:00:25 -0700</pubDate>
      <guid isPermaLink="false">629310</guid>
    </item>
    <item>
      <title>【语音之家公开课】语音分离的神经网络方法 Speech Separation with Neural Network</title>
      <description><![CDATA[7月8日18:00，邹月娴进行分享！]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496194&amp;idx=1&amp;sn=ca6de9eba781847e2dcb7610c181b166</link>
      <pubDate>Tue, 05 Jul 2022 04:00:24 -0700</pubDate>
      <guid isPermaLink="false">629309</guid>
    </item>
    <item>
      <title>Reworked Conformer</title>
      <description><![CDATA[看Povey博士如何魔改Conformer]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496130&amp;idx=2&amp;sn=657cb8bfa4e2610f60410c7ecb94c798</link>
      <pubDate>Sat, 02 Jul 2022 04:00:29 -0700</pubDate>
      <guid isPermaLink="false">629308</guid>
    </item>
    <item>
      <title>如何打造真人化高表现力的语音合成系统</title>
      <description><![CDATA[高表现力语音合成逐渐成为未来的趋势。它有三个显著的特点：韵律自然、情感风格丰富和音质清澈。]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzU4MTA0NDE5NQ%3D%3D&amp;mid=2247496130&amp;idx=1&amp;sn=b2e8e7a4723d41de80c4871f913777ef</link>
      <pubDate>Sat, 02 Jul 2022 04:00:29 -0700</pubDate>
      <guid isPermaLink="false">629307</guid>
    </item>
    <item>
      <title>ICASSP 2026｜Phys-NVAS：基于视觉语言模型物理先验挖掘与3D声学环境建模的新视角声学合成</title>
      <description><![CDATA[]]></description>
      <link>http://mp.weixin.qq.com/s?__biz=MzI4OTQyNzA0Ng%3D%3D&amp;mid=2247544660&amp;idx=1&amp;sn=f4dfc47f37775070c428a8de20216888</link>
      <pubDate>Sat, 28 Mar 2026 03:00:30 -0700</pubDate>
      <guid isPermaLink="false">627673</guid>
    </item>
  </channel>
</rss>
