
{"id":7542,"date":"2026-01-26T04:39:34","date_gmt":"2026-01-25T20:39:34","guid":{"rendered":"https:\/\/infernews.com\/?page_id=7542"},"modified":"2026-02-24T00:08:28","modified_gmt":"2026-02-23T16:08:28","slug":"asr-tts","status":"publish","type":"page","link":"https:\/\/infernews.com\/blog\/asr-tts\/","title":{"rendered":"ASR &#8211; TTS \u958b\u6e90\u7cb5\u8a9e\u8a9e\u97f3"},"content":{"rendered":"<figure class=\"wp-block-embed-youtube wp-block-embed is-type-video is-provider-youtube wp-embed-aspect-16-9 wp-has-aspect-ratio\"><div class=\"lyte-wrapper\" title=\"WenetSpeech-Yue (Cantonese Version)\" style=\"width:853px;max-width:100%;margin:5px auto;\"><div class=\"lyMe\" id=\"WYL_ApuVgdgg4Io\" itemprop=\"video\" itemscope itemtype=\"https:\/\/schema.org\/VideoObject\"><div><meta itemprop=\"thumbnailUrl\" content=\"https:\/\/infernews.com\/blog\/wp-content\/plugins\/wp-youtube-lyte\/lyteCache.php?origThumbUrl=https%3A%2F%2Fi.ytimg.com%2Fvi%2FApuVgdgg4Io%2Fhqdefault.jpg\" \/><meta itemprop=\"embedURL\" content=\"https:\/\/www.youtube.com\/embed\/ApuVgdgg4Io\" \/><meta itemprop=\"duration\" content=\"PT7M24S\" \/><meta itemprop=\"uploadDate\" content=\"2025-09-08T03:10:36Z\" \/><\/div><div id=\"lyte_ApuVgdgg4Io\" data-src=\"https:\/\/infernews.com\/blog\/wp-content\/plugins\/wp-youtube-lyte\/lyteCache.php?origThumbUrl=https%3A%2F%2Fi.ytimg.com%2Fvi%2FApuVgdgg4Io%2Fhqdefault.jpg\" class=\"pL\"><div class=\"tC\"><div class=\"tT\" itemprop=\"name\">WenetSpeech-Yue (Cantonese Version)<\/div><\/div><div class=\"play\"><\/div><div class=\"ctrl\"><div class=\"Lctrl\"><\/div><div class=\"Rctrl\"><\/div><\/div><\/div><noscript><a href=\"https:\/\/youtu.be\/ApuVgdgg4Io\" rel=\"nofollow\"><img loading=\"lazy\" decoding=\"async\" src=\"https:\/\/infernews.com\/blog\/wp-content\/plugins\/wp-youtube-lyte\/lyteCache.php?origThumbUrl=https%3A%2F%2Fi.ytimg.com%2Fvi%2FApuVgdgg4Io%2F0.jpg\" alt=\"WenetSpeech-Yue (Cantonese Version)\" width=\"853\" height=\"460\" \/><br \/>Watch this video on YouTube<\/a><\/noscript><meta itemprop=\"description\" content=\"A Large-scale Cantonese Speech Corpus with Multi-dimensional Annotation\"><\/div><\/div><div class=\"lL\" style=\"max-width:100%;width:853px;margin:5px auto;\"><\/div><figcaption><\/figcaption><\/figure>\n\n\n<p><\/p>\n\n\n\n<hr class=\"wp-block-separator has-alpha-channel-opacity\"\/>\n\n\n<div class=\"vlp-link-container vlp-layout-spotlight-clone wp-block-visual-link-preview-link\"><a href=\"https:\/\/aslp-lab.github.io\/WenetSpeech-Yue\/\" class=\"vlp-link\" title=\"WenetSpeech-Yue\" rel=\"nofollow\" target=\"_blank\"><\/a><div class=\"vlp-layout-zone-main\"><span class=\"vlp-block-0 vlp-link-title\">WenetSpeech-Yue<\/span><div class=\"vlp-block-1 vlp-link-summary\">A Large-Scale Cantonese Speech Corpus with Multi-dimensional Annotation<\/div><div class=\"vlp-block-2 vlp-link-image\"><img loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"451\" src=\"https:\/\/infernews.com\/blog\/wp-content\/uploads\/2026\/01\/WenetSpeech-Yue.jpg\" class=\"attachment-large size-large not-transparent\" alt=\"\" srcset=\"https:\/\/infernews.com\/blog\/wp-content\/uploads\/2026\/01\/WenetSpeech-Yue.jpg 1024w, https:\/\/infernews.com\/blog\/wp-content\/uploads\/2026\/01\/WenetSpeech-Yue-300x132.jpg 300w, https:\/\/infernews.com\/blog\/wp-content\/uploads\/2026\/01\/WenetSpeech-Yue-768x338.jpg 768w\" sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" data-has-transparency=\"false\" data-dominant-color=\"d8dada\" style=\"max-width: 1024px;--dominant-color: #d8dada;\" \/><\/div><\/div><\/div>\n\n<div class=\"vlp-link-container vlp-layout-spotlight-clone wp-block-visual-link-preview-link\"><a href=\"https:\/\/canclid.github.io\/zoengjyutgaai\/\" class=\"vlp-link\" title=\"\u5f35\u60a6\u6977\u8b1b\u53e4\u8a9e\u97f3\u6578\u64da\u96c6 The Zoeng Jyut Gaai Storytelling Speech Dataset\" rel=\"nofollow\" target=\"_blank\"><\/a><div class=\"vlp-layout-zone-main\"><span class=\"vlp-block-0 vlp-link-title\">\u5f35\u60a6\u6977\u8b1b\u53e4\u8a9e\u97f3\u6578\u64da\u96c6 The Zoeng Jyut Gaai Storytelling Speech Dataset<\/span><div class=\"vlp-block-1 vlp-link-summary\">\u958b\u6e90\u7cb5\u8a9e\u8a9e\u97f3\u6578\u64da\u96c6\uff0c\u9069\u5408\u8a9e\u97f3\u8b58\u5225\u3001\u8a9e\u97f3\u5408\u6210\u3001\u5927\u8a9e\u8a00\u6a21\u578b\u3001\u8a9e\u8a00\u5b78\u6587\u5b78\u7814\u7a76\u7b49\u61c9\u7528 Open-sourced Cantonese speech dataset for ASR, TTS, LLM, linguistics research and more<\/div><div class=\"vlp-block-2 vlp-link-image\"><img decoding=\"async\" src=\"https:\/\/canclid.github.io\/zoengjyutgaai\/zoengjyutgaai.webp\" style=\"max-width: 1024px; max-height: 1024px\" \/><\/div><\/div><\/div>\n\n\n<p><\/p>\n","protected":false},"excerpt":{"rendered":"","protected":false},"author":1,"featured_media":0,"parent":0,"menu_order":0,"comment_status":"closed","ping_status":"closed","template":"","meta":{"googlesitekit_rrm_CAowvqSiDA:productID":"","footnotes":""},"class_list":["post-7542","page","type-page","status-publish","hentry"],"_links":{"self":[{"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/pages\/7542","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/pages"}],"about":[{"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/types\/page"}],"author":[{"embeddable":true,"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/comments?post=7542"}],"version-history":[{"count":5,"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/pages\/7542\/revisions"}],"predecessor-version":[{"id":7721,"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/pages\/7542\/revisions\/7721"}],"wp:attachment":[{"href":"https:\/\/infernews.com\/blog\/wp-json\/wp\/v2\/media?parent=7542"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}