[{"@type":"PropertyValue","name":"Format","value":"48,000Hz, 24bit, uncompressed wav, mono channel;"},{"@type":"PropertyValue","name":"Recording environment","value":"professional recording studio;"},{"@type":"PropertyValue","name":"Recording content","value":"contains educational, game and general colloquial content;"},{"@type":"PropertyValue","name":"Speaker","value":"professional voice actor, two male and two female, 2 hours per person;"},{"@type":"PropertyValue","name":"Annotation","value":"word and phoneme transcription, prosodic boundary annotation;"},{"@type":"PropertyValue","name":"Device","value":"microphone;"},{"@type":"PropertyValue","name":"Language","value":"Cantonese;"},{"@type":"PropertyValue","name":"Application scenarios","value":"speech synthesis."}]
{"id":1568,"datatype":"1","titleimg":"https://www.nexdata.ai/shujutang/static/image/index/datatang_yuyin_default.webp","type1":"165","type1str":null,"type2":"219","type2str":null,"dataname":"4 People - Cantonese Average Tone Speech Synthesis Corpus","datazy":[{"title":"Format","content":"48,000Hz, 24bit, uncompressed wav, mono channel;"},{"title":"Recording environment","content":"professional recording studio;"},{"title":"Recording content","content":"contains educational, game and general colloquial content;"},{"title":"Speaker","content":"professional voice actor, two male and two female, 2 hours per person;"},{"title":"Annotation","content":"word and phoneme transcription, prosodic boundary annotation;"},{"title":"Device","content":"microphone;"},{"title":"Language","content":"Cantonese;"},{"title":"Application scenarios","content":"speech synthesis."}],"datatag":"Synthesis Corpus,TTS,Cantonese","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":null,"samplePresentation":[{"name":"200001.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250809222008/200001.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=%2BAY2dp1kQW7BvpcceiWPQipnpzo%3D","intro":"呢个#1都#1可以#1值得#1考虑#1一下嘅#4。\tni1 go3 dou1 ho2 ji3 zik6 dak1 haau2 leoi6 jat1 haa5 ge3","size":376116,"progress":100,"type":"mp3"},{"name":"200002.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250809222008/200002.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=BsjU8nsdUJ8IHf78C4t8PjdYwiU%3D","intro":"盛赞#1布兰卡奇#1礼拜堂#2为#1艺术#1大师#1学校#4。\tsing6 zaan3 bou3 laan4 kaa1 kei4 lai5 baai3 tong2 wai4 ngai6 seot6 daai6 si1 hok6 
haau6","size":560840,"progress":100,"type":"mp3"},{"name":"200003.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250809222008/200003.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=C3LSZhhEGixBYBRasQGRmsbciLE%3D","intro":"玩耐咗#2就#1可以#1获得#3活动#1经验#1同#1硬币#4。\twaan2 noi6 zo2 zau6 ho2 ji3 wok6 dak1 wut6 dung6 ging1 jim6 tung4 ngaang6 bai6","size":556736,"progress":100,"type":"mp3"},{"name":"200004.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250809222008/200004.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=vr8NK4zM8kvLM3MHmhKaZ%2Bb81XU%3D","intro":"房间#1可能#1酒店#1最好#1近#1海边啦#4。\tfong4 gaan1 ho2 nang4 zau2 dim3 zeoi3 hou2 kan5 hoi2 bin1 laa1","size":435200,"progress":100,"type":"mp3"},{"name":"200005.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250809222008/200005.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=7%2FLka1KhsyS3y%2B7UCSyD0qRCWhQ%3D","intro":"指喺#1正文中#3,表达嘅#1中心#3,具有#1实质性#1意义嘅词#4。\tzi2 hai2 zing3 man4 zung1 biu2 daat6 ge3 zung1 sam1 geoi6 jau5 sat6 zat1 sing3 ji3 ji6 ge3 ci4","size":657146,"progress":100,"type":"mp3"}],"officialSummary":"4 People - Cantonese Average Tone Speech Synthesis Corpus,recorded by native of Guangdong. The corpus contain educational, game and general colloquial content. The phoneme coverage is balanced. Professional phonetician participates in the annotation. 
It precisely matches with the research and development needs of the speech synthesis.","dataexampl":null,"datakeyword":["Synthesis Corpus","TTS","Cantonese"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Language,Voice Type","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechSyn","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
4 People - Cantonese Average Tone Speech Synthesis Corpus
Synthesis Corpus
TTS
Cantonese
4 People - Cantonese Average Tone Speech Synthesis Corpus, recorded by natives of Guangdong. The corpus contains educational, game and general colloquial content. The phoneme coverage is balanced. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.
This is a paid dataset for commercial use, research purposes, and more. Licensed ready-made datasets help jump-start AI projects.
Specifications
Format
48,000Hz, 24bit, uncompressed wav, mono channel;
Recording environment
professional recording studio;
Recording content
contains educational, game and general colloquial content;
Speaker
professional voice actor, two male and two female, 2 hours per person;
Annotation
word and phoneme transcription, prosodic boundary annotation;