[{"@type":"PropertyValue","name":"Format","value":"48,000Hz, 24bit, uncompressed wav, mono channel;"},{"@type":"PropertyValue","name":"Recording environment","value":"professional recording studio;"},{"@type":"PropertyValue","name":"Recording content","value":"contains educational, game and general colloquial content;"},{"@type":"PropertyValue","name":"Speaker","value":"professional voice actor, two male and two female, 2 hours per person;"},{"@type":"PropertyValue","name":"Annotation","value":"word and phoneme transcription, prosodic boundary annotation;"},{"@type":"PropertyValue","name":"Device","value":"microphone;"},{"@type":"PropertyValue","name":"Language","value":"Hong Kong Cantonese;"},{"@type":"PropertyValue","name":"Application scenarios","value":"speech synthesis."}]
{"id":1569,"datatype":"1","titleimg":"https://www.nexdata.ai/shujutang/static/image/index/datatang_yuyin_default.webp","type1":"165","type1str":null,"type2":"219","type2str":null,"dataname":"8 Hours – Cantonese Speech Dataset for TTS (Hong Kong)","datazy":[{"title":"Format","content":"48,000Hz, 24bit, uncompressed wav, mono channel;"},{"title":"Recording environment","content":"professional recording studio;"},{"title":"Recording content","content":"contains educational, game and general colloquial content;"},{"title":"Speaker","content":"professional voice actor, two male and two female, 2 hours per person;"},{"title":"Annotation","content":"word and phoneme transcription, prosodic boundary annotation;"},{"title":"Device","content":"microphone;"},{"title":"Language","content":"Hong Kong Cantonese;"},{"title":"Application scenarios","content":"speech synthesis."}],"datatag":"Synthesis Corpus,TTS,Hong Kong Cantonese","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":null,"samplePresentation":[{"name":"100001.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250809222008/100001.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=VEwdNnttbLTmbyQWk7%2BRvR4XKfk%3D","intro":"佢哋#1產生喺#1新文化#1運動#1之後#4。 keoi5 dei6 caan2 sang1 hai2 san1 man4 faa3 wan6 dung6 zi1 hau6","size":437402,"progress":100,"type":"mp3"},{"name":"100003.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250809222008/100003.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=w8qDZpFMFMH2bZnUXwoZnHYJJAI%3D","intro":"好多#1遊戲#1都#1只係#1換個#1皮膚#1做#1副本#4。 hou2 do1 jau4 hei3 dou1 zi2 hai6 wun6 go3 pei4 fu1 zou6 fu3 
bun2","size":469736,"progress":100,"type":"mp3"},{"name":"100004.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250809222008/100004.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=CJ5BSLriTZSWJGdk8QmfDEfFpB4%3D","intro":"事物#1相應嘅#1心理#1需要#1而#1產生#4。 si6 mat6 soeng1 jing3 ge3 sam1 lei5 seoi1 jiu3 ji4 caan2 sang1","size":470768,"progress":100,"type":"mp3"},{"name":"100005.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250809222008/100005.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=T1a18vKWU8PBKdguc3mutG7VA4U%3D","intro":"你#1日頭#1又#1可以#2夜晚#1又#1可以#4。 lei5 jat6 tau2 jau6 ho2 ji3 je6 maan5 jau6 ho2 ji3","size":415296,"progress":100,"type":"mp3"}],"officialSummary":"This dataset features recordings from 4 native Hong Kong Cantonese speakers. The corpus contain educational, game and general colloquial content. The phoneme coverage is balanced. Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.","dataexampl":null,"datakeyword":["Cantonese speech dataset","Hong Kong Cantonese speech corpus","Cantonese text-to-speech dataset","Cantonese voice dataset for AI","native Cantonese speech recordings","Cantonese TTS dataset","Hong Kong accent speech dataset"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Language,Voice Type","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechSyn","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
8 Hours – Cantonese Speech Dataset for TTS (Hong Kong)
Cantonese speech dataset
Hong Kong Cantonese speech corpus
Cantonese text-to-speech dataset
Cantonese voice dataset for AI
native Cantonese speech recordings
Cantonese TTS dataset
Hong Kong accent speech dataset
This dataset features recordings from 4 native Hong Kong Cantonese speakers. The corpus contains educational, game and general colloquial content. The phoneme coverage is balanced. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.
This is a paid dataset for commercial use, research purposes and more. Licensed ready-made datasets help jump-start AI projects.
Specifications
Format
48,000Hz, 24bit, uncompressed wav, mono channel;
Recording environment
professional recording studio;
Recording content
contains educational, game and general colloquial content;
Speaker
professional voice actor, two male and two female, 2 hours per person;
Annotation
word and phoneme transcription, prosodic boundary annotation;