[{"@type":"PropertyValue","name":"Format","value":"44,100Hz, 16bit, uncompressed wav, mono channel;"},{"@type":"PropertyValue","name":"Recording environment","value":"quiet indoor environment, low background noise, without echo;"},{"@type":"PropertyValue","name":"Recording content","value":"news and colloquial sentences;"},{"@type":"PropertyValue","name":"Speaker","value":"9 males, 29 females;"},{"@type":"PropertyValue","name":"Device","value":"microphone;"},{"@type":"PropertyValue","name":"Language","value":"Cantonese, English;"},{"@type":"PropertyValue","name":"Annotation","value":"word and phoneme transcription, prosodic boundary annotation;"},{"@type":"PropertyValue","name":"Application scenarios","value":"speech synthesis."}]
{"id":1201,"datatype":"1","titleimg":"https://res.datatang.com/asset/productNew/APY221030001.png?Expires=2007353716&OSSAccessKeyId=LTAI5tQwXnJZbubgVfVa1ep9&Signature=l0UgJBrdkzvD1ShKlGzGoeMzuZo%3D","type1":"165","type1str":null,"type2":"165","type2str":null,"dataname":"38 People - Hong Kong Cantonese Average Tone Speech Synthesis Corpus","datazy":[{"title":"Format","value":"44,100Hz, 16bit, uncompressed wav, mono channel;"},{"title":"Recording environment","value":"quiet indoor environment, low background noise, without echo;"},{"title":"Recording content","value":"news and colloquial sentences;"},{"title":"Speaker","value":"9 males, 29 females;"},{"title":"Device","value":"microphone;"},{"title":"Language","value":"Cantonese, English;"},{"title":"Annotation","value":"word and phoneme transcription, prosodic boundary annotation;"},{"title":"Application scenarios","value":"speech synthesis."}],"datatag":"Tts","technologydoc":null,"downurl":null,"datainfo":"","standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY221030001_demo1713261600124/APY221030001_demo/280002.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=J7FTsOeBKqJDsGSCcKOvgDkpoio%3D","/data/apps/damp/temp/ziptemp/APY221030001_demo1713261600124/APY221030001_demo/280002.wav","280002fgf咁你#1即係#1declare咗#1你有#1两份#1收入#4fgfgam2 nei5 zik1 hai6 / D IH0 . 
K L EH1 R / zo2 nei5 jau5 loeng5 fan6 sau1 jap6"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY221030001_demo1713261600124/APY221030001_demo/040001.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=HK82e8kgqHHJ6HvPPuvvQ8dsMBs%3D","/data/apps/damp/temp/ziptemp/APY221030001_demo1713261600124/APY221030001_demo/040001.wav","040001fgf我#1唔太鐘意#1畀人#1話我#1cute#4fgfngo5 m4 taai3 zung1 ji3 bei2 jan4 waa6 ngo5 / K Y UW1 T"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY221030001_demo1713261600124/APY221030001_demo/000001.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=YxUL5eh6hQp5tEw4Y7g6k5uyIr0%3D","/data/apps/damp/temp/ziptemp/APY221030001_demo1713261600124/APY221030001_demo/000001.wav","000001fgfSend嗰#1message#1俾我啊#4fgfS EH1 N D / go3 / M EH1 . S IH0 JH / bei2 ngo5 aa1"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY221030001_demo1713261600124/APY221030001_demo/070001.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=mt8F6OBallpTQrTIxeXatBHqwKU%3D","/data/apps/damp/temp/ziptemp/APY221030001_demo1713261600124/APY221030001_demo/070001.wav","070001fgfDepends on#2你想#1揾#1咩工#4fgfD IH0 . P EH1 N D Z AA1 N nei5 soeng2 wan2 me1 gung1"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY221030001_demo1713261600124/APY221030001_demo/350001.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=XahBgUzJpjZJTHQYbxR52VGhAeo%3D","/data/apps/damp/temp/ziptemp/APY221030001_demo1713261600124/APY221030001_demo/350001.wav","350001fgf識得#1佢耐#3你#1就知#1佢#1好funny#4fgfsik1 dak1 keoi5 noi6 nei5 zau6 zi1 keoi5 hou2 / F AH1 . N IH0"]],"officialSummary":"38 People - Hong Kong Cantonese Average Tone Speech Synthesis Corpus, It is recorded by Hong Kong native speakers. 
Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.","dataexampl":"","datakeyword":["Synthesis Corpus","TTS","Female","General","Male","english"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Voice Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechSyn","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"],"single":"no"}
38 People - Hong Kong Cantonese Average Tone Speech Synthesis Corpus
Synthesis Corpus
TTS
Female
General
Male
english
38 People - Hong Kong Cantonese Average Tone Speech Synthesis Corpus. It is recorded by native Hong Kong speakers. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.
This is a paid dataset for commercial use, research purposes, and more. Licensed, ready-made datasets help jump-start AI projects.
Specifications
Format
44,100Hz, 16bit, uncompressed wav, mono channel;
Recording environment
quiet indoor environment, low background noise, without echo;
Recording content
news and colloquial sentences;
Speaker
9 males, 29 females;
Device
microphone;
Language
Cantonese, English;
Annotation
word and phoneme transcription, prosodic boundary annotation;
Application scenarios
speech synthesis.
Sample
Audio
280002fgf咁你#1即係#1declare咗#1你有#1两份#1收入#4fgfgam2 nei5 zik1 hai6 / D IH0 . K L EH1 R / zo2 nei5 jau5 loeng5 fan6 sau1 jap6
Audio
040001fgf我#1唔太鐘意#1畀人#1話我#1cute#4fgfngo5 m4 taai3 zung1 ji3 bei2 jan4 waa6 ngo5 / K Y UW1 T
Audio
000001fgfSend嗰#1message#1俾我啊#4fgfS EH1 N D / go3 / M EH1 . S IH0 JH / bei2 ngo5 aa1
Audio
070001fgfDepends on#2你想#1揾#1咩工#4fgfD IH0 . P EH1 N D Z AA1 N nei5 soeng2 wan2 me1 gung1
Audio
350001fgf識得#1佢耐#3你#1就知#1佢#1好funny#4fgfsik1 dak1 keoi5 noi6 nei5 zau6 zi1 keoi5 hou2 / F AH1 . N IH0
Recommended Dataset
4 People - Northeastern dialect Average Tone Speech Synthesis Corpus
4 People - Northeastern dialect Average Tone Speech Synthesis Corpus. It is recorded by native speakers from Northeast China. About 40% of the corpus contains words unique to Northeast China, and the phonemes and tones are balanced. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.
2 People - Japanese Average Tone Speech Synthesis Corpus
2 People - Japanese Average Tone Speech Synthesis Corpus. It is recorded by native Japanese speakers with authentic accents. It contains a general corpus in news and colloquial styles, and the phoneme coverage is balanced. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.
TTS, Japanese, Average Tone
10 Hours - Chaozhou Dialect Speech Synthesis Corpus - Female
10 Hours - Chaozhou Dialect Speech Synthesis Corpus - Female. It is recorded in Chaozhou-Shantou pronunciation. The phonemes and tones are balanced. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.
Synthesis Corpus, TTS, Female, General, Chaozhou, Dialect
2 People - Mexican Spanish Average Tone Speech Synthesis Corpus
2 People - Mexican Spanish Average Tone Speech Synthesis Corpus. It is recorded by native Mexican speakers with authentic accents, covering both customer service and general styles. The phoneme coverage is balanced. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.
TTS, Mexican, Spanish, Average Tone
2 People - Spanish Average Tone Speech Synthesis Corpus
2 People - Spanish Average Tone Speech Synthesis Corpus. It is recorded by native speakers from Spain with authentic accents. The phoneme coverage is balanced. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.
TTS, Spanish, Average Tone
2 People - New Zealand English Average Tone Speech Synthesis Corpus
2 People - New Zealand English Average Tone Speech Synthesis Corpus. It is recorded by native New Zealanders with authentic accents. The phoneme coverage is balanced. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.
TTS, New Zealand English, Average Tone
20 Hours - Sichuan Dialect Speech Synthesis Corpus - Female
20 Hours - Sichuan Dialect Speech Synthesis Corpus - Female. It is recorded in Chengdu Sichuan pronunciation. The phonemes and tones are balanced. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.
Synthesis Corpus, TTS, Female, General, Sichuan, Dialect
10 People - British English Average Tone Speech Synthesis Corpus
10 People - British English Average Tone Speech Synthesis Corpus. It is recorded by native British English speakers with authentic accents. The phoneme coverage is balanced. Professional phoneticians participate in the annotation. It precisely matches the research and development needs of speech synthesis.