[{"@type":"PropertyValue","name":"Format","value":"48,000Hz, 24bit, uncompressed wav, mono channel;"},{"@type":"PropertyValue","name":"Recording environment","value":"professional recording studio;"},{"@type":"PropertyValue","name":"Recording content","value":"general narrative sentences, interrogative sentences, etc;"},{"@type":"PropertyValue","name":"Speaker","value":"british native speaker, 5 male and 5 female, 2 hours per person;"},{"@type":"PropertyValue","name":"Device","value":"microphone;"},{"@type":"PropertyValue","name":"Language","value":"British English;"},{"@type":"PropertyValue","name":"Annotation","value":"word and phoneme transcription, four-level prosodic boundary annotation;"},{"@type":"PropertyValue","name":"Application scenarios","value":"speech synthesis."}]
{"id":1309,"datatype":"1","titleimg":"/shujutang/static/image/index/datatang_yuyin_default.webp","type1":"165","type1str":null,"type2":"165","type2str":null,"dataname":"10 People - British English Average Tone Speech Synthesis Corpus","datazy":[{"title":"Format","value":"48,000Hz, 24bit, uncompressed wav, mono channel;"},{"title":"Recording environment","value":"professional recording studio;"},{"title":"Recording content","value":"general narrative sentences, interrogative sentences, etc;"},{"title":"Speaker","value":"british native speaker, 5 male and 5 female, 2 hours per person;"},{"title":"Device","value":"microphone;"},{"title":"Language","value":"British English;"},{"title":"Annotation","value":"word and phoneme transcription, four-level prosodic boundary annotation;"},{"title":"Application scenarios","value":"speech synthesis."}],"datatag":"English,Tts,British English,Average Tone","technologydoc":null,"downurl":null,"datainfo":"","standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230812002_demo1699437601234/APY230812002_demo/002256.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=%2BHJ4HkASPXXwA7c4hgakyICBGkU%3D","/data/apps/damp/temp/ziptemp/APY230812002_demo1699437601234/APY230812002_demo/002256.wav","Carville was a Louisiana Cajun and ex marine/ who had- a great strategic sense%.K AA1 . V IH2 L / W AA1 Z / AX0 / L UW0 . IY1 . Z IY0 . AE2 . N AX0 / K EY1 . JH AX0 N / AX0 N D / EH1 K S / M AX0 . R IY1 N / HH UW1 / HH AE1 D / AX0 / G R EY1 T3 / S T R AX0 . T IY1 . 
JH IH0 K / S EH1 N S"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230812002_demo1699437601234/APY230812002_demo/002022.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=WXpZl9Nc8CO2%2BGbIhNHYEH3kKKg%3D","/data/apps/damp/temp/ziptemp/APY230812002_demo1699437601234/APY230812002_demo/002022.wav","I don't feel very well%.AY1 / D OW1 N T3 / F IY1 L / V EH1 . R IY0 / W EH1 L"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230812002_demo1699437601234/APY230812002_demo/001934.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=MBx0DzNxXrt%2BHjwGHlgP2hKls%2Fc%3D","/data/apps/damp/temp/ziptemp/APY230812002_demo1699437601234/APY230812002_demo/001934.wav","No American President had been there- in/ twenty years%.N OW13 / AX0 . M EH1 . R AX0 . K AX0 N / P R EH1 . Z AX0 . D EH2 N T / HH AE1 D / B IH1 N / DH EH1 R / IH0 N / T W EH1 N . T IY0 / Y IH1 R Z"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230812002_demo1699437601234/APY230812002_demo/001433.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=%2BCG6azbNrvwWodlfe4HkdmFgQWg%3D","/data/apps/damp/temp/ziptemp/APY230812002_demo1699437601234/APY230812002_demo/001433.wav","I don't/ like to speak- about/ things which I don't understand%.AY1 / D OW1 N T / L AY1 K / T UW1 / S P IY1 K3 / AX0 . B AW1 T / TH IH1 NG Z / W IH1 CH / AY1 / D OW1 N T / AH2 N . D AX0 . S T AE1 N D"]],"officialSummary":"10 People - British English Average Tone Speech Synthesis Corpus. It is recorded by British English native speakers, with authentic accent. The phoneme coverage is balanced. Professional phonetician participates in the annotation. 
It precisely matches with the research and development needs of the speech synthesis.","dataexampl":"","datakeyword":["TTS","British English","Average Tone"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Voice Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechSyn","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"],"single":"no"}
10 People - British English Average Tone Speech Synthesis Corpus
TTS
British English
Average Tone
10 People - British English Average Tone Speech Synthesis Corpus. It is recorded by British English native speakers, with authentic accent. The phoneme coverage is balanced. Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.
This is a paid dataset for commercial use, research purposes, and more. Licensed ready-made datasets help jump-start AI projects.
Specifications
Format
48,000Hz, 24bit, uncompressed wav, mono channel;
Recording environment
professional recording studio;
Recording content
general narrative sentences, interrogative sentences, etc;
Speaker
british native speaker, 5 male and 5 female, 2 hours per person;
Device
microphone;
Language
British English;
Annotation
word and phoneme transcription, four-level prosodic boundary annotation;
Application scenarios
speech synthesis.
Sample
Audio
Carville was a Louisiana Cajun and ex marine/ who had- a great strategic sense%.K AA1 . V IH2 L / W AA1 Z / AX0 / L UW0 . IY1 . Z IY0 . AE2 . N AX0 / K EY1 . JH AX0 N / AX0 N D / EH1 K S / M AX0 . R IY1 N / HH UW1 / HH AE1 D / AX0 / G R EY1 T3 / S T R AX0 . T IY1 . JH IH0 K / S EH1 N S
Audio
I don't feel very well%.AY1 / D OW1 N T3 / F IY1 L / V EH1 . R IY0 / W EH1 L
Audio
No American President had been there- in/ twenty years%.N OW13 / AX0 . M EH1 . R AX0 . K AX0 N / P R EH1 . Z AX0 . D EH2 N T / HH AE1 D / B IH1 N / DH EH1 R / IH0 N / T W EH1 N . T IY0 / Y IH1 R Z
Audio
I don't/ like to speak- about/ things which I don't understand%.AY1 / D OW1 N T / L AY1 K / T UW1 / S P IY1 K3 / AX0 . B AW1 T / TH IH1 NG Z / W IH1 CH / AY1 / D OW1 N T / AH2 N . D AX0 . S T AE1 N D
Recommended Dataset
26.1 Hours - Chinese Mandarin Synthesis Corpus-Female, Customer Service
26.1 Hours - Chinese Mandarin Synthesis Corpus-Female, Customer Service. It is recorded by Chinese native speakers, with a lively and friendly voice. The phoneme coverage is balanced. Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.
Synthesis Corpus, TTS, Mandarin, Female, Customer Service
6.78 Hours - Chinese Mandarin Speech Synthesis Corpus-Female Imitating Children
Female audio data of adults imitating children, 6599 sentences in total and 6.78 hours. It is recorded by Chinese native speakers, with authentic accent and sweet sound. The phoneme coverage is balanced. Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.
TTS, Chinese, Children
19.46 Hours - American English Speech Synthesis Corpus-Female
Female audio data of American English. It is recorded by a native American English speaker, with authentic accent and sweet sound. The phoneme coverage is balanced. Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.
TTS, American English, Female
4 People - Northeastern dialect Average Tone Speech Synthesis Corpus
4 People - Northeastern dialect Average Tone Speech Synthesis Corpus. It is recorded by native speakers from Northeast China. About 40% of the corpus contains words unique to Northeast China; the phonemes and tones are balanced. Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.
10 Hours - Chaozhou Dialect Speech Synthesis Corpus - Female
10 Hours - Chaozhou Dialect Speech Synthesis Corpus - Female. It is recorded in Chaozhou-Shantou pronunciation. The phonemes and tones are balanced. Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.
Synthesis CorpusTTSFemaleGeneralChaozhouDialect
2 People - Mexican Spanish Average Tone Speech Synthesis Corpus
2 People - Mexican Spanish Average Tone Speech Synthesis Corpus. It is recorded by native Mexican speakers, with authentic accent, covering both customer service and general styles. The phoneme coverage is balanced. Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.
TTSMexicanSpanishAverage Tone
2 People - Spanish Average Tone Speech Synthesis Corpus
2 People - Spanish Average Tone Speech Synthesis Corpus. It is recorded by native Spaniards, with authentic accent. The phoneme coverage is balanced. Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.
TTSSpanishAverage Tone
2 People - New Zealand English Average Tone Speech Synthesis Corpus
2 People - New Zealand English Average Tone Speech Synthesis Corpus. It is recorded by native New Zealanders, with authentic accent. The phoneme coverage is balanced. Professional phonetician participates in the annotation. It precisely matches with the research and development needs of the speech synthesis.