[{"@type":"PropertyValue","name":"Format","value":"48,000Hz, 24bit, uncompressed wav, mono channel;"},{"@type":"PropertyValue","name":"Recording environment","value":"professional recording studio;"},{"@type":"PropertyValue","name":"Recording content","value":"Given topic, speaker's self-expression;"},{"@type":"PropertyValue","name":"Speaker","value":"professional Character Voice, natural conversation, not reading aloud, one male voice, one female voice;"},{"@type":"PropertyValue","name":"Annotation","value":"word and pinyin transcription, prosodic boundary annotation, secondary language annotation;"},{"@type":"PropertyValue","name":"Device","value":"microphone;"},{"@type":"PropertyValue","name":"Language","value":"chinese, chinese/english mixed;"},{"@type":"PropertyValue","name":"Application scenarios","value":"speech synthesis."}]
{"id":1470,"datatype":"1","titleimg":"/shujutang/static/image/index/datatang_yuyin_default.webp","type1":"165","type1str":null,"type2":"219","type2str":null,"dataname":"2 People - Chinese Natural Conversation Speech Synthesis Corpus","datazy":[{"title":"Format","desc":"Format","content":"48,000Hz, 24bit, uncompressed wav, mono channel;"},{"title":"Recording environment","desc":"Recording environment","content":"professional recording studio;"},{"title":"Recording content","desc":"Recording content","content":"Given topic, speaker's self-expression;"},{"title":"Speaker","desc":"Speaker","content":"professional Character Voice, natural conversation, not reading aloud, one male voice, one female voice;"},{"title":"Annotation","desc":"Annotation","content":"word and pinyin transcription, prosodic boundary annotation, secondary language annotation;"},{"title":"Device","desc":"Device","content":"microphone;"},{"title":"Language","desc":"Language","content":"chinese, chinese/english mixed;"},{"title":"Application scenarios","desc":"Application scenarios","content":"speech synthesis."}],"datatag":"Natural conservation,Secondary language,TTS","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[],"officialSummary":"2 People - Chinese Natural Conversation Speech Synthesis Corpus. It is recorded by Chinese native speaker, natural conversation style. phonemes and tones are balanced. Professional phonetician participates in the annotation, and annotate secondary language, Secondary Language Annotation: Inhalation: V; Pause: P; Hesitation: T; Mouth clicking: M; Drawl: D; Cough: C; Laughter: L; Stutter repetition: R; Inversion: I; Modal particle: S (Modal particles include \"ah\", \"oh\", \"wow\", \"right?\", \"what?\", \"well\" etc.). 
It precisely matches with the research and development needs of the speech synthesis.","dataexampl":null,"datakeyword":["Natural conservation","Secondary language","TTS"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Voice Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechSyn","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
2 People - Chinese Natural Conversation Speech Synthesis Corpus
Natural conversation
Secondary language
TTS
2 People - Chinese Natural Conversation Speech Synthesis Corpus. It is recorded by native Chinese speakers in a natural conversation style. Phonemes and tones are balanced. Professional phoneticians participate in the annotation and annotate secondary language. Secondary Language Annotation: Inhalation: V; Pause: P; Hesitation: T; Mouth clicking: M; Drawl: D; Cough: C; Laughter: L; Stutter repetition: R; Inversion: I; Modal particle: S (Modal particles include "ah", "oh", "wow", "right?", "what?", "well", etc.). It precisely matches the research and development needs of speech synthesis.
This is a paid dataset for commercial use, research purposes, and more. Licensed ready-made datasets help jump-start AI projects.
Specifications
Format
48,000Hz, 24bit, uncompressed wav, mono channel;
Recording environment
professional recording studio;
Recording content
Given topic, speaker's self-expression;
Speaker
professional Character Voice, natural conversation, not reading aloud, one male voice, one female voice;
Annotation
word and pinyin transcription, prosodic boundary annotation, secondary language annotation;