[{"@type":"PropertyValue","name":"Data size","value":"411 speakers, approx. 262 hours, 147,668 utterances"},{"@type":"PropertyValue","name":"Speaker profile ","value":"Japanese children aged 6–13"},{"@type":"PropertyValue","name":"Device ","value":"Smartphone"},{"@type":"PropertyValue","name":"Data format Audio data format","value":"WAV; transcription format: TSVData"},{"@type":"PropertyValue","name":"content ","value":"Scripted read-aloud speech, categorized into lower-grade (ages 6–9) and upper-grade (ages 10–13)Annotation contentUtterance transcription,Read-aloud Scripts"},{"@type":"PropertyValue","name":"Accuracy","value":"Character Accuracy Rate 98% or above"},{"@type":"PropertyValue","name":"Application Scenarios ","value":"ASR, TTS, speaker recognition, pronunciation assessment"}]
{"id":2160,"datatype":"1","titleimg":"https://www.nexdata.ai/shujutang/static/image/index/datatang_yuyin_default.webp","type1":"165","type1str":null,"type2":"166","type2str":null,"dataname":"262 Hours - Japanese Children's Speech Dataset","datazy":[{"title":"Data size","content":"411 speakers, approx. 262 hours, 147,668 utterances"},{"title":"Speaker profile ","content":"Japanese children aged 6–13"},{"title":"Device ","content":"Smartphone"},{"title":"Data format Audio data format","content":"WAV; transcription format: TSVData"},{"title":"content ","content":"Scripted read-aloud speech, categorized into lower-grade (ages 6–9) and upper-grade (ages 10–13)Annotation contentUtterance transcription,Read-aloud Scripts"},{"title":"Accuracy","content":"Character Accuracy Rate 98% or above"},{"title":"Application Scenarios ","content":"ASR, TTS, speaker recognition, pronunciation assessment"}],"datatag":"Japanese,children,speech","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":null,"samplePresentation":[],"officialSummary":"411 Speakers - Approx. 262 Hours Japanese Children's Speech Dataset, comprising 147,668 scripted utterances. Speakers are Japanese children aged 6 to 13, categorized into lower-grade (ages 6–9, 179 speakers) and upper-grade (ages 10–13, 232 speakers) groups with balanced gender distribution. Recordings were conducted using smartphones in 16kHz/16bit mono WAV format, accompanied by utterance transcriptions and read-aloud scripts. \nThe dataset is applicable to tasks such as Japanese children's ASR, TTS, speaker recognition, and pronunciation assessment.","dataexampl":null,"datakeyword":["Japanese","children","speech"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Language,Data Type","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechRec","dataShowType":"[{\"code\":\"0\",\"language\":\"ZH\"},{\"code\":\"1\",\"language\":\"ZH\"},{\"code\":\"2\",\"language\":\"EN,JP,DE,PT,ES,KO,FR\"},{\"code\":\"3\",\"language\":\"EN\"}]","productNameEn":"262 Hours - Japanese Children's Speech Dataset","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
411 Speakers - Approx. 262 Hours Japanese Children's Speech Dataset, comprising 147,668 scripted utterances. Speakers are Japanese children aged 6 to 13, categorized into lower-grade (ages 6–9, 179 speakers) and upper-grade (ages 10–13, 232 speakers) groups with balanced gender distribution. Recordings were conducted using smartphones in 16kHz/16bit mono WAV format, accompanied by utterance transcriptions and read-aloud scripts. The dataset is applicable to tasks such as Japanese children's ASR, TTS, speaker recognition, and pronunciation assessment.
This is a paid dataset for commercial use, research purposes, and more. Licensed ready-made datasets help jump-start AI projects.