[{"@type":"PropertyValue","name":"Format","value":"16kHz, 16bit, uncompressed wav, mono channel"},{"@type":"PropertyValue","name":"Recording environment","value":"quiet indoor environment, without echo"},{"@type":"PropertyValue","name":"Recording content (read speech)","value":"children's books; human-machine interaction category; smart home command and control category; numbers; general category"},{"@type":"PropertyValue","name":"Speaker","value":"1,085 Korean children, all children are 6-15 years old"},{"@type":"PropertyValue","name":"Recording device","value":"Android Smartphone, iPhone"},{"@type":"PropertyValue","name":"Country","value":"Korea"},{"@type":"PropertyValue","name":"Language","value":"Korean"},{"@type":"PropertyValue","name":"Accuracy rate","value":"Sentence Accuracy Rate (SAR) 95%"}]
{"id":1112,"datatype":"1","titleimg":"https://res.datatang.com/asset/productNew/APY210731001.png?Expires=2007353693&OSSAccessKeyId=LTAI5tQwXnJZbubgVfVa1ep9&Signature=iniJJtLsGUI5LbhvhN7OmmFwflQ%3D","type1":"165","type1str":null,"type2":"167","type2str":null,"dataname":"Korean Children Speech Dataset – 393 Hours of Scripted Monologues","datazy":[{"title":"Format","desc":"Format","content":"16kHz, 16bit, uncompressed wav, mono channel"},{"title":"Recording environment","desc":"Recording environment","content":"quiet indoor environment, without echo"},{"title":"Recording content (read speech)","desc":"Recording content (read speech)","content":"children's books; human-machine interaction category; smart home command and control category; numbers; general category"},{"title":"Speaker","desc":"Speaker","content":"1,085 Korean children, all children are 6-15 years old"},{"title":"Recording device","desc":"Recording device","content":"Android Smartphone, iPhone"},{"title":"Country","desc":"Country","content":"Korea"},{"title":"Language","desc":"Language","content":"Korean"},{"title":"Accuracy rate","desc":"Accuracy rate","content":"Sentence Accuracy Rate (SAR) 95%"}],"datatag":"Korea,Korean,Children,Mobile phone,Speech","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY210731001_demo1712656800539/2.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY210731001_demo1712656800539/2.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=tjJkB2FONlxEQjxmmQuO55dutyM%3D","intro":"쁘찌하우스 노부꼬를 예약하고 
싶어.","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY210731001_demo1712656800539/1.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY210731001_demo1712656800539/1.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=%2BWgX75sUcNeCLdKMU5l13KfdAlk%3D","intro":"시간 되면 자주 들어주세요.","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY210731001_demo1712656800539/4.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY210731001_demo1712656800539/4.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=acS%2FjbXw3g9lo%2F66cKhY5056Fik%3D","intro":"저도 오빠처럼 수영을 잘 하고 싶어요.","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY210731001_demo1712656800539/3.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY210731001_demo1712656800539/3.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=EYEQ%2FP4JLoEYAXO4XM2pKanYRYA%3D","intro":"에어컨가 자동으로 켜질수 있게 설정해주세요.","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY210731001_demo1712656800539/5.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY210731001_demo1712656800539/5.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=rkhyK7pjBf9efjcrBDklaQr6HfY%3D","intro":"천이백칠십육만삼천육백십칠원","size":0,"progress":100,"type":"mp3"}],"officialSummary":"This 393-hour Korean Children Speech Dataset consists of scripted monologue recordings from young speakers, captured using smartphones. The speech content includes essays, storytelling, and numeric readings. Each audio file is transcribed and annotated with metadata such as speaker ID, gender, and age. 
Collected from a geographically diverse group of native Korean-speaking children, this dataset is designed to support training of automatic speech recognition (ASR), text-to-speech (TTS), pronunciation evaluation systems, and educational language models. The dataset has been quality-verified by multiple AI enterprises and is fully compliant with GDPR, CCPA, and PIPL privacy regulations.","dataexampl":null,"datakeyword":["Korean children speech dataset","Korean child voice dataset","kids speech recognition dataset Korean","Korean ASR training data for children","scripted monologue kids Korean","smartphone voice dataset Korean","Korean kids TTS dataset","Korean educational speech corpus"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechRec","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
Korean Children Speech Dataset – 393 Hours of Scripted Monologues
Korean children speech dataset
Korean child voice dataset
kids speech recognition dataset Korean
Korean ASR training data for children
scripted monologue kids Korean
smartphone voice dataset Korean
Korean kids TTS dataset
Korean educational speech corpus
This 393-hour Korean Children Speech Dataset consists of scripted monologue recordings from young speakers, captured using smartphones. The speech content includes essays, storytelling, and numeric readings. Each audio file is transcribed and annotated with metadata such as speaker ID, gender, and age. Collected from a geographically diverse group of native Korean-speaking children, this dataset is designed to support training of automatic speech recognition (ASR), text-to-speech (TTS), pronunciation evaluation systems, and educational language models. The dataset has been quality-verified by multiple AI enterprises and is fully compliant with GDPR, CCPA, and PIPL privacy regulations.
This is a paid dataset for commercial use, research purposes, and more. Licensed, ready-made datasets help jump-start AI projects.
Specifications
Format
16kHz, 16bit, uncompressed wav, mono channel
Recording environment
quiet indoor environment, without echo
Recording content (read speech)
children's books; human-machine interaction category; smart home command and control category; numbers; general category
Speaker
1,085 Korean children, all children are 6-15 years old