[{"@type":"PropertyValue","name":"Format","value":"8kHz 8bit, a-law/u-law pcm, mono channel"},{"@type":"PropertyValue","name":"Content category","value":"Dialogue based on given topics"},{"@type":"PropertyValue","name":"Recording condition","value":"Low background noise (indoor)"},{"@type":"PropertyValue","name":"Recording device","value":"Telephony"},{"@type":"PropertyValue","name":"Country","value":"Korea(KOR)"},{"@type":"PropertyValue","name":"Language(Region) Code","value":"ko-KR"},{"@type":"PropertyValue","name":"Language","value":"Korean"},{"@type":"PropertyValue","name":"Speaker","value":"216 people in total, 44% male and 56% female"},{"@type":"PropertyValue","name":"Features of annotation","value":"Transcription text, timestamp, speaker ID, gender"},{"@type":"PropertyValue","name":"Accuracy rate","value":"Sentence accuracy rate(SAR) 95%"}]
{"id":1260,"datatype":"1","titleimg":"https://www.nexdata.ai/shujutang/static/image/index/datatang_yuyin_default.webp","type1":"165","type1str":null,"type2":"166","type2str":null,"dataname":"Korean Telephony Speech Dataset – 136 Hours of Spontaneous Calls","datazy":[{"title":"Format","desc":"Format","content":"8kHz 8bit, a-law/u-law pcm, mono channel"},{"title":"Content category","desc":"Content category","content":"Dialogue based on given topics"},{"title":"Recording condition","desc":"Recording condition","content":"Low background noise (indoor)"},{"title":"Recording device","desc":"Recording device","content":"Telephony"},{"title":"Country","desc":"Country","content":"Korea(KOR)"},{"title":"Language(Region) Code","desc":"Language(Region) Code","content":"ko-KR"},{"title":"Language","desc":"Language","content":"Korean"},{"title":"Speaker","desc":"Speaker","content":"216 people in total, 44% male and 56% female"},{"title":"Features of annotation","desc":"Features of annotation","content":"Transcription text, timestamp, speaker ID, gender"},{"title":"Accuracy rate","desc":"Accuracy rate","content":"Sentence accuracy rate(SAR) 95%"}],"datatag":"Korean,Conversational,Telephone","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY230703001_demo1712656802183/APY230703001_demo/mob_301_00101_8k-1.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230703001_demo1712656802183/APY230703001_demo/mob_301_00101_8k-1.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=8Br5pcP1V9ttmLYdxOoEYe6eTWE%3D","intro":"A 시리즈가 있고 또 무슨 Z 시리즈가 있고 이러지 
않아?","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY230703001_demo1712656802183/APY230703001_demo/mob_301_00101_8k-3.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230703001_demo1712656802183/APY230703001_demo/mob_301_00101_8k-3.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=mvwVVmoXo%2FRZxKjx7wK9T0DQdt4%3D","intro":"해외 직구.","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY230703001_demo1712656802183/APY230703001_demo/mob_301_00101_8k-7.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230703001_demo1712656802183/APY230703001_demo/mob_301_00101_8k-7.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=F7r9nYk301PmicpdcTXLOxgQ1%2FI%3D","intro":"저는 예전부터 항상","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY230703001_demo1712656802183/APY230703001_demo/mob_301_00101_8k-8.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230703001_demo1712656802183/APY230703001_demo/mob_301_00101_8k-8.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=Xn7HtmdfvfbeKPZCBMFf68ppqTU%3D","intro":"갤럭시만 썼던 것 같애요.","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY230703001_demo1712656802183/APY230703001_demo/mob_301_00101_8k-4.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230703001_demo1712656802183/APY230703001_demo/mob_301_00101_8k-4.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=Z85%2BWNZtNUhMRvdKPuFICzlW50c%3D","intro":"그냥 아직 한국에는 안 팔아서 어디서 어디 엄마가 사주신 거거든요 그냥.","size":0,"progress":100,"type":"mp3"}],"officialSummary":"This Korean Telephony Speech Dataset contains 136 hours of spontaneous dialogue recorded over phone calls. 
Covering over 20 real-life domains including customer service, e-commerce, finance, travel, and daily conversations, the dataset features natural two-speaker conversations collected via diverse telephony channels. Each sample is transcribed and annotated with speaker ID, gender, age, and other metadata. Data was collected from 216 native Korean speakers across different regions, enhancing model generalization. Ideal for automatic speech recognition (ASR), speaker diarization, and call center conversational AI systems. All data complies with GDPR, CCPA, and PIPL for responsible and legal AI development.","dataexampl":null,"datakeyword":["Korean telephony speech dataset","Korean telephone audio","telephone conversation Korean","call center voice dataset Korean","Korean spoken dialogue corpus","multilingual telephony dataset","Korean voice dataset","speech-to-text Korean phone call","spontaneous Korean speech data"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechRec","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
Korean Telephony Speech Dataset – 136 Hours of Spontaneous Calls
Korean telephony speech dataset
Korean telephone audio
telephone conversation Korean
call center voice dataset Korean
Korean spoken dialogue corpus
multilingual telephony dataset
Korean voice dataset
speech-to-text Korean phone call
spontaneous Korean speech data
This Korean Telephony Speech Dataset contains 136 hours of spontaneous dialogue recorded over phone calls. Covering over 20 real-life domains including customer service, e-commerce, finance, travel, and daily conversations, the dataset features natural two-speaker conversations collected via diverse telephony channels. Each sample is transcribed and annotated with speaker ID, gender, age, and other metadata. Data was collected from 216 native Korean speakers across different regions, enhancing model generalization. Ideal for automatic speech recognition (ASR), speaker diarization, and call center conversational AI systems. All data complies with GDPR, CCPA, and PIPL for responsible and legal AI development.
This is a paid dataset for commercial use, research purposes, and more. Licensed, ready-made datasets help jump-start AI projects.