[{"@type":"PropertyValue","name":"Format","value":"16kHz, 16bit, uncompressed wav, mono channel"},{"@type":"PropertyValue","name":"Content category","value":"Dialogue based on given topics"},{"@type":"PropertyValue","name":"Recording condition","value":"Low background noise (indoor)"},{"@type":"PropertyValue","name":"Recording device","value":"Android smartphone, iPhone"},{"@type":"PropertyValue","name":"Country","value":"The United Kingdom(GBK)"},{"@type":"PropertyValue","name":"Language(Region) Code","value":"en-GB"},{"@type":"PropertyValue","name":"Language","value":"English"},{"@type":"PropertyValue","name":"Speaker","value":"944 native speakers in total"},{"@type":"PropertyValue","name":"Features of annotation","value":"Transcription text, timestamp, speaker ID, gender, noise"},{"@type":"PropertyValue","name":"Accuracy rate","value":"Sentence accuracy rate(SAR) 95%"}]
{"id":1393,"datatype":"1","titleimg":"https://www.nexdata.ai/shujutang/static/image/index/datatang_yuyin_default.webp","type1":"165","type1str":null,"type2":"166","type2str":null,"dataname":"743 Hours - UK English Spontaneous Dialogue Speech Dataset (Smartphone Recorded)","datazy":[{"title":"Format","content":"16kHz, 16bit, uncompressed wav, mono channel","desc":"Format"},{"title":"Content category","content":"Dialogue based on given topics","desc":"Content category"},{"title":"Recording condition","content":"Low background noise (indoor)","desc":"Recording condition"},{"title":"Recording device","content":"Android smartphone, iPhone","desc":"Recording device"},{"title":"Country","content":"The United Kingdom(GBK)","desc":"Country"},{"title":"Language(Region) Code","content":"en-GB","desc":"Language(Region) Code"},{"title":"Language","content":"English","desc":"Language"},{"title":"Speaker","content":"944 native speakers in total","desc":"Speaker"},{"title":"Features of annotation","content":"Transcription text, timestamp, speaker ID, gender, noise","desc":"Features of annotation"},{"title":"Accuracy rate","content":"Sentence accuracy rate(SAR) 95%","desc":"Accuracy rate"}],"datatag":"English,British English,UK,Conversational","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY240209001_demo1725271202516/0001_004_O1_31.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY240209001_demo1725271202516/0001_004_O1_31.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=SOGSuorLHNN3JMhszRX5fllgmqc%3D","intro":"It's a lot about the nature and the power of [OVERLAP/]nature. 
[/OVERLAP].","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY240209001_demo1725271202516/0001_004_O1_37.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY240209001_demo1725271202516/0001_004_O1_37.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=u%2Frw7Cb4SWpS6hi1JZo3FXKY%2Bs4%3D","intro":"Ah, yeah. The [OVERLAP/]black beach. Yeah. [/OVERLAP]yeah.[OVERLAP/] it's also[/OVERLAP] yeah call there's.[N]","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY240209001_demo1725271202516/0001_004_O2_32.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY240209001_demo1725271202516/0001_004_O2_32.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=oLWYG1WtvFwb5lzvIRftvmeLXjY%3D","intro":"It's power of nature.","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY240209001_demo1725271202516/0001_004_O1_30.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY240209001_demo1725271202516/0001_004_O1_30.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=npYL14p9griFEGFrgcA1lTHAyjE%3D","intro":"When you have the time, do it. [OVERLAP/]because[/OVERLAP] it's you know, it's.[N]","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY240209001_demo1725271202516/0001_004_O2_34.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY240209001_demo1725271202516/0001_004_O2_34.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=mC5Qa4jxpmFOzVXuScUVkp6x370%3D","intro":"","size":0,"progress":100,"type":"mp3"}],"officialSummary":"This dataset contains 200 hours of spontaneous UK English dialogue recorded using smartphones. 
Collected from approximately 500 native British English speakers across various regions, the dataset reflects real-world acoustic diversity. Each audio segment is accompanied by detailed annotations, including transcription, timestamp, speaker ID, gender, and more. Ideal for applications in automatic speech recognition (ASR), speech synthesis (TTS), speaker diarization, and natural language understanding (NLU), the dataset has been validated by leading AI companies. All data complies with global privacy regulations such as GDPR, CCPA, and PIPL.","dataexampl":null,"datakeyword":["UK English speech dataset","spontaneous dialogue audio","smartphone speech recording","British English ASR dataset","English voice training data","UK accent speech","real-world speech corpus","multi-speaker UK English dataset"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechRec","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
743 Hours - UK English Spontaneous Dialogue Speech Dataset (Smartphone Recorded)
UK English speech dataset
spontaneous dialogue audio
smartphone speech recording
British English ASR dataset
English voice training data
UK accent speech
real-world speech corpus
multi-speaker UK English dataset
This dataset contains 743 hours of spontaneous UK English dialogue recorded using smartphones. Collected from 944 native British English speakers across various regions, the dataset reflects real-world acoustic diversity. Each audio segment is accompanied by detailed annotations, including transcription, timestamp, speaker ID, gender, and more. Ideal for applications in automatic speech recognition (ASR), speech synthesis (TTS), speaker diarization, and natural language understanding (NLU), the dataset has been validated by leading AI companies. All data complies with global privacy regulations such as GDPR, CCPA, and PIPL.
This is a paid dataset for commercial use, research purposes, and more. Licensed, ready-made datasets help jump-start AI projects.