[{"@type":"PropertyValue","name":"Format","value":"16kHz, 16bit, uncompressed wav, mono channel;"},{"@type":"PropertyValue","name":"Recording condition","value":"Low background noise(indoor), without echo;"},{"@type":"PropertyValue","name":"Content category","value":"Generic domain; human-machine interaction; smart home command and control; in-car command and control; numbers"},{"@type":"PropertyValue","name":"Recording device","value":"Android Smartphone, iPhone;"},{"@type":"PropertyValue","name":"Speaker","value":"1,245 speakers, with 606 males and 639 females; 559 speakers in the age group of 16~25, 567 speakers in the age group of 26~45, 119 speakers are older than 45;"},{"@type":"PropertyValue","name":"Country","value":"Japan(JPN);"},{"@type":"PropertyValue","name":"Language(Region) Code","value":"ja-JP;"},{"@type":"PropertyValue","name":"Language","value":"Japanese;"},{"@type":"PropertyValue","name":"Features of annotation","value":"Transcription text;"},{"@type":"PropertyValue","name":"Accuracy Rate","value":"Sentence Accuracy Rate (SAR) 95%"}]
{"id":947,"datatype":"1","titleimg":"https://res.datatang.com/asset/productNew/APY181231008.png?Expires=2007353653&OSSAccessKeyId=LTAI5tQwXnJZbubgVfVa1ep9&Signature=T7HMbz0Yo3l/fi3v4J1/Wv0NcJo%3D","type1":"165","type1str":null,"type2":"166","type2str":null,"dataname":"474 Hours Japanese Speech Dataset – Voice Command Data for AI & ASR Models","datazy":[{"title":"Format","desc":"Format","content":"16kHz, 16bit, uncompressed wav, mono channel;"},{"title":"Recording condition","desc":"Recording condition","content":"Low background noise(indoor), without echo;"},{"title":"Content category","desc":"Content category","content":"Generic domain; human-machine interaction; smart home command and control; in-car command and control; numbers"},{"title":"Recording device","desc":"Recording device","content":"Android Smartphone, iPhone;"},{"title":"Speaker","desc":"Speaker","content":"1,245 speakers, with 606 males and 639 females; 559 speakers in the age group of 16~25, 567 speakers in the age group of 26~45, 119 speakers are older than 45;"},{"title":"Country","desc":"Country","content":"Japan(JPN);"},{"title":"Language(Region) Code","desc":"Language(Region) Code","content":"ja-JP;"},{"title":"Language","desc":"Language","content":"Japanese;"},{"title":"Features of annotation","desc":"Features of annotation","content":"Transcription text;"},{"title":"Accuracy Rate","desc":"Accuracy Rate","content":"Sentence Accuracy Rate (SAR) 95%"}],"datatag":"Japanese,Japan,Mobile phone,Reading,Scripted 
Monologue","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY181231008_demo1710237600135/APY181231008_demo/2.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY181231008_demo1710237600135/APY181231008_demo/2.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=o664HpJYl%2BqfbX%2FOzxQ9l7zH%2B%2FQ%3D","intro":"零九零七四二五零一八三","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY181231008_demo1710237600135/APY181231008_demo/1.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY181231008_demo1710237600135/APY181231008_demo/1.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=14ZCLQ5dfOhPxRh6avyocMgVliw%3D","intro":"八街市今から雨が降るんかな","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY181231008_demo1710237600135/APY181231008_demo/4.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY181231008_demo1710237600135/APY181231008_demo/4.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=B8EuV0sf1h%2Ff8tRx2wBMzlfZnSg%3D","intro":"助手室の温度調節してもらいたい","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY181231008_demo1710237600135/APY181231008_demo/3.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY181231008_demo1710237600135/APY181231008_demo/3.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=b5eu0IzC%2FS4sLQKzbLjhmdEn5h4%3D","intro":"会社はどうなんだ","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY181231008_demo1710237600
135/APY181231008_demo/5.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY181231008_demo1710237600135/APY181231008_demo/5.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=4HxTtvi6UmbgrmeBTNxfWtXxKSQ%3D","intro":"空気指数詳しく知りたい","size":0,"progress":100,"type":"mp3"}],"officialSummary":"474 hours of Japanese smartphone-based speech dataset featuring scripted monologue recordings collected from mobile devices. The dataset covers a wide range of real-world scenarios, including human-machine interaction, smart home voice commands, in-car voice control, and numeric instructions. All recordings are transcribed with text content and include rich metadata. Our dataset is collected from 1,245 speakers, enhancing model performance in real and complex tasks. Quality tested by various AI companies. We strictly adhere to data protection regulations and privacy standards, ensuring the maintenance of user privacy and legal rights throughout the data collection, storage, and usage processes, our datasets are all GDPR, CCPA, PIPL complied.","dataexampl":null,"datakeyword":["japanese speech dataset","japanese ASR dataset","voice assistant training dataset","smart home voice dataset","speech recognition training data japanese","Voice assistant dataset"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechRec","dataShowType":"[{\"code\":\"0\",\"language\":\"ZH\"},{\"code\":\"1\",\"language\":\"ZH\"},{\"code\":\"2\",\"language\":\"EN,JP,PT,DE,KO,FR,ES\"},{\"code\":\"3\",\"language\":\"EN\"}]","productNameEn":"474 Hours-Japanese Speech Data By Mobile 
Phone","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
474 Hours Japanese Speech Dataset – Voice Command Data for AI & ASR Models
japanese speech dataset
japanese ASR dataset
voice assistant training dataset
smart home voice dataset
speech recognition training data japanese
Voice assistant dataset
A 474-hour Japanese smartphone-based speech dataset featuring scripted monologue recordings collected from mobile devices. The dataset covers a wide range of real-world scenarios, including human-machine interaction, smart home voice commands, in-car voice control, and numeric instructions. All recordings are transcribed with text content and include rich metadata. The dataset is collected from 1,245 speakers, enhancing model performance in real and complex tasks. Quality tested by various AI companies. We strictly adhere to data protection regulations and privacy standards, ensuring that user privacy and legal rights are maintained throughout the data collection, storage, and usage processes. Our datasets are all GDPR-, CCPA-, and PIPL-compliant.
This is a paid dataset for commercial use, research purposes, and more. Licensed ready-made datasets help jump-start AI projects.
Specifications
Format
16kHz, 16bit, uncompressed wav, mono channel;
Recording condition
Low background noise(indoor), without echo;
Content category
Generic domain; human-machine interaction; smart home command and control; in-car command and control; numbers
Recording device
Android Smartphone, iPhone;
Speaker
1,245 speakers, with 606 males and 639 females; 559 speakers in the age group of 16~25, 567 speakers in the age group of 26~45, and 119 speakers older than 45;