[{"@type":"PropertyValue","name":"Format","value":"16kHz, 16bit, uncompressed wav, mono channel;"},{"@type":"PropertyValue","name":"Recording condition","value":"Low background noise(indoor), without echo;"},{"@type":"PropertyValue","name":"Content category","value":"Generic domain;"},{"@type":"PropertyValue","name":"Recording device","value":"Android Smartphone, iPhone;"},{"@type":"PropertyValue","name":"Speaker","value":"1,006 people from Japan; 44% male and 56% female;"},{"@type":"PropertyValue","name":"Country","value":"Japan(JPN);"},{"@type":"PropertyValue","name":"Language(Region) Code","value":"ja-JP;"},{"@type":"PropertyValue","name":"Language","value":"Japanese;"},{"@type":"PropertyValue","name":"Features of annotation","value":"Transcription text;"},{"@type":"PropertyValue","name":"Accuracy Rate","value":"Sentence Accuracy Rate (SAR) 95%"}]
{"id":934,"datatype":"1","titleimg":"https://res.datatang.com/asset/productNew/APY180901052.png?Expires=2007353648&OSSAccessKeyId=LTAI5tQwXnJZbubgVfVa1ep9&Signature=GZZqD2qIZGRK4Il3P098UZfLbLg%3D","type1":"165","type1str":null,"type2":"166","type2str":null,"dataname":"261 Hours Japanese Speech Dataset – Native Speakers & Labeled Audio for AI Training","datazy":[{"title":"Format","desc":"Format","content":"16kHz, 16bit, uncompressed wav, mono channel;"},{"title":"Recording condition","desc":"Recording condition","content":"Low background noise(indoor), without echo;"},{"title":"Content category","desc":"Content category","content":"Generic domain;"},{"title":"Recording device","desc":"Recording device","content":"Android Smartphone, iPhone;"},{"title":"Speaker","desc":"Speaker","content":"1,006 people from Japan; 44% male and 56% female;"},{"title":"Country","desc":"Country","content":"Japan(JPN);"},{"title":"Language(Region) Code","desc":"Language(Region) Code","content":"ja-JP;"},{"title":"Language","desc":"Language","content":"Japanese;"},{"title":"Features of annotation","desc":"Features of annotation","content":"Transcription text;"},{"title":"Accuracy Rate","desc":"Accuracy Rate","content":"Sentence Accuracy Rate (SAR) 95%"}],"datatag":"Japanese,Mobile Phone,Reading,Scripted Monologue","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":["261 hours","1006 people","covering wide range of 
regions"],"samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY180901052_demo1695808923189/APY180901052_demo/T0305G0099896327_S0127.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY180901052_demo1695808923189/APY180901052_demo/T0305G0099896327_S0127.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=OZidSor62ZpKiRW0DTvTyE7vck0%3D","intro":"一説によると、彼の母カリュケー","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY180901052_demo1695808923189/APY180901052_demo/T0305G0099893067_S0120.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY180901052_demo1695808923189/APY180901052_demo/T0305G0099893067_S0120.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=Kb%2BGLAX2%2F9Qlj49hJiUBu%2Big4HE%3D","intro":"一般に地理検と呼ばれる","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY180901052_demo1695808923189/APY180901052_demo/T0298G000700022_S0246.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY180901052_demo1695808923189/APY180901052_demo/T0298G000700022_S0246.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=BoNiAkhfPpqcZNcMosEmtLEfuGM%3D","intro":"これまでの成長実績および今後の成長見込","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY180901052_demo1695808923189/APY180901052_demo/T0298G001200003_S0018.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY180901052_demo1695808923189/APY180901052_demo/T0298G001200003_S0018.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=21qQuzANs9iXXJhacn9yIfn2GQ0%3D","intro":"大神宮前駅跡に建つモニュメント","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY180901052_demo1695808923189/APY180901052_demo/T0304G0003883401_S0390.wav","url":"https://bj-oss-datatang-03.o
ss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY180901052_demo1695808923189/APY180901052_demo/T0304G0003883401_S0390.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=rbrIImuF0Ljv6CBxecZ2axEMoyQ%3D","intro":"リターン オブ ザ インベーダー","size":0,"progress":100,"type":"mp3"}],"officialSummary":"261 hours of Japanese smartphone-based speech dataset consisting of scripted monologue recordings collected from mobile devices. The dataset covers general domain speech and reflects real-world mobile usage scenarios.All audio samples are fully transcribed and include structured text content and metadata. Our dataset is collected from 1006 Japanese native speakers across diverse geographic regions, enhancing model performance in real and complex tasks.Quality tested by various AI companies. We strictly adhere to data protection regulations and privacy standards, ensuring the maintenance of user privacy and legal rights throughout the data collection, storage, and usage processes, our datasets are all GDPR, CCPA, PIPL complied.","dataexampl":null,"datakeyword":["japanese speech dataset","japanese ASR dataset","speech to text dataset japanese","japanese mobile speech dataset","labeled japanese speech data"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechRec","dataShowType":"[{\"code\":\"0\",\"language\":\"ZH\"},{\"code\":\"1\",\"language\":\"ZH\"},{\"code\":\"2\",\"language\":\"EN,JP,PT,DE,KO,FR,ES\"},{\"code\":\"3\",\"language\":\"EN\"}]","productNameEn":"261 Hours – Japanese Speech Data by Mobile 
Phone","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
261 Hours Japanese Speech Dataset – Native Speakers & Labeled Audio for AI Training
japanese speech dataset
japanese ASR dataset
speech to text dataset japanese
japanese mobile speech dataset
labeled japanese speech data
261 hours of Japanese smartphone-based speech data consisting of scripted monologue recordings collected from mobile devices. The dataset covers general-domain speech and reflects real-world mobile usage scenarios. All audio samples are fully transcribed and include structured text content and metadata. Our dataset is collected from 1006 native Japanese speakers across diverse geographic regions, enhancing model performance in real and complex tasks. Quality tested by various AI companies. We strictly adhere to data protection regulations and privacy standards, ensuring the maintenance of user privacy and legal rights throughout the data collection, storage, and usage processes; our datasets are all GDPR, CCPA, and PIPL compliant.
This is a paid dataset for commercial use, research purposes, and more. Licensed ready-made datasets help jump-start AI projects.