[{"@type":"PropertyValue","name":"Format","value":"16kHz, 16bit, uncompressed wav, mono channel;"},{"@type":"PropertyValue","name":"Content category","value":"Smart car, smart home, voice assistant;"},{"@type":"PropertyValue","name":"Recording condition","value":"Low background noise(indoor), without echo;"},{"@type":"PropertyValue","name":"Recording device","value":"Android smartphone, iPhone;"},{"@type":"PropertyValue","name":"Speaker","value":"203 Taiwanese, 33% male and 67% female;"},{"@type":"PropertyValue","name":"Country","value":"China(CHN);"},{"@type":"PropertyValue","name":"Language(Region) Code","value":"zh-TW;"},{"@type":"PropertyValue","name":"Language","value":"Taiwanese Mandarin;"},{"@type":"PropertyValue","name":"Features of annotation","value":"Transcription text, noise symbols, special identifiers;"},{"@type":"PropertyValue","name":"Accuracy Rate","value":"Sentence Accuracy Rate (SAR) 95%(noise symbols and other identifiers are excluded)"}]
{"id":64,"datatype":"1","titleimg":"https://res.datatang.com/asset/productNew/APY161101043_G.png?Expires=2007353628&OSSAccessKeyId=LTAI5tQwXnJZbubgVfVa1ep9&Signature=4Cd3KaznaaPy7Ox5mLd6Rp2b05M%3D","type1":"165","type1str":null,"type2":"165","type2str":null,"dataname":"203 People - Taiwanese Mandarin(China) Scripted Monologue Smartphone speech dataset_Guiding","datazy":[{"title":"Format","value":"16kHz, 16bit, uncompressed wav, mono channel;"},{"title":"Content category","value":"Smart car, smart home, voice assistant;"},{"title":"Recording condition","value":"Low background noise(indoor), without echo;"},{"title":"Recording device","value":"Android smartphone, iPhone;"},{"title":"Speaker","value":"203 Taiwanese, 33% male and 67% female;"},{"title":"Country","value":"China(CHN);"},{"title":"Language(Region) Code","value":"zh-TW;"},{"title":"Language","value":"Taiwanese Mandarin;"},{"title":"Features of annotation","value":"Transcription text, noise symbols, special identifiers;"},{"title":"Accuracy Rate","value":"Sentence Accuracy Rate (SAR) 95%(noise symbols and other identifiers are excluded)"}],"datatag":"Taiwanese Mandarin,China,Smartphone,Guiding,Scripted Monologue","technologydoc":null,"downurl":null,"datainfo":"The product is recorded by 203 local Taiwanese speakers of 137 women and 66 men. It was recorded in quiet room without echo. 
The data can be used for tasks such as speech recognition, machine translation, voiceprint recognition model training and Algorithms researching.","standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":["203 people","Taiwan locals","16kHz, 16bit, wav"],"samplePresentation":[["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY161101043_G_demo1718791202920/APY161101043_G/T0233G0124Q0006.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=2pkUdkT2N4Hf9aWMDIM5%2F0wXqOM%3D","/data/apps/damp/temp/ziptemp/APY161101043_G_demo1718791202920/APY161101043_G/T0233G0124Q0006.wav","查詢餘額"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY161101043_G_demo1718791202920/APY161101043_G/T0233G0123Q0012.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=F44QZDe%2FpyngQORF6JZacXWNTIY%3D","/data/apps/damp/temp/ziptemp/APY161101043_G_demo1718791202920/APY161101043_G/T0233G0123Q0012.wav","前排右側座位調前"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY161101043_G_demo1718791202920/APY161101043_G/T0233G0123Q0011.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=LjjmaGuFE71FqvRJQ7eGNfXmVPc%3D","/data/apps/damp/temp/ziptemp/APY161101043_G_demo1718791202920/APY161101043_G/T0233G0123Q0011.wav","放低靠背"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY161101043_G_demo1718791202920/APY161101043_G/T0235G0209Q0018.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=XTlh6NNdTDxI1HzELJicG1xj5i4%3D","/data/apps/damp/temp/ziptemp/APY161101043_G_demo1718791202920/APY161101043_G/T0235G0209Q0018.wav","把電壓轉換至兩百二十福特"],["mp3","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/f
ilesInfoUpload/data/apps/damp/temp/ziptemp/APY161101043_G_demo1718791202920/APY161101043_G/T0235G0209Q0021.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=x2rVoL9ZSJ%2FCwx8OWXax67DKkNI%3D","/data/apps/damp/temp/ziptemp/APY161101043_G_demo1718791202920/APY161101043_G/T0235G0209Q0021.wav","今天晚上哪一台播甄嬛傳"]],"officialSummary":"Taiwanese Mandarin(China) Scripted Monologue Smartphone speech dataset_Guiding, collected from monologue based on given prompts, covering smart car, smart home, voice assistant domains. Transcribed with text content and other attributes. Our dataset was collected from extensive and diversify speakers(203 native speakers), geographicly speaking, enhancing model performance in real and complex tasks.Quality tested by various AI companies. We strictly adhere to data protection regulations and privacy standards, ensuring the maintenance of user privacy and legal rights throughout the data collection, storage, and usage processes, our datasets are all GDPR, CCPA, PIPL complied.","dataexampl":"","datakeyword":["Taiwan Mandarin speech data"," Taiwanese voice data"," Taiwanese Scripted Speech Data"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Language,Data Type","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechRec","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"],"single":"no"}
203 People - Taiwanese Mandarin(China) Scripted Monologue Smartphone speech dataset_Guiding
Taiwan Mandarin speech data
Taiwanese voice data
Taiwanese Scripted Speech Data
Taiwanese Mandarin(China) Scripted Monologue Smartphone speech dataset_Guiding, collected from monologues based on given prompts, covering the smart car, smart home, and voice assistant domains. Transcribed with text content and other attributes. Our dataset was collected from an extensive and geographically diverse pool of speakers (203 native speakers), enhancing model performance in real and complex tasks. Quality tested by various AI companies. We strictly adhere to data protection regulations and privacy standards, ensuring the maintenance of user privacy and legal rights throughout the data collection, storage, and usage processes; our datasets are all GDPR, CCPA, and PIPL compliant.
This is a paid dataset for commercial use, research purposes, and more. Licensed, ready-made datasets help jump-start AI projects.
Specifications
Format
16kHz, 16bit, uncompressed wav, mono channel;
Content category
Smart car, smart home, voice assistant;
Recording condition
Low background noise(indoor), without echo;
Recording device
Android smartphone, iPhone;
Speaker
203 Taiwanese, 33% male and 67% female;
Country
China(CHN);
Language(Region) Code
zh-TW;
Language
Taiwanese Mandarin;
Features of annotation
Transcription text, noise symbols, special identifiers;
Accuracy Rate
Sentence Accuracy Rate (SAR) 95%(noise symbols and other identifiers are excluded)