[{"@type":"PropertyValue","name":"Data size","value":"20,011 pictures, 20,011 descriptions"},{"@type":"PropertyValue","name":"Language distribution","value":"Asian languages: Korean, Indonesian, Malay, Vietnamese, Thai, Chinese, Japanese; European languages: French, German, Italian, Portuguese, Russian, Spanish, English"},{"@type":"PropertyValue","name":"Collection environment","value":"including store plaques, stop signs, posters, road signs, prompts and other scenes"},{"@type":"PropertyValue","name":"Collection diversity","value":"including 14 languages, various natural scenes, and multiple shooting angles"},{"@type":"PropertyValue","name":"Data format","value":"image format is .jpg, text format is .txt"},{"@type":"PropertyValue","name":"Collection equipment","value":"mobile phone, camera"},{"@type":"PropertyValue","name":"Description language","value":"English"},{"@type":"PropertyValue","name":"Text length","value":"in principle, 30~60 words, usually 3-5 sentences"},{"@type":"PropertyValue","name":"Main description content","value":"text arrangement, text content, color, scene"},{"@type":"PropertyValue","name":"Accuracy rate","value":"the proportion of correctly labeled images is not less than 97%"}]
{"id":1288,"datatype":"1","titleimg":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/asset/productNew/nexdata/APY231231006.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=S9MIa6xU4NUNo%2BI0K6hsmMft9oU%3D","type1":"226","type1str":null,"type2":"226","type2str":null,"dataname":"20,011 Image Caption Data of OCR in Natural Scenes","datazy":[{"title":"Data size","value":"20,011 pictures, 20,011descriptions"},{"title":"Language distribution","value":"Asian languages: Korean, Indonesian, Malay, Vietnamese, Thai, Chinese, Japanese European languages: French, German, Italian, Portuguese, Russian, Spanish, English"},{"title":"Collection environment","value":"including store plaques, stop signs, posters, road signs, prompts and other scenes"},{"title":"Collection diversity","value":"including 14 languages, various natural scenes, and multiple shooting angles"},{"title":"Data format","value":"image format is .jpg, text format is .txt"},{"title":"Collection equipment","value":"mobile phone, camera"},{"title":"Description language","value":"English"},{"title":"Text length","value":"in principle, 30~60 words, usually 3-5 sentences"},{"title":"Main description content","value":"text arrangement, text content, color, scene"},{"title":"Main deAccuracy ratescription content","value":"the proportion of correctly labeled images is not less than 97%"}],"datatag":"AIGC,English caption,OCR caption,Multiple shooting angles,Multinational 
scenes","technologydoc":null,"downurl":null,"datainfo":"","standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[["jpg","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY231231006_demo1727085603555/%3F%3F10.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=MCVrBqb27YBjyCDI0Jnyl3bJBGA%3D","/data/apps/damp/temp/ziptemp/APY231231006_demo1727085603555/??10.png",""],["jpg","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY231231006_demo1727085603555/%3F%3F6.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=YloKf4W4lvZRZqUksIOndlMhK5E%3D","/data/apps/damp/temp/ziptemp/APY231231006_demo1727085603555/??6.png",""],["jpg","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY231231006_demo1727085603555/%3F%3F7.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=MaMzeRl2B1sFE7KT28iUKO33omo%3D","/data/apps/damp/temp/ziptemp/APY231231006_demo1727085603555/??7.png",""]],"officialSummary":"20,011 Image Caption Data of OCR in Natural Scenes, including Asian and European languages, a total of 14 languages, the collection environment includes shop plaques, stop signs, posters, road signs and other scenes, including a variety of shooting angles. 
The description language is English, which mainly describes the text arrangement, text content, color and other information.","dataexampl":"","datakeyword":["AIGC"," English caption"," OCR caption"," multilingual OCR data"," multilingual OCR data"," OCR data"," OCR dataset"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Type","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"llm","BGimg":"","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"],"single":"no","firstList":[["jpg","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY231231006_demo1727085603555/%3F%3F9.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=VEHblArfRzk5e3PLr2jzicBVmRY%3D","/data/apps/damp/temp/ziptemp/APY231231006_demo1727085603555/??9.png",""]]}
20,011 Image Caption Data of OCR in Natural Scenes
AIGC
English caption
OCR caption
multilingual OCR data
multilingual OCR data
OCR data
OCR dataset
20,011 Image Caption Data of OCR in Natural Scenes, covering a total of 14 Asian and European languages. The collection environment includes shop plaques, stop signs, posters, road signs and other scenes, captured from a variety of shooting angles. The description language is English, and the descriptions mainly cover the text arrangement, text content, color and other information.
This is a paid dataset for commercial use, research purposes, and more. Licensed, ready-made datasets help jump-start AI projects.
Specifications
Data size
20,011 pictures, 20,011 descriptions
Language distribution
Asian languages: Korean, Indonesian, Malay, Vietnamese, Thai, Chinese, Japanese; European languages: French, German, Italian, Portuguese, Russian, Spanish, English
Collection environment
including store plaques, stop signs, posters, road signs, prompts and other scenes
Collection diversity
including 14 languages, various natural scenes, and multiple shooting angles
Data format
image format is .jpg, text format is .txt
Collection equipment
mobile phone, camera
Description language
English
Text length
in principle, 30~60 words, usually 3-5 sentences
Main description content
text arrangement, text content, color, scene
Accuracy rate
the proportion of correctly labeled images is not less than 97%