[{"@type":"PropertyValue","name":"Data size","value":"9,574 images, 243,240 bounding boxes"},{"@type":"PropertyValue","name":"Language distribution","value":"English, Spanish, Portuguese, French, German, Japanese, Italian and Dutch"},{"@type":"PropertyValue","name":"Collecting environment","value":"black boards, white boards, green boards"},{"@type":"PropertyValue","name":"Device","value":"cellphone"},{"@type":"PropertyValue","name":"Photographic angle","value":"eye-level angle, looking down angle, looking up angle"},{"@type":"PropertyValue","name":"Data format","value":"the image data format is .jpg and other common image formats, the annotation file data format is.json"},{"@type":"PropertyValue","name":"Annotation content","value":"line-level quadrilateral (polygon) bounding box annotation and transcription for the texts"},{"@type":"PropertyValue","name":"Accuracy rate","value":"the error bound of each vertex of quadrilateral bounding box is within 5 pixels, which is a qualified annotation, the accuracy of bounding boxes is not less than 95%; the texts transcription accuracy is not less than 95%"}]
{"id":1522,"datatype":"1","titleimg":"/shujutang/static/image/index/datatang_tuxiang_default.webp","type1":"147","type1str":null,"type2":"150","type2str":null,"dataname":"9,574 Images – Handwriting OCR Data On Board of 8 Languages","datazy":[{"title":"Data size","desc":"Data size","content":"9,574 images, 243,240 bounding boxes"},{"title":"Language distribution","desc":"Language distribution","content":"English, Spanish, Portuguese, French, German, Japanese, Italian and Dutch"},{"title":"Collecting environment","desc":"Collecting environment","content":"black boards, white boards, green boards"},{"title":"Device","desc":"Device","content":"cellphone"},{"title":"Photographic angle","desc":"Photographic angle","content":"eye-level angle, looking down angle, looking up angle"},{"title":"Data format","desc":"Data format","content":"the image data format is .jpg and other common image formats, the annotation file data format is.json"},{"title":"Annotation content","desc":"Annotation content","content":"line-level quadrilateral (polygon) bounding box annotation and transcription for the texts"},{"title":"Accuracy rate","desc":"Accuracy rate","content":"the error bound of each vertex of quadrilateral bounding box is within 5 pixels, which is a qualified annotation, the accuracy of bounding boxes is not less than 95%; the texts transcription accuracy is not less than 95%"}],"datatag":"Handwriting,OCR,Black board,White board,Green board","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[{"name":"English.jpg","url":"https://storage-product.datatang.com/damp/product/instructions_zh/20250520181645/English.jpg?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=iXnFSR4p1zCPdImOWx4vrYdgpTk%3D","intro":"","size":3706616,"progress":100,"type":"jpg"},{"name":"English-1.jpg","url":"https://storage-product.datatang.com/damp/product/instructions_zh/20250520181645/English-1.jpg?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=avTJb3O47GRlf350BDF64u7Pg1I%3D","intro":"","size":1563589,"progress":100,"type":"jpg"},{"name":"French.jpg","url":"https://storage-product.datatang.com/damp/product/instructions_zh/20250520181645/French.jpg?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=I94DzxisImSVjIMOdYAr2oC5tqM%3D","intro":"","size":1028972,"progress":100,"type":"jpg"}],"officialSummary":"9,574 Images – Handwriting OCR Data On Board of 8 Languages. The language distribution includes English, Spanish and Portuguese, etc. The data diversity includes multiple collecting scenes, multiple text carriers, multiple languages, multiple photographic angles. The collecting angeles are looking up angle, eye-level angle and looking down angle. In terms of annotation, row-level quadrilateral (polygon) annotation and content transcription are performed on the text. The dataset can be used for tasks such as handwriting OCR.","dataexampl":null,"datakeyword":["Handwriting","OCR","Black board","White board","Green board"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"ocr","BGimg":"","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"],"firstList":[{"name":"German.jpg","url":"https://storage-product.datatang.com/damp/product/instructions_zh/20250520181645/German.jpg?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=vMIP6sYPAFSoLdpyUqVyw%2BQoUNA%3D","intro":"","size":3863985,"progress":100,"type":"jpg"}]}
9,574 Images – Handwriting OCR Data On Board of 8 Languages
Handwriting
OCR
Black board
White board
Green board
9,574 Images – Handwriting OCR Data On Board of 8 Languages. The language distribution includes English, Spanish and Portuguese, etc. The data diversity includes multiple collecting scenes, multiple text carriers, multiple languages, multiple photographic angles. The collecting angeles are looking up angle, eye-level angle and looking down angle. In terms of annotation, row-level quadrilateral (polygon) annotation and content transcription are performed on the text. The dataset can be used for tasks such as handwriting OCR.
This is a paid datasets for commercial use, research purpose and more. Licensed ready made datasets help jump-start AI projects.
Specifications
Data size
9,574 images, 243,240 bounding boxes
Language distribution
English, Spanish, Portuguese, French, German, Japanese, Italian and Dutch
Collecting environment
black boards, white boards, green boards
Device
cellphone
Photographic angle
eye-level angle, looking down angle, looking up angle
Data format
the image data format is .jpg and other common image formats, the annotation file data format is.json
Annotation content
line-level quadrilateral (polygon) bounding box annotation and transcription for the texts
Accuracy rate
the error bound of each vertex of quadrilateral bounding box is within 5 pixels, which is a qualified annotation, the accuracy of bounding boxes is not less than 95%; the texts transcription accuracy is not less than 95%