[{"@type":"PropertyValue","name":"Data size","value":"14,980 images, 8 languages"},{"@type":"PropertyValue","name":"Data environment","value":"including meeting room, conference room"},{"@type":"PropertyValue","name":"Language types","value":"French, Korean, Japanese, Spanish, German, Italian, Portuguese and Russian"},{"@type":"PropertyValue","name":"Data diversity","value":"multiple scenes, multiple languages, different photographic angles, different photographic distances, different light conditions"},{"@type":"PropertyValue","name":"Device","value":"cellphone"},{"@type":"PropertyValue","name":"Collecting angles","value":"front, left, right, looking up angle"},{"@type":"PropertyValue","name":"Data format","value":"the image data format is .jpg, the annotation file data format is .json"},{"@type":"PropertyValue","name":"Annotation content","value":"line-level quadrilateral bounding box annotation and transcription for the texts"},{"@type":"PropertyValue","name":"Accuracy","value":"the error bound of each vertex of quadrilateral bounding box is within 5 pixels, which is a qualified annotation, the accuracy of bounding boxes is not less than 95%; the texts transcription accuracy is not less than 95%"}]
{"id":979,"datatype":"1","titleimg":"[{\"name\": \"APY190221001.png\", \"url\": \"https://res.datatang.com/asset/productNew/APY190221001.png?Expires=2007353658&OSSAccessKeyId=LTAI5tQwXnJZbubgVfVa1ep9&Signature=BGPbVY68lixdhyzw%2BJL/urGUuWo%3D\", \"size\": 2048, \"progress\": 100}]","type1":"147","type1str":null,"type2":"150","type2str":null,"dataname":"14,980 Images PPT OCR Data of 8 Languages","datazy":[{"title":"Data size","desc":"Data size","content":"14,980 images, 8 languages"},{"title":"Data environment","desc":"Data environment","content":"including meeting room, conference room"},{"title":"Language types","desc":"Language types","content":"French, Korean, Japanese, Spanish, German, Italian, Portuguese and Russian"},{"title":"Data diversity","desc":"Data diversity","content":"multiple scenes, multiple languages, different photographic angles, different photographic distances, different light conditions"},{"title":"Device","desc":"Device","content":"cellphone"},{"title":"Collecting angles","desc":"Collecting angles","content":"front, left, right, looking up angle"},{"title":"Data format","desc":"Data format","content":"the image data format is .jpg, the annotation file data format is .json"},{"title":"Annotation content","desc":"Annotation content","content":"line-level quadrilateral bounding box annotation and transcription for the texts"},{"title":"Accuracy","desc":"Accuracy","content":"the error bound of each vertex of quadrilateral bounding box is within 5 pixels, which is a qualified annotation, the accuracy of bounding boxes is not less than 95%; the texts transcription accuracy is not less than 95%"}],"datatag":"Multiple scenes,Multiple languages,Different photographic angles,Different photographic distances,Different light 
conditions","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":["14,980 pictures","8 languages","2 natural scenes"],"samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY190221001_demo1695808941160/APY190221001_demo/2.jpg","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY190221001_demo1695808941160/APY190221001_demo/2.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=sqPdc1rGwcLu%2BK2TLOwTHcVrLQs%3D","intro":"","size":0,"progress":100,"type":"jpg"},{"name":"/data/apps/damp/temp/ziptemp/APY190221001_demo1695808941160/APY190221001_demo/3.jpg","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY190221001_demo1695808941160/APY190221001_demo/3.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=uOxRQ0dl8DcDwkjpEaXwlvSDyPg%3D","intro":"","size":0,"progress":100,"type":"jpg"},{"name":"/data/apps/damp/temp/ziptemp/APY190221001_demo1695808941160/APY190221001_demo/1.jpg","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY190221001_demo1695808941160/APY190221001_demo/1.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=1jE3Q1rsa7koY0u0viSa%2FobOefo%3D","intro":"","size":0,"progress":100,"type":"jpg"}],"officialSummary":"14,980 Images PPT OCR Data of 8 Languages. This dataset includes 8 languages, multiple scenes, different photographic angles, different photographic distances, different light conditions. For annotation, line-level quadrilateral bounding box annotation and transcription for the texts were annotated in the data. 
The dataset can be used for tasks such as OCR of multi-language.","dataexampl":null,"datakeyword":["PPT"," OCR"," meeting room"," conference room","different photographic angles"," different photographic distances"," different light conditions","line-level quadrilateral bounding box annotation and transcription for the texts"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"ocr","BGimg":"","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"],"firstList":[{"name":"/data/apps/damp/temp/ziptemp/APY190221001_demo1695808941160/APY190221001_demo/5.jpg","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY190221001_demo1695808941160/APY190221001_demo/5.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=kydEh0XnVloXhfsJGmIByO3Vi6U%3D","intro":"","size":0,"progress":100,"type":"jpg"}]}
line-level quadrilateral bounding box annotation and transcription for the texts
14,980 Images PPT OCR Data of 8 Languages. This dataset includes 8 languages, multiple scenes, different photographic angles, different photographic distances, and different light conditions. The data is annotated with line-level quadrilateral bounding boxes and transcriptions of the texts. The dataset can be used for tasks such as multi-language OCR.
This is a paid dataset for commercial use, research purposes, and more. Licensed, ready-made datasets help jump-start AI projects.
Specifications
Data size
14,980 images, 8 languages
Data environment
including meeting room, conference room
Language types
French, Korean, Japanese, Spanish, German, Italian, Portuguese and Russian
Data diversity
multiple scenes, multiple languages, different photographic angles, different photographic distances, different light conditions
Device
cellphone
Collecting angles
front, left, right, looking up angle
Data format
the image data format is .jpg, the annotation file data format is .json
Annotation content
line-level quadrilateral bounding box annotation and transcription for the texts
Accuracy
a quadrilateral bounding box is a qualified annotation when the error of each of its vertices is within 5 pixels; the accuracy of bounding boxes is not less than 95%; the text transcription accuracy is not less than 95%