[{"@type":"PropertyValue","name":"Data size","value":"100 people, the total number of handwriting piece is 22,163, at least 159 handwriting pieces for each subject"},{"@type":"PropertyValue","name":"Nationality distribution","value":"50 Japanese, 49 Koreans and 1 Afghan"},{"@type":"PropertyValue","name":"Gender distribution","value":"males"},{"@type":"PropertyValue","name":"Age distribution","value":"the young and middle-aged people are the majorities"},{"@type":"PropertyValue","name":"Data diversity","value":"multiple cellphone models, different corpus"},{"@type":"PropertyValue","name":"Device","value":"cellphone"},{"@type":"PropertyValue","name":"Data format","value":".json"},{"@type":"PropertyValue","name":"Annotation content","value":"text content, age, nationality, trace of handwriting"},{"@type":"PropertyValue","name":"Accuracy","value":"The annotation accuracy is not less than 95%"}]
{"id":127,"datatype":"1","titleimg":"https://res.datatang.com/asset/productNew/APY161201436.png?Expires=2007353637&OSSAccessKeyId=LTAI5tQwXnJZbubgVfVa1ep9&Signature=8629pvjIYayLUHSOsKgpTx6y%2BfI%3D","type1":"147","type1str":null,"type2":"150","type2str":null,"dataname":"Handwriting OCR Dataset – Japanese and Korean (22,163 Images)","datazy":[{"title":"Data size","desc":"Data size","content":"100 people, the total number of handwriting piece is 22,163, at least 159 handwriting pieces for each subject"},{"title":"Nationality distribution","desc":"Nationality distribution","content":"50 Japanese, 49 Koreans and 1 Afghan"},{"title":"Gender distribution","desc":"Gender distribution","content":"males"},{"title":"Age distribution","desc":"Age distribution","content":"the young and middle-aged people are the majorities"},{"title":"Data diversity","desc":"Data diversity","content":"multiple cellphone models, different corpus"},{"title":"Device","desc":"Device","content":"cellphone"},{"title":"Data format","desc":"Data format","content":".json"},{"title":"Annotation content","desc":"Annotation content","content":"text content, age, nationality, trace of handwriting"},{"title":"Accuracy","desc":"Accuracy","content":"The annotation accuracy is not less than 95%"}],"datatag":"Japanese,Korean,Handwriting OCR,Trace of handwriting","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":["100 people","Japanese, Korean","handwritting 
OCR"],"samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY161201436_demo1695808874866/APY161201436_demo/T1317G0001S00011197.jpg","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY161201436_demo1695808874866/APY161201436_demo/T1317G0001S00011197.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=edilEs2GkZ3dqocxkFB1DadO6wI%3D","intro":"","size":0,"progress":100,"type":"jpg"},{"name":"/data/apps/damp/temp/ziptemp/APY161201436_demo1695808874866/APY161201436_demo/T1317G0001S00011243.jpg","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY161201436_demo1695808874866/APY161201436_demo/T1317G0001S00011243.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=BYZzGo9eLrV5BiPFHd1Rbq4dvao%3D","intro":"","size":0,"progress":100,"type":"jpg"},{"name":"/data/apps/damp/temp/ziptemp/APY161201436_demo1695808874866/APY161201436_demo/T1316G0013S00011063.jpg","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY161201436_demo1695808874866/APY161201436_demo/T1316G0013S00011063.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=IsBLxCaccicp28PnUjp8vn7JfmE%3D","intro":"","size":0,"progress":100,"type":"jpg"}],"officialSummary":"This dataset contains handwritten text images collected from 100 individuals, including 50 Japanese, 49 Koreans and 1 Afghan. For different subjects, the corpus are different. The data diversity includes multiple cellphone models and different corpus. 
This dataset can be used for tasks such as handwriting OCR models, handwritten text recognition systems, and multilingual OCR pipelines","dataexampl":null,"datakeyword":["handwriting OCR dataset","handwritten OCR dataset","handwriting recognition dataset","Korean handwriting OCR dataset","multilingual handwriting OCR dataset","Japanese handwriting OCR dataset"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"ocr","dataShowType":"[{\"code\":\"0\",\"language\":\"ZH\"},{\"code\":\"1\",\"language\":\"ZH\"},{\"code\":\"2\",\"language\":\"EN,JP,PT,DE,KO,FR,ES\"},{\"code\":\"3\",\"language\":\"EN\"},{\"code\":\"4\",\"language\":\"JP\"}]","productNameEn":"100 People - Handwriting OCR Data of Japanese and Korean","BGimg":"","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"],"firstList":[{"name":"/data/apps/damp/temp/ziptemp/APY161201436_demo1695808874866/APY161201436_demo/T1316G0013S00011001.jpg","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY161201436_demo1695808874866/APY161201436_demo/T1316G0013S00011001.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=N69IUdiZQhYskf%2F%2Foj3uHWeCADQ%3D","intro":"","size":0,"progress":100,"type":"jpg"}]}
Handwriting OCR Dataset – Japanese and Korean (22,163 Images)
handwriting OCR dataset
handwritten OCR dataset
handwriting recognition dataset
Korean handwriting OCR dataset
multilingual handwriting OCR dataset
Japanese handwriting OCR dataset
This dataset contains handwritten text images collected from 100 individuals, including 50 Japanese, 49 Koreans and 1 Afghan. Each subject wrote a different corpus. The data diversity includes multiple cellphone models and different corpora. This dataset can be used for tasks such as handwriting OCR models, handwritten text recognition systems, and multilingual OCR pipelines.
This is a paid dataset for commercial use, research purposes, and more. Licensed, ready-made datasets help jump-start AI projects.
Specifications
Data size
100 people; the total number of handwriting pieces is 22,163, with at least 159 handwriting pieces for each subject
Nationality distribution
50 Japanese, 49 Koreans and 1 Afghan
Gender distribution
males
Age distribution
young and middle-aged people make up the majority
Data diversity
multiple cellphone models, different corpora
Device
cellphone
Data format
.json
Annotation content
text content, age, nationality, trace of handwriting