[{"@type":"PropertyValue","name":"Data size","value":"10,000 images, 1,000 videos"},{"@type":"PropertyValue","name":"Race distribution","value":"Caucasian, black, Asian"},{"@type":"PropertyValue","name":"Gender distribution","value":"male, female"},{"@type":"PropertyValue","name":"Age distribution","value":"from teenagers to old age, mainly young and middle-aged"},{"@type":"PropertyValue","name":"Collection environment","value":"including indoor scenes and outdoor scenes"},{"@type":"PropertyValue","name":"Collection diversity","value":"different age groups, different collection environments, different seasons, various shooting angles, and various human behaviors"},{"@type":"PropertyValue","name":"Data format","value":"image format is .jpg, video format is .mp4, text format is .txt"},{"@type":"PropertyValue","name":"Description language","value":"English, Chinese"},{"@type":"PropertyValue","name":"Text length","value":"in principle, 30~60 words, usually 3-5 sentences"},{"@type":"PropertyValue","name":"Main description content","value":"gender, age, clothing, behavior description, body movements"},{"@type":"PropertyValue","name":"Accuracy rate","value":"the proportion of correctly labeled images is not less than 97%"}]
{"id":1289,"datatype":"1","titleimg":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/asset/productNew/nexdata/APY231231007.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=TB1%2FMNmvxZxSLSxYIQtQjLBQTnw%3D","type1":"226","type1str":null,"type2":"226","type2str":null,"dataname":"11,000 Image & Video Caption Data of Human Action","datazy":[{"title":"Data size","value":"10,000 images, 1,000 videos"},{"title":"Race distribution","value":"Caucasian, black, Asian"},{"title":"Gender distribution","value":"male, female"},{"title":"Age distribution","value":"from teenagers to old age, mainly young and middle-aged"},{"title":"Collection environment","value":"including indoor scenes and outdoor scenes"},{"title":"Collection diversity","value":"different age groups, different collection environments, different seasons, various shooting angles, and various human behaviors"},{"title":"Data format","value":"image format is .jpg, video format is .mp4, text format is .txt"},{"title":"Description language","value":"English, Chinese"},{"title":"Text length","value":"in principle, 30~60 words, usually 3-5 sentences"},{"title":"Main description content","value":"gender, age, clothing, behavior description, body movements"},{"title":"Accuracy rate","value":"the proportion of correctly labeled images is not less than 97%"}],"datatag":"AIGC,Multi-modal,English caption,Different age groups,Different lighting,Different collection environments,Different seasons of clothing,Various human 
behaviors","technologydoc":null,"downurl":null,"datainfo":"","standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[["jpg","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY231231007_demo1717063200761/%3F%3F13.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=7JIEMolkYVV3EuqbezFBR7QmcQw%3D","/data/apps/damp/temp/ziptemp/APY231231007_demo1717063200761/??13.png",""],["jpg","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY231231007_demo1717063200761/%3F%3F12.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=J6yeSYbccfJrkayGKnozKse1EWM%3D","/data/apps/damp/temp/ziptemp/APY231231007_demo1717063200761/??12.png",""],["jpg","https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY231231007_demo1717063200761/%3F%3F11.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=TWegv%2FWb9d%2Ffyb4kf5ZqAmdXobQ%3D","/data/apps/damp/temp/ziptemp/APY231231007_demo1717063200761/??11.png",""]],"officialSummary":"11,000 Image & Video caption data of human action contains 10,000 images and 1,000 videos of various human behaviors in different seasons and different shooting angles, including indoor scenes and outdoor scenes. 
The description language is English, mainly describing the gender, age, clothing, behavior description and body movements of the characters.","dataexampl":"","datakeyword":["AIGC"," human behavior data"," behavior recognition data"," human behavior recognition data"," human detection data"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Type","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"llm","BGimg":"","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"],"single":"no"}
11,000 Image & Video caption data of human action contains 10,000 images and 1,000 videos of various human behaviors in different seasons and different shooting angles, including indoor scenes and outdoor scenes. The description language is English, mainly describing the gender, age, clothing, behavior description and body movements of the characters.
This is a paid dataset for commercial use, research purposes, and more. Licensed ready-made datasets help jump-start AI projects.
Specifications
Data size
10,000 images, 1,000 videos
Race distribution
Caucasian, black, Asian
Gender distribution
male, female
Age distribution
from teenagers to old age, mainly young and middle-aged
Collection environment
including indoor scenes and outdoor scenes
Collection diversity
different age groups, different collection environments, different seasons, various shooting angles, and various human behaviors
Data format
image format is .jpg, video format is .mp4, text format is .txt
Description language
English, Chinese
Text length
in principle, 30~60 words, usually 3-5 sentences
Main description content
gender, age, clothing, behavior description, body movements
Accuracy rate
the proportion of correctly labeled images is not less than 97%