[{"@type":"PropertyValue","name":"Data size","value":"202 people, each person collects the audio and video data from 13 different angles +1 txt document"},{"@type":"PropertyValue","name":"People distribution","value":"race distribution: Asian (Indonesia), gender distribution: 89 males, 113 females, age distribution: 165 people aged 18-30, 32 people aged 31-45, and 5 people aged 46-60"},{"@type":"PropertyValue","name":"Collecting environment","value":"indoor natural light scenes, indoor fluorescent lamp scenes"},{"@type":"PropertyValue","name":"Data diversity","value":"including multiple scenes, different ages, different shooting angles"},{"@type":"PropertyValue","name":"Device","value":"cellphone, the resolution is 1,920*1,080"},{"@type":"PropertyValue","name":"Collecting angle","value":"audio and video data of front face, 3 angles left side face, 3 angles right side face, looking down, looking up, left side face down, right side face down, left side face up and right side face up all 13 different angles were collected at the same time"},{"@type":"PropertyValue","name":"Recording content","value":"general field, unlimited content"},{"@type":"PropertyValue","name":"Language","value":"Mandarin Chinese, each video is more than 20 seconds"},{"@type":"PropertyValue","name":"Data format","value":"the video data format is .mp4, the audio is greater than or equal to 16KHz, 16bit, the frame rate is 25-30 fps"},{"@type":"PropertyValue","name":"Accuracy rata","value":"the accuracy rate of word is more than 95%"}]
{"id":1298,"datatype":"1","titleimg":"[{\"name\": \"APY230627001.jpg\", \"url\": \"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/asset/productNew/nexdata/APY230627001.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=APun%2FFClw%2Fz8gHzlhCPPBIQlbos%3D\", \"size\": 2048, \"progress\": 100}]","type1":"147","type1str":null,"type2":"149","type2str":null,"dataname":"202 People - Multi-angle Lip Multimodal Video Data","datazy":[{"title":"Data size","desc":"Data size","content":"202 people, each person collects the audio and video data from 13 different angles +1 txt document"},{"title":"People distribution","desc":"People distribution","content":"race distribution: Asian (Indonesia), gender distribution: 89 males, 113 females, age distribution: 165 people aged 18-30, 32 people aged 31-45, and 5 people aged 46-60"},{"title":"Collecting environment","desc":"Collecting environment","content":"indoor natural light scenes, indoor fluorescent lamp scenes"},{"title":"Data diversity","desc":"Data diversity","content":"including multiple scenes, different ages, different shooting angles"},{"title":"Device","desc":"Device","content":"cellphone, the resolution is 1,920*1,080"},{"title":"Collecting angle","desc":"Collecting angle","content":"audio and video data of front face, 3 angles left side face, 3 angles right side face, looking down, looking up, left side face down, right side face down, left side face up and right side face up all 13 different angles were collected at the same time"},{"title":"Recording content","desc":"Recording content","content":"general field, unlimited content"},{"title":"Language","desc":"Language","content":"Mandarin Chinese, each video is more than 20 seconds"},{"title":"Data format","desc":"Data format","content":"the video data format is .mp4, the audio is greater than or equal to 16KHz, 16bit, the frame rate is 25-30 fps"},{"title":"Accuracy rata","desc":"Accuracy rata","content":"the accuracy rate of word is more than 95%"}],"datatag":"Lip multimodal,Mandarin Chinese,Multiple scenes,Different ages,Different shooting angles","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/002_male_29.png","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/002_male_29.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=ALASNNOKRu%2FsdItuxWu7btO8Gqs%3D","intro":"","size":0,"progress":100,"type":"jpg"},{"name":"/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/001_female_30.png","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/001_female_30.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=mZRLnTYk5W0s3jRzP7Um81hhRvw%3D","intro":"","size":0,"progress":100,"type":"jpg"},{"name":"/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/156_male_42.png","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/156_male_42.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=2wVvKW6e6XgkYOi9kPqptswFKGs%3D","intro":"","size":0,"progress":100,"type":"jpg"}],"officialSummary":"202 People - Multi-angle Lip Multimodal Video Data. The collection environments include indoor natural light scenes and indoor fluorescent lamp scenes. The device is cellphone. The diversity includes multiple scenes, different ages, 13 shooting angles. The language is Mandarin Chinese. The recording content is general field, unlimited content. The data can be used in multi-modal learning algorithms research in speech and image fields.","dataexampl":null,"datakeyword":["Multi-angle"," lip multimodal","indoor natural light scenes","indoor fluorescent lamp scenes"," 13 shooting angles"," Mandarin Chinese","general field"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Language,Data Type","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechRec","BGimg":"","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"],"firstList":[{"name":"/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/090_female_38.png","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/090_female_38.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=c6Jkb362VMrtxemlPNPSW%2FkEH%2Fk%3D","intro":"","size":0,"progress":100,"type":"jpg"}]}
[{"@type":"ImageObject","embedUrl":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/002_male_29.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=ALASNNOKRu%2FsdItuxWu7btO8Gqs%3D"},{"@type":"ImageObject","embedUrl":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/001_female_30.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=mZRLnTYk5W0s3jRzP7Um81hhRvw%3D"},{"@type":"ImageObject","embedUrl":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/156_male_42.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=2wVvKW6e6XgkYOi9kPqptswFKGs%3D"},{"@type":"ImageObject","embedUrl":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY230627001_demo1715767204254/APY230627001_demo/090_female_38.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=c6Jkb362VMrtxemlPNPSW%2FkEH%2Fk%3D"}]
202 People - Multi-angle Lip Multimodal Video Data
Multi-angle
lip multimodal
indoor natural light scenes
indoor fluorescent lamp scenes
13 shooting angles
Mandarin Chinese
general field
202 People - Multi-angle Lip Multimodal Video Data. The collection environments include indoor natural light scenes and indoor fluorescent lamp scenes. The device is cellphone. The diversity includes multiple scenes, different ages, 13 shooting angles. The language is Mandarin Chinese. The recording content is general field, unlimited content. The data can be used in multi-modal learning algorithms research in speech and image fields.
This is a paid datasets for commercial use, research purpose and more. Licensed ready made datasets help jump-start AI projects.
Specifications
Data size
202 people, each person collects the audio and video data from 13 different angles +1 txt document
People distribution
race distribution: Asian (Indonesia), gender distribution: 89 males, 113 females, age distribution: 165 people aged 18-30, 32 people aged 31-45, and 5 people aged 46-60
Collecting environment
indoor natural light scenes, indoor fluorescent lamp scenes
Data diversity
including multiple scenes, different ages, different shooting angles
Device
cellphone, the resolution is 1,920*1,080
Collecting angle
audio and video data of front face, 3 angles left side face, 3 angles right side face, looking down, looking up, left side face down, right side face down, left side face up and right side face up all 13 different angles were collected at the same time
Recording content
general field, unlimited content
Language
Mandarin Chinese, each video is more than 20 seconds
Data format
the video data format is .mp4, the audio is greater than or equal to 16KHz, 16bit, the frame rate is 25-30 fps
Accuracy rata
the accuracy rate of word is more than 95%
Sample
Recommended Dataset
Tell Us Your Special Needs
82499c90-0f92-49b1-9d98-fa7b31ca535e