[{"@type":"PropertyValue","name":"Format","value":"24kHz, 16 bit, wav, mono channel;"},{"@type":"PropertyValue","name":"Content category","value":"Free dialogue based on given topics"},{"@type":"PropertyValue","name":"Recording condition","value":"Low background noise (indoor);"},{"@type":"PropertyValue","name":"Recording device","value":"Android smartphone, iPhone;"},{"@type":"PropertyValue","name":"Speaker","value":"234 people, with 102 males and 132 females"},{"@type":"PropertyValue","name":"Country","value":"Japan(JPN);"},{"@type":"PropertyValue","name":"Language","value":"Japanese;"},{"@type":"PropertyValue","name":"Features of annotation","value":"Transcription text, timestamp, speaker ID, gender."},{"@type":"PropertyValue","name":"Accuracy Rate","value":"Character Accuracy Rate (CAR) 98%"}]
{"id":1703,"datatype":"1","titleimg":"https://www.nexdata.ai/shujutang/static/image/index/datatang_yuyin_default.webp","type1":"165","type1str":null,"type2":"166","type2str":null,"dataname":"200 Hours - Japanese Full-Duplex Multi-Channel Speech Dataset","datazy":[{"title":"Format","content":"24kHz, 16 bit, wav, mono channel;"},{"title":"Content category","content":"Free dialogue based on given topics"},{"title":"Recording condition","content":"Low background noise (indoor);"},{"title":"Recording device","content":"Android smartphone, iPhone;"},{"title":"Speaker","content":"234 people, with 102 males and 132 females"},{"title":"Country","content":"Japan(JPN);"},{"title":"Language","content":"Japanese;"},{"title":"Features of annotation","content":"Transcription text, timestamp, speaker ID, gender."},{"title":"Accuracy Rate","content":"Character Accuracy Rate (CAR) 98%"}],"datatag":"Japanese,Japan,Dialogue,Full-Duplex","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":null,"samplePresentation":[{"name":"G00033S0019_O1_9.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250722160934/G00033S0019_O1_9.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=g4aYYPMbEEGq1o%2FKzMEuayWuSF8%3D","intro":"徳川綱吉で、ですかね、覚えて[OVERLAP/]いま[/OVERLAP]すか。","size":207346,"progress":100,"type":"mp3"},{"name":"G00033S0019_O1_1.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250722160934/G00033S0019_O1_1.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=TJysfMzWL9uOkWb1wVG%2B3hTkQOY%3D","intro":"なんかすいません、切れちゃってごめんなさい。","size":78680,"progress":100,"type":"mp3"},{"name":"G00033S0019_O2_17.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250722160934/G000
33S0019_O2_17.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=8oNd5jsAJtQd42ajkgUjU%2F9Aah4%3D","intro":"旅行、行った時とかに見たりするんですか?[N]","size":137764,"progress":100,"type":"mp3"},{"name":"G00033S0019_O2_19.wav","url":"https://storage-product.datatang.com/damp/product/sample_presentation/20250722160934/G00033S0019_O2_19.wav?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=ZSbdBl5mI9p3aoDX9vMG1TVRjQs%3D","intro":"え、なんか印象に残ってるとか良かったお城あったりしますか。","size":203126,"progress":100,"type":"mp3"}],"officialSummary":"200 Hours Japanese Full-Duplex Multi-Channel Speech Dataset is collected from dialogues based on given topics. Transcribed with text content, speaker's ID, gender, age and other attributes. Our dataset was collected from extensive and diversify speakers, geographicly speaking, enhancing model performance in real and complex tasks. Quality tested by various AI companies. We strictly adhere to data protection regulations and privacy standards, ensuring the maintenance of user privacy and legal rights throughout the data collection, storage, and usage processes, our datasets are all GDPR, CCPA, PIPL complied.","dataexampl":null,"datakeyword":["Japanese speech dataset","spontaneous Japanese dialogue","multi-stream Japanese audio data","conversational Japanese corpus","Japanese voice dataset","full-duplex speech dataset","multi-stream speech dataset","multi-channel audio dataset"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data 
Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechRec","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
200 Hours - Japanese Full-Duplex Multi-Channel Speech Dataset
Japanese speech dataset
spontaneous Japanese dialogue
multi-stream Japanese audio data
conversational Japanese corpus
Japanese voice dataset
full-duplex speech dataset
multi-stream speech dataset
multi-channel audio dataset
The 200 Hours Japanese Full-Duplex Multi-Channel Speech Dataset is collected from dialogues based on given topics. It is transcribed with text content, speaker ID, gender, age, and other attributes. Our dataset was collected from an extensive and geographically diverse pool of speakers, enhancing model performance in real and complex tasks. Its quality has been tested by various AI companies. We strictly adhere to data protection regulations and privacy standards, ensuring the maintenance of user privacy and legal rights throughout the data collection, storage, and usage processes. All of our datasets are GDPR, CCPA, and PIPL compliant.
This is a paid dataset for commercial use, research purposes, and more. Licensed, ready-made datasets help jump-start AI projects.