[{"@type":"PropertyValue","name":"Storage format","value":"TXT"},{"@type":"PropertyValue","name":"Data content","value":"Japanese-English Parallel Corpus Data"},{"@type":"PropertyValue","name":"Data size","value":"0.38 million pairs of Japanese-English Parallel Corpus Data"},{"@type":"PropertyValue","name":"Language","value":"Japanese, English"},{"@type":"PropertyValue","name":"Application scenario","value":"machine translation"}]
{"id":153,"datatype":"1","titleimg":"https://res.datatang.com/asset/productNew/APY170101229.png?Expires=2007353639&OSSAccessKeyId=LTAI5tQwXnJZbubgVfVa1ep9&Signature=Z1i3ZVOwZNFMDzyWbqfO7ZysaZk%3D","type1":"183","type1str":null,"type2":"185","type2str":null,"dataname":"Japanese-English Parallel Corpus Dataset – 380,000 Sentence Pairs for Machine Translation","datazy":[{"title":"Storage format","desc":"Storage format","content":"TXT"},{"title":"Data content","desc":"Data content","content":"Japanese-English Parallel Corpus Data"},{"title":"Data size","desc":"Data size","content":"0.38 million pairs of Japanese-English Parallel Corpus Data"},{"title":"Language","desc":"Language","content":"Japanese, English"},{"title":"Application scenario","desc":"Application scenario","content":"machine translation"}],"datatag":"Japanese and English,Parallel Corpus","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":["380,000 groups","Japanese and English parallel corpus","exclusion of sensitive information"],"samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY170101229_demo1711015203143/APY170101229_demo/APY170101229_demo.jpg","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY170101229_demo1711015203143/APY170101229_demo/APY170101229_demo.jpg?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=EeSHuPP1R7yDj%2BCfsbiRAM2AbSI%3D","intro":"","size":0,"progress":100,"type":"jpg"}],"officialSummary":"This dataset contains 380,000 aligned Japanese-English sentence pairs. Sensitive content such as political, pornographic, and personal information has been excluded. 
It can be a base corpus for translation systems, cross-lingual information retrieval, and text-based language processing applications.","dataexampl":null,"datakeyword":["japanese english parallel corpus","japanese english translation dataset","bilingual corpus japanese english","japanese english text dataset","japanese english aligned corpus","japanese english NLP dataset"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Type","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"nlu","BGimg":"","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
Japanese-English Parallel Corpus Dataset – 380,000 Sentence Pairs for Machine Translation
japanese english parallel corpus
japanese english translation dataset
bilingual corpus japanese english
japanese english text dataset
japanese english aligned corpus
japanese english NLP dataset
This dataset contains 380,000 aligned Japanese-English sentence pairs. Sensitive content such as political, pornographic, and personal information has been excluded. It can be a base corpus for translation systems, cross-lingual information retrieval, and text-based language processing applications.
This is a paid dataset for commercial use, research purposes, and more. Licensed ready-made datasets help jump-start AI projects.
Specifications
Storage format
TXT
Data content
Japanese-English Parallel Corpus Data
Data size
0.38 million pairs of Japanese-English Parallel Corpus Data