[{"@type":"PropertyValue","name":"Storage format","value":"TXT"},{"@type":"PropertyValue","name":"Data content","value":"Chinese-German Parallel Corpus Data"},{"@type":"PropertyValue","name":"Data size","value":"5.31 million pairs of Chinese-German Parallel Corpus Data"},{"@type":"PropertyValue","name":"Language","value":"Chinese, German"},{"@type":"PropertyValue","name":"Application scenario","value":"machine translation"}]
{"id":1163,"datatype":"1","titleimg":"https://res.datatang.com/asset/productNew/APY220223002.png?Expires=2007353706&OSSAccessKeyId=LTAI5tQwXnJZbubgVfVa1ep9&Signature=M8JYEzvsPnDKH0LDXfxQAy/WPNY%3D","type1":"183","type1str":null,"type2":"185","type2str":null,"dataname":"5.3M Pairs German-Chinese Parallel Corpus for NLP and MT Applications","datazy":[{"title":"Storage format","content":"TXT","desc":"Storage format"},{"title":"Data content","content":"Chinese-Germany Parallel Corpus Data","desc":"Data content"},{"title":"Data size","content":"5.31 million pairs of Chinese-Germany Parallel Corpus Data","desc":"Data size"},{"title":"Language","content":"Chinese, Germany","desc":"Language"},{"title":"Application scenario","content":"machine translation","desc":"Application scenario"}],"datatag":"Chinese,German,Chinese-German,Parallel Corpus","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY220223001_demo1711015208453/APY220223001_demo/en-ru ????.png","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY220223001_demo1711015208453/APY220223001_demo/en-ru%20%3F%3F%3F%3F.png?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=5VAq3eE9Dwv%2F0gigvy6sJgycAkY%3D","intro":"","size":0,"progress":100,"type":"jpg"}],"officialSummary":"5.3 million Chinese-German parallel sentence pairs stored in text format, covering multiple domains such as tourism, medical treatment, daily life, news, etc. The data desensitization and quality checking had been done. 
It can be used for machine translation, NLP research, and bilingual text analysis.","dataexampl":null,"datakeyword":["german parallel corpus","chinese german sentence pairs dataset","chinese german bilingual corpus","chinese german NLP corpus","chinese german text alignment dataset"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Type","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"nlu","BGimg":"","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
5.3M Pairs German-Chinese Parallel Corpus for NLP and MT Applications
german parallel corpus
chinese german sentence pairs dataset
chinese german bilingual corpus
chinese german NLP corpus
chinese german text alignment dataset
5.3 million Chinese-German parallel sentence pairs stored in text format, covering multiple domains such as tourism, medical treatment, daily life, news, etc. Data desensitization and quality checking have been completed. It can be used for machine translation, NLP research, and bilingual text analysis.
This is a paid dataset for commercial use, research purposes, and more. Licensed, ready-made datasets help jump-start AI projects.
Specifications
Storage format
TXT
Data content
Chinese-German Parallel Corpus Data
Data size
5.31 million pairs of Chinese-German Parallel Corpus Data