[{"@type":"PropertyValue","name":"Data size","value":"30,000 images, including 10,000 images in Khmer (Cambodia), 10,000 images in Lao, and 10,000 images in Burmese"},{"@type":"PropertyValue","name":"Collecting environment","value":"including slogan, receipt, poster, warning sign, road sign, food packaging, billboard, station sign and signboard, etc."},{"@type":"PropertyValue","name":"Data diversity","value":"including a variety of natural scenes, multiple shooting angles"},{"@type":"PropertyValue","name":"Device","value":"cellphone"},{"@type":"PropertyValue","name":"Photographic angle","value":"looking up angle, looking down angle, eye-level angle"},{"@type":"PropertyValue","name":"Data format","value":"the image format is common format such as .jpg, the annotation file format is .json"},{"@type":"PropertyValue","name":"Annotation content","value":"line-level (column-level) quadrilateral bounding box annotation and transcription for the texts; polygon bounding box annotation and transcription for the texts"},{"@type":"PropertyValue","name":"Accuracy rate","value":"the error bound of each vertex of quadrilateral or polygon bounding box is within 5 pixels, which is a qualified annotation, the accuracy of bounding boxes is not less than 95%; the texts transcription accuracy is not less than 95%."}]
{"id":1758,"datatype":"1","titleimg":"/shujutang/static/image/index/datatang_tuxiang_default.jpg","type1":"147","type1str":null,"type2":"150","type2str":null,"dataname":"30,000 Images - Natural Scenes OCR Data in Southeast Asian Languages","datazy":[{"title":"Data size","desc":"Data size","content":"30,000 images, including 10,000 images in Khmer (Cambodia), 10,000 images in Lao, and 10,000 images in Burmese"},{"desc":"Collecting environment","content":"including slogan, receipt, poster, warning sign, road sign, food packaging, billboard, station sign and signboard, etc.","title":"Collecting environment"},{"desc":"Data diversity","content":"including a variety of natural scenes, multiple shooting angles","title":"Data diversity"},{"desc":"Device","content":"cellphone","title":"Device"},{"desc":"Photographic angle","content":"looking up angle, looking down angle, eye-level angle","title":"Photographic angle"},{"desc":"Data format","content":"the image format is common format such as .jpg, the annotation file format is .json","title":"Data format"},{"desc":"Annotation content","content":"line-level (column-level) quadrilateral bounding box annotation and transcription for the texts; polygon bounding box annotation and transcription for the texts","title":"Annotation content"},{"desc":"Accuracy rate","content":"the error bound of each vertex of quadrilateral or polygon bounding box is within 5 pixels, which is a qualified annotation, the accuracy of bounding boxes is not less than 95%; the texts transcription accuracy is not less than 95%.","title":"Accuracy rate"}],"datatag":"OCR,Southeast Asian Languages,Natural Scenes","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[{"name":"老挝2.jpg","url":"https://storage-product.datatang.com/damp/product/instructions_zh/20250408143051/%E8%80%81%E6%8C%9D2.jpg?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=s%2B1eh4MjnUp%2BNvrevGyGE8CYeks%3D","intro":"","size":2370056,"progress":100,"type":"jpg"},{"name":"柬埔寨3.jpg","url":"https://storage-product.datatang.com/damp/product/instructions_zh/20250408143051/%E6%9F%AC%E5%9F%94%E5%AF%A83.jpg?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=nkoeGAmA%2F2WQ0KLZU8gLpBpEuf4%3D","intro":"","size":192805,"progress":100,"type":"jpg"},{"name":"缅甸.jpg","url":"https://storage-product.datatang.com/damp/product/instructions_zh/20250408143051/%E7%BC%85%E7%94%B8.jpg?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=E%2FxEnHde33VDqiwLCg%2Fjls2boS0%3D","intro":"","size":1161383,"progress":100,"type":"jpg"}],"officialSummary":"30,000 natural scene OCR data for minority languages in Southeast Asia, including Khmer (Cambodia), Lao and Burmese. The diversity of collection includes a variety of natural scenes and a variety of shooting angles. This set of data can be used for Southeast Asian language OCR tasks.","dataexampl":null,"datakeyword":"OCR,Southeast Asian Languages,Natural Scenes","isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"ocr","BGimg":"","voiceBg":["/shujutang/static/image/comm/audio_bg.png","/shujutang/static/image/comm/audio_bg2.png","/shujutang/static/image/comm/audio_bg3.png","/shujutang/static/image/comm/audio_bg4.png","/shujutang/static/image/comm/audio_bg5.png"]}
[{"@type":"ImageObject","embedUrl":"https://storage-product.datatang.com/damp/product/instructions_zh/20250408143051/%E8%80%81%E6%8C%9D2.jpg?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=s%2B1eh4MjnUp%2BNvrevGyGE8CYeks%3D"},{"@type":"ImageObject","embedUrl":"https://storage-product.datatang.com/damp/product/instructions_zh/20250408143051/%E6%9F%AC%E5%9F%94%E5%AF%A83.jpg?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=nkoeGAmA%2F2WQ0KLZU8gLpBpEuf4%3D"},{"@type":"ImageObject","embedUrl":"https://storage-product.datatang.com/damp/product/instructions_zh/20250408143051/%E7%BC%85%E7%94%B8.jpg?Expires=4102415999&OSSAccessKeyId=LTAI5tEBeSWUJiqjXvBMsxEu&Signature=E%2FxEnHde33VDqiwLCg%2Fjls2boS0%3D"}]