Skip to content

Commit

Permalink
update hf url
Browse files (browse the repository at this point in the history)
  • Loading branch information
松灵 committed Dec 27, 2024
1 parent 6ece6c4 commit 5b7ab08
Showing 1 changed file with 39 additions and 39 deletions.
78 changes: 39 additions & 39 deletions vlmeval/dataset/image_ccocr.py
Original file line number | Diff line number | Diff line change
@@ -57,45 +57,45 @@ class CCOCRDataset(ImageBaseDataset):
}

DATASET_URL_HUGGINGFACE = {
- "CCOCR_DocParsing_DocPhotoChn": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/doc_parsing/doc/doc_photo_chn_75.tsv",
- "CCOCR_DocParsing_DocPhotoEng": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/doc_parsing/doc/doc_photo_eng_75.tsv",
- "CCOCR_DocParsing_DocScanChn": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/doc_parsing/doc/doc_scan_chn_75.tsv",
- "CCOCR_DocParsing_DocScanEng": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/doc_parsing/doc/doc_scan_eng_75.tsv",
- "CCOCR_DocParsing_TablePhotoChn": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/doc_parsing/table/table_photo_chn_75.tsv",
- "CCOCR_DocParsing_TablePhotoEng": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/doc_parsing/table/table_photo_eng_75.tsv",
- "CCOCR_DocParsing_TableScanChn": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/doc_parsing/table/table_scan_chn_75.tsv",
- "CCOCR_DocParsing_TableScanEng": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/doc_parsing/table/table_scan_eng_75.tsv",
- "CCOCR_DocParsing_MolecularHandwriting": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/doc_parsing/molecular/molecular_handwriting_100.tsv",
- "CCOCR_DocParsing_FormulaHandwriting": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/doc_parsing/formula/formula_handwriting_100.tsv",
- "CCOCR_Kie_Sroie2019Word": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/kie/constrained_category/sroie2019_word_347.tsv",
- "CCOCR_Kie_Cord": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/kie/constrained_category/CORD_100.tsv",
- "CCOCR_Kie_EphoieScut": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/kie/constrained_category/EPHOIE_SCUT_311.tsv",
- "CCOCR_Kie_Poie": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/kie/constrained_category/POIE_250.tsv",
- "CCOCR_Kie_ColdSibr": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/kie/open_category/COLD_SIBR_400.tsv",
- "CCOCR_Kie_ColdCell": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/kie/open_category/COLD_CELL_600.tsv",
- "CCOCR_MultiLanOcr_Arabic": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_lan_ocr/Arabic/Arabic_150.tsv",
- "CCOCR_MultiLanOcr_French": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_lan_ocr/French/French_150.tsv",
- "CCOCR_MultiLanOcr_German": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_lan_ocr/German/German_150.tsv",
- "CCOCR_MultiLanOcr_Italian": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_lan_ocr/Italian/Italian_150.tsv",
- "CCOCR_MultiLanOcr_Japanese": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_lan_ocr/Japanese/Japanese_150.tsv",
- "CCOCR_MultiLanOcr_Korean": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_lan_ocr/Korean/Korean_150.tsv",
- "CCOCR_MultiLanOcr_Portuguese": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_lan_ocr/Portuguese/Portuguese_150.tsv",
- "CCOCR_MultiLanOcr_Russian": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_lan_ocr/Russian/Russian_150.tsv",
- "CCOCR_MultiLanOcr_Spanish": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_lan_ocr/Spanish/Spanish_150.tsv",
- "CCOCR_MultiLanOcr_Vietnamese": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_lan_ocr/Vietnamese/Vietnamese_150.tsv",
- "CCOCR_MultiSceneOcr_Cord": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/document_text/CORD_100.tsv",
- "CCOCR_MultiSceneOcr_Funsd": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/document_text/FUNSD_50.tsv",
- "CCOCR_MultiSceneOcr_Iam": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/document_text/IAM_50.tsv",
- "CCOCR_MultiSceneOcr_ZhDoc": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/document_text/zh_doc_100.tsv",
- "CCOCR_MultiSceneOcr_ZhHandwriting": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/document_text/zh_handwriting_50.tsv",
- "CCOCR_MultiSceneOcr_Hieragent": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/scene_text/Hieragent_100.tsv",
- "CCOCR_MultiSceneOcr_Ic15": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/scene_text/IC15_500.tsv",
- "CCOCR_MultiSceneOcr_Inversetext": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/scene_text/InverseText_500.tsv",
- "CCOCR_MultiSceneOcr_Totaltext": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/scene_text/TotalText_300.tsv",
- "CCOCR_MultiSceneOcr_ZhScene": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/scene_text/zh_scene_450.tsv",
- "CCOCR_MultiSceneOcr_UgcLaion": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/ugc_text/ugc_laion_400.tsv",
- "CCOCR_MultiSceneOcr_ZhDense": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/ugc_text/zh_dense_50.tsv",
- "CCOCR_MultiSceneOcr_ZhVertical": "https://huggingface.co/datasets/Qwen/CC-OCR/resolve/main/multi_scene_ocr/ugc_text/zh_vertical_100.tsv"
+ "CCOCR_DocParsing_DocPhotoChn": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/doc_parsing/doc/doc_photo_chn_75.tsv",
+ "CCOCR_DocParsing_DocPhotoEng": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/doc_parsing/doc/doc_photo_eng_75.tsv",
+ "CCOCR_DocParsing_DocScanChn": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/doc_parsing/doc/doc_scan_chn_75.tsv",
+ "CCOCR_DocParsing_DocScanEng": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/doc_parsing/doc/doc_scan_eng_75.tsv",
+ "CCOCR_DocParsing_TablePhotoChn": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/doc_parsing/table/table_photo_chn_75.tsv",
+ "CCOCR_DocParsing_TablePhotoEng": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/doc_parsing/table/table_photo_eng_75.tsv",
+ "CCOCR_DocParsing_TableScanChn": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/doc_parsing/table/table_scan_chn_75.tsv",
+ "CCOCR_DocParsing_TableScanEng": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/doc_parsing/table/table_scan_eng_75.tsv",
+ "CCOCR_DocParsing_MolecularHandwriting": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/doc_parsing/molecular/molecular_handwriting_100.tsv",
+ "CCOCR_DocParsing_FormulaHandwriting": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/doc_parsing/formula/formula_handwriting_100.tsv",
+ "CCOCR_Kie_Sroie2019Word": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/kie/constrained_category/sroie2019_word_347.tsv",
+ "CCOCR_Kie_Cord": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/kie/constrained_category/CORD_100.tsv",
+ "CCOCR_Kie_EphoieScut": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/kie/constrained_category/EPHOIE_SCUT_311.tsv",
+ "CCOCR_Kie_Poie": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/kie/constrained_category/POIE_250.tsv",
+ "CCOCR_Kie_ColdSibr": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/kie/open_category/COLD_SIBR_400.tsv",
+ "CCOCR_Kie_ColdCell": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/kie/open_category/COLD_CELL_600.tsv",
+ "CCOCR_MultiLanOcr_Arabic": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_lan_ocr/Arabic/Arabic_150.tsv",
+ "CCOCR_MultiLanOcr_French": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_lan_ocr/French/French_150.tsv",
+ "CCOCR_MultiLanOcr_German": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_lan_ocr/German/German_150.tsv",
+ "CCOCR_MultiLanOcr_Italian": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_lan_ocr/Italian/Italian_150.tsv",
+ "CCOCR_MultiLanOcr_Japanese": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_lan_ocr/Japanese/Japanese_150.tsv",
+ "CCOCR_MultiLanOcr_Korean": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_lan_ocr/Korean/Korean_150.tsv",
+ "CCOCR_MultiLanOcr_Portuguese": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_lan_ocr/Portuguese/Portuguese_150.tsv",
+ "CCOCR_MultiLanOcr_Russian": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_lan_ocr/Russian/Russian_150.tsv",
+ "CCOCR_MultiLanOcr_Spanish": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_lan_ocr/Spanish/Spanish_150.tsv",
+ "CCOCR_MultiLanOcr_Vietnamese": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_lan_ocr/Vietnamese/Vietnamese_150.tsv",
+ "CCOCR_MultiSceneOcr_Cord": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/document_text/CORD_100.tsv",
+ "CCOCR_MultiSceneOcr_Funsd": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/document_text/FUNSD_50.tsv",
+ "CCOCR_MultiSceneOcr_Iam": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/document_text/IAM_50.tsv",
+ "CCOCR_MultiSceneOcr_ZhDoc": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/document_text/zh_doc_100.tsv",
+ "CCOCR_MultiSceneOcr_ZhHandwriting": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/document_text/zh_handwriting_50.tsv",
+ "CCOCR_MultiSceneOcr_Hieragent": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/scene_text/Hieragent_100.tsv",
+ "CCOCR_MultiSceneOcr_Ic15": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/scene_text/IC15_500.tsv",
+ "CCOCR_MultiSceneOcr_Inversetext": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/scene_text/InverseText_500.tsv",
+ "CCOCR_MultiSceneOcr_Totaltext": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/scene_text/TotalText_300.tsv",
+ "CCOCR_MultiSceneOcr_ZhScene": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/scene_text/zh_scene_450.tsv",
+ "CCOCR_MultiSceneOcr_UgcLaion": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/ugc_text/ugc_laion_400.tsv",
+ "CCOCR_MultiSceneOcr_ZhDense": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/ugc_text/zh_dense_50.tsv",
+ "CCOCR_MultiSceneOcr_ZhVertical": "https://huggingface.co/datasets/wulipc/CC-OCR/resolve/main/multi_scene_ocr/ugc_text/zh_vertical_100.tsv"
}

# define data path
Expand Down

0 comments on commit 5b7ab08

Please sign in to comment.