{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"MinerU","owner":"opendatalab","isFork":false,"description":"A one-stop, open-source, high-quality data extraction tool, supports PDF/webpage/e-book extraction.一站式开源高质量数据提取工具,支持PDF/网页/多格式电子书提取。","allTopics":["python","pdf","parser","ocr","pdf-converter","extract-data","document-analysis","pdf-parser","layout-analysis","ai4science","pdf-extractor-rag","pdf-extractor-llm","pdf-extractor-pretrain"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":6,"issueCount":137,"starsCount":10960,"forksCount":810,"license":"GNU Affero General Public License v3.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,50,28,60,51,29,18,111,87,142,22,52,11,22,8,34,23,29,71,32,109,41,58,89,61,10,6,5,4],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-09T13:00:47.449Z"}},{"type":"Public","name":"CLIP-Parrot-Bias","owner":"opendatalab","isFork":false,"description":"ECCV2024_Parrot Captions Teach CLIP to Spot Text","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":54,"forksCount":2,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,9,2,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-06T15:31:29.989Z"}},{"type":"Public","name":"UniMERNet","owner":"opendatalab","isFork":false,"description":"UniMERNet: A Universal Network for Real-World Mathematical Expression Recognition","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":150,"forksCount":12,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,2,0,0,0,0,2,0,0,0,0,0,3,0,1,0,0,0,2,16],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-06T09:15:30.440Z"}},{"type":"Public","name":"MLS-BRN","owner":"opendatalab","isFork":false,"description":"[CVPR 2024] 3D Building Reconstruction from Monocular Remote Sensing Images with Multi-level Supervisions","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":31,"forksCount":2,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-30T09:14:57.032Z"}},{"type":"Public","name":"labelU","owner":"opendatalab","isFork":false,"description":"Data annotation toolbox supports image, audio and video data.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":9,"starsCount":746,"forksCount":67,"license":null,"participation":[8,6,0,0,16,1,13,18,9,12,1,0,14,0,0,0,0,2,1,21,148,15,0,13,22,2,19,28,0,4,0,50,3,0,0,0,0,0,0,0,0,0,0,0,1,2,0,20,3,2,2,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-29T03:44:40.129Z"}},{"type":"Public","name":"PDF-Extract-Kit","owner":"opendatalab","isFork":false,"description":"A Comprehensive Toolkit for High-Quality PDF Content Extraction","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":4,"issueCount":30,"starsCount":4640,"forksCount":309,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,18,14,5,22,2,7,0,0,0,2,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-28T08:25:04.610Z"}},{"type":"Public","name":"Miner-PDF-Benchmark","owner":"opendatalab","isFork":false,"description":"MPB (Miner-PDF-Benchmark) is an end-to-end PDF document comprehension evaluation suite designed for large-scale model data scenarios.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":6,"starsCount":10,"forksCount":5,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,8,16,14,0,0,0,10,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-02T13:55:19.489Z"}},{"type":"Public","name":"CHARM","owner":"opendatalab","isFork":false,"description":"[ACL 2024 Main Conference] Chinese commonsense benchmark for LLMs","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":23,"forksCount":2,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,6,0,0,0,0,0,0,0,0,1,1,6,0,0,0,0,0,0,1,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-27T01:54:23.390Z"}},{"type":"Public","name":"magic-doc","owner":"opendatalab","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":17,"starsCount":299,"forksCount":22,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7,103,58,30,36,37,25,7,5,2,13,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-26T12:50:22.765Z"}},{"type":"Public","name":"magic-html","owner":"opendatalab","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":162,"forksCount":13,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,11,2,0,3,4,0,0,2,0,0,0,1,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-18T10:38:15.069Z"}},{"type":"Public","name":"MLLM-DataEngine","owner":"opendatalab","isFork":false,"description":"MLLM-DataEngine: An Iterative Refinement Approach for MLLM","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":34,"forksCount":3,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-24T05:03:28.409Z"}},{"type":"Public","name":"image-downloader","owner":"opendatalab","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":24,"forksCount":3,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-13T14:56:48.745Z"}},{"type":"Public","name":"VIGC","owner":"opendatalab","isFork":false,"description":"AAAI 2024: Visual Instruction Generation and Correction ","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":86,"forksCount":3,"license":"Apache License 2.0","participation":[12,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-04T09:21:58.742Z"}},{"type":"Public","name":"HA-DPO","owner":"opendatalab","isFork":false,"description":"Beyond Hallucinations: Enhancing LVLMs through Hallucination-Aware Direct Preference Optimization","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":57,"forksCount":4,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-30T09:10:30.545Z"}},{"type":"Public","name":"opendatalab-python-sdk","owner":"opendatalab","isFork":false,"description":"SDK of OpenDataLab - https://opendatalab.org.cn","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":2,"starsCount":56,"forksCount":4,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-01T07:03:48.760Z"}},{"type":"Public","name":"laion5b-downloader","owner":"opendatalab","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":90,"forksCount":7,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-05-16T09:35:40.155Z"}},{"type":"Public","name":"allz","owner":"opendatalab","isFork":false,"description":"A universal command line tool for compression and decompression","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":4,"forksCount":0,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-02-17T08:34:05.444Z"}},{"type":"Public","name":"labelU-ML","owner":"opendatalab","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-06T07:39:14.486Z"}}],"repositoryCount":18,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"opendatalab repositories"}