{"payload":{"header_redesign_enabled":false,"results":[{"id":"673277958","archived":false,"color":"#3572A5","followers":1620,"has_funding_file":false,"hl_name":"modelscope/data-juicer","hl_trunc_description":"A one-stop data processing system to make data higher-quality, juicier, and more digestible for LLMs! 🍎 🍋 🌽 ➡️ ➡️🍸 🍹 🍷为大语言模型提供更高质量、更丰富、更易…","language":"Python","mirror":false,"owned_by_organization":true,"public":true,"repo":{"repository":{"id":673277958,"name":"data-juicer","owner_id":109945100,"owner_login":"modelscope","updated_at":"2024-06-06T06:15:55.362Z","has_issues":true}},"sponsorable":false,"topics":["nlp","data-science","opendata","data-visualization","pytorch","dataset","chinese","data-analysis","llama","gpt","multi-modal","pre-training","sora","streamlit","gpt-4","large-language-models","llm","llms","instruction-tuning","llava"],"type":"Public","help_wanted_issues_count":0,"good_first_issue_issues_count":0,"starred_by_current_user":false}],"type":"repositories","page":1,"page_count":1,"elapsed_millis":66,"errors":[],"result_count":1,"facets":[],"protected_org_logins":[],"topics":null,"query_id":"","logged_in":false,"sign_up_path":"/signup?source=code_search_results","sign_in_path":"/login?return_to=https%3A%2F%2Fgithub.com%2Fsearch%3Fq%3Drepo%253Amodelscope%252Fdata-juicer%2B%2Blanguage%253APython","metadata":null,"csrf_tokens":{"/modelscope/data-juicer/star":{"post":"th_eLuUoQVSG1vR5bDEQVEgAP7Szd_UzEQWH6eTEccEz9ehhZvOyfdYkDSpldKJgiK2sf11DeSYwOGh0cn6qTQ"},"/modelscope/data-juicer/unstar":{"post":"LN4klUrfIXiFEhWTKxtEr_vyGTPQ2V32VSZ_6oUv9JAjEqcImtorTWG25IaBwwDhXWobP8vmTfDldbSmaV7eog"},"/sponsors/batch_deferred_sponsor_buttons":{"post":"CgpsZ2V2guc9Lj62_Aig0vmYu3jfehK_vSfIpXeR56qXqLozIKrXGsqkJCrYGaYKuKN6nLtV1kokapB2a-q44Q"}}},"title":"Repository search results"}