{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"OlympicArena","owner":"GAIR-NLP","isFork":false,"description":"This is the official repository of the paper \"OlympicArena: Benchmarking Multi-discipline Cognitive Reasoning for Superintelligent AI\"","allTopics":[],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":1,"starsCount":81,"forksCount":3,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,5,20,22,12,0,0,0,0,0,0,0,0,0,39,29,19,0,8,0,3,2,1,1,0,0,0,0,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-27T08:24:43.567Z"}},{"type":"Public","name":"MathPile","owner":"GAIR-NLP","isFork":false,"description":"Generative AI for Math: MathPile [NeurlPS D&B 2024] ","allTopics":["math","corpus","language-model","pre-training","large-language-models"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":378,"forksCount":20,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,1,0,0,0,19,5,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,3,0,0,0,0,0,0,0,0,0,1,0,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-27T08:23:44.520Z"}},{"type":"Public","name":"ProX","owner":"GAIR-NLP","isFork":false,"description":"Offical Repo for \"Programming Every Example: Lifting Pre-training Data Quality Like Experts at Scale\"","allTopics":["data-quality","pre-training","neural-symbolic","data-centric-ai","llm"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":104,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-26T09:30:23.313Z"}},{"type":"Public","name":"ReAlign","owner":"GAIR-NLP","isFork":false,"description":"Reformatted Alignment","allTopics":["nlp","natural-language-processing","alignment","large-language-models","llms","generative-ai"],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":0,"starsCount":111,"forksCount":5,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-23T15:44:00.114Z"}},{"type":"Public","name":"math-evaluation-harness","owner":"GAIR-NLP","isFork":true,"description":"A simple toolkit for benchmarking LLMs on mathematical reasoning tasks. 🧮✨","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":9,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-19T11:17:04.458Z"}},{"type":"Public","name":"OpenResearcher","owner":"GAIR-NLP","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":2,"issueCount":0,"starsCount":384,"forksCount":27,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-11T11:09:40.769Z"}},{"type":"Public","name":"weak-to-strong-reasoning","owner":"GAIR-NLP","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":49,"forksCount":3,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-02T06:30:04.044Z"}},{"type":"Public","name":"factool","owner":"GAIR-NLP","isFork":false,"description":"FacTool: Factuality Detection in Generative AI","allTopics":["python","natural-language-processing","fact-checking","large-language-models","generative-ai","chatgpt"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":19,"starsCount":810,"forksCount":61,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-19T20:27:12.544Z"}},{"type":"Public","name":"BeHonest","owner":"GAIR-NLP","isFork":false,"description":"BeHonest: Benchmarking Honesty in Large Language Models","allTopics":["nlp","benchmark","evaluation","alignment","honesty","llm"],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":0,"starsCount":27,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-15T02:59:51.801Z"}},{"type":"Public","name":"anole","owner":"GAIR-NLP","isFork":false,"description":"Anole: An Open, Autoregressive and Native Multimodal Models for Interleaved Image-Text Generation","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":25,"starsCount":650,"forksCount":36,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-05T01:35:11.674Z"}},{"type":"Public","name":"Safety-J","owner":"GAIR-NLP","isFork":false,"description":"Safety-J: Evaluating Safety with Critique","allTopics":[],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":0,"starsCount":13,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-28T07:04:16.911Z"}},{"type":"Public","name":"MoPS","owner":"GAIR-NLP","isFork":false,"description":"[ACL 2024] Code for \"MoPS: Modular Story Premise Synthesis for Open-Ended Automatic Story Generation\"","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":30,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-19T07:39:20.796Z"}},{"type":"Public","name":"self-improvement-reversal","owner":"GAIR-NLP","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":0,"starsCount":9,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-14T16:33:16.519Z"}},{"type":"Public","name":"MetaCritique","owner":"GAIR-NLP","isFork":false,"description":"Evaluate the Quality of Critique","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":35,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T17:57:45.089Z"}},{"type":"Public","name":"alignment-for-honesty","owner":"GAIR-NLP","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":61,"forksCount":2,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-22T06:23:43.712Z"}},{"type":"Public","name":"benbench","owner":"GAIR-NLP","isFork":false,"description":"Benchmarking Benchmark Leakage in Large Language Models","allTopics":["dataset","benchmarks","leakage-detection","large-language-models"],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":3,"starsCount":40,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T01:59:32.735Z"}},{"type":"Public","name":"Preference-Dissection","owner":"GAIR-NLP","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":21,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-16T07:56:58.115Z"}},{"type":"Public","name":"cs2916","owner":"GAIR-NLP","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":21,"forksCount":8,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-12T07:37:35.074Z"}},{"type":"Public","name":"ReasonEval","owner":"GAIR-NLP","isFork":false,"description":"Evaluating Mathematical Reasoning Beyond Accuracy","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":33,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-09T09:21:30.572Z"}},{"type":"Public","name":"OPO","owner":"GAIR-NLP","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":49,"forksCount":6,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-02T15:01:34.594Z"}},{"type":"Public","name":"scaleeval","owner":"GAIR-NLP","isFork":false,"description":"Scalable Meta-Evaluation of LLMs as Evaluators","allTopics":["nlp","evaluation-framework","llm","generative-ai"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":41,"forksCount":3,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-15T13:54:40.105Z"}},{"type":"Public","name":"SimulateBench","owner":"GAIR-NLP","isFork":false,"description":"GPT as Human","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":18,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-21T09:20:34.788Z"}},{"type":"Public","name":"Entropy-ABF","owner":"GAIR-NLP","isFork":false,"description":"Official implementation for 'Extending LLMs’ Context Window with 100 Samples'","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":73,"forksCount":4,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-18T02:37:21.956Z"}},{"type":"Public","name":"auto-j","owner":"GAIR-NLP","isFork":false,"description":"Generative Judge for Evaluating Alignment","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":6,"starsCount":209,"forksCount":11,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-18T02:37:17.655Z"}},{"type":"Public","name":"abel","owner":"GAIR-NLP","isFork":false,"description":"SOTA Math Opensource LLM","allTopics":["math","llm","generative-ai"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":10,"starsCount":299,"forksCount":17,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-12T14:01:05.446Z"}},{"type":"Public","name":"ChineseFactEval","owner":"GAIR-NLP","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-13T10:27:52.810Z"}}],"repositoryCount":26,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"GAIR-NLP repositories"}