| --- | |
| license: openrail | |
| datasets: | |
| - vikp/textbook_quality_programming | |
| - irds/codesearchnet | |
| - giganticode/java-cmpx-v1 | |
| - nickrosh/Evol-Instruct-Code-80k-v1 | |
| - bigcode/starcoderdata | |
| - bigcode/the-stack | |
| - bigcode/the-stack-smol | |
| - Cdaprod/AI-Developer-Prompts | |
| - code_x_glue_ct_code_to_text | |
| - codeparrot/github-code | |
| - codeparrot/github-code-clean | |
| - code_x_glue_cc_code_completion_line | |
| - >- | |
| autoevaluate/autoeval-eval-jeffdshen__inverse_superglue_mixedp1-jeffdshen__inverse-63643c-1665558893 | |
| - bentrevett/multi30k | |
| - edbeeching/decision_transformer_gym_replay | |
| - psyche/common_crawl | |
| - Birchlabs/openai-prm800k-solutions-only | |
| - openchat/openchat_sharegpt4_dataset | |
| - Open-Orca/OpenOrca | |
| - cjvt/slownet | |
| - para_crawl | |
| - zeroshot/twitter-financial-news-sentiment | |
| - laugustyniak/political-advertising-pl | |
| - code_search_net | |
| - sukaka/novelai-webui | |
| - P1ayer-1/chatgpt-conversations-chatlogs.net | |
| - daniel2588/sarcasm | |
| - psmathur/orca_minis_uncensored_dataset | |
| - player1537/Bloom-560m-trained-on-Wizard-Vicuna-Uncensored-trained-on-Based | |
| - shahules786/prosocial-nsfw-reddit | |
| - Thewillonline/reddit-sarcasm | |
| - datasciencemmw/current-data | |
| - Oniichat/bluemoon_roleplay_chat_data_300k_messages | |
| - dell-research-harvard/AmericanStories | |
| - b-mc2/sql-create-context | |
| language: | |
| - en | |
| - it | |
| - fr | |
| - pt | |
| - la | |
| - ru | |
| - ro | |
| - el | |
| metrics: | |
| - accuracy | |
| - bertscore | |
| - bleu | |
| - code_eval | |