Update README.md
Browse files
README.md
CHANGED
@@ -3,4 +3,70 @@ license: deepfloyd-if-license
|
|
3 |
datasets:
|
4 |
- microsoft/orca-agentinstruct-1M-v1
|
5 |
- OpenCoder-LLM/opc-sft-stage1
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6 |
---
|
|
|
3 |
datasets:
|
4 |
- microsoft/orca-agentinstruct-1M-v1
|
5 |
- OpenCoder-LLM/opc-sft-stage1
|
6 |
+
- fka/awesome-chatgpt-prompts
|
7 |
+
- HuggingFaceTB/smoltalk
|
8 |
+
- alpindale/two-million-bluesky-posts
|
9 |
+
- bluesky-community/one-million-bluesky-posts
|
10 |
+
- dijihax/Dataset
|
11 |
+
- internlm/Lean-Workbook
|
12 |
+
- PleIAs/common_corpus
|
13 |
+
- O1-OPEN/OpenO1-SFT
|
14 |
+
- allenai/tulu-3-sft-mixture
|
15 |
+
- OpenCoder-LLM/RefineCode-code-corpus-meta
|
16 |
+
- OpenCoder-LLM/opc-fineweb-code-corpus
|
17 |
+
- iamtarun/python_code_instructions_18k_alpaca
|
18 |
+
- codeparrot/github-code
|
19 |
+
- nenad1002/quantum_science_research_dataset
|
20 |
+
- quantumiracle-git/robotinder-data
|
21 |
+
- open-llm-leaderboard-old/details_quantumaikr__KoreanLM-hf
|
22 |
+
- chemora/EntanglementDetectionDataSet
|
23 |
+
- glaiveai/glaive-function-calling-v2
|
24 |
+
- Salesforce/xlam-function-calling-60k
|
25 |
+
- NousResearch/hermes-function-calling-v1
|
26 |
+
- >-
|
27 |
+
Younes-Abdeahad-Software-Requirements/FNFC-Functional_Non-Functional_Classification
|
28 |
+
- cgoosen/prompt_injection_password_or_secret
|
29 |
+
- google/frames-benchmark
|
30 |
+
- Kaeyze/computer-science-synthetic-dataset
|
31 |
+
- gretelai/gretel-text-to-python-fintech-en-v1
|
32 |
+
- Vezora/Tested-143k-Python-Alpaca
|
33 |
+
- Nan-Do/instructional_code-search-net-python
|
34 |
+
- hackaprompt/hackaprompt-dataset
|
35 |
+
- hackercupai/hackercup
|
36 |
+
- OpenPipe/hacker-news
|
37 |
+
- open-phi/programming_books_llama
|
38 |
+
- kanhatakeyama/wizardlm8x22b-logical-math-coding-sft
|
39 |
+
- datatune/LogiCoT
|
40 |
+
- kanhatakeyama/LogicalDatasetsByMixtral8x22b
|
41 |
+
- dongyu0205/working-memory-capacity-of-ChatGPT
|
42 |
+
- memorylost731/linux_man_pages_library
|
43 |
+
- mmathys/openai-moderation-api-evaluation
|
44 |
+
- BAAI/IndustryCorpus2_current_affairs_government_administration
|
45 |
+
- bigcode/admin
|
46 |
+
- HuggingFaceFW/admin
|
47 |
+
- HuggingFaceFW/fineweb-edu
|
48 |
+
- HuggingFaceFV/finevideo
|
49 |
+
- lmms-lab/LLaVA-Video-178K
|
50 |
+
- Wild-Heart/Disney-VideoGeneration-Dataset
|
51 |
+
- DL3DV/DL3DV-ALL-video
|
52 |
+
- laion/laion-high-resolution
|
53 |
+
- joey234/mmlu-high_school_computer_science-neg
|
54 |
+
- sentence-transformers/embedding-training-data
|
55 |
+
- Cohere/wikipedia-22-12-en-embeddings
|
56 |
+
- philschmid/finanical-rag-embedding-dataset
|
57 |
+
- jwaters8978/web_scraper_dataset
|
58 |
+
- jwaters8978/web_scraper_dataset_2
|
59 |
+
- ammarnasr/the-stack-java-clean
|
60 |
+
- angie-chen55/javascript-github-code
|
61 |
+
- anjandash/java-8m-methods-v2
|
62 |
+
- Vikhrmodels/physics_big
|
63 |
+
- k-mktr/improved-flux-prompts-photoreal-portrait
|
64 |
+
- jacobcd52/physics-papers
|
65 |
+
- zeroshot/arxiv-biology
|
66 |
+
- joey234/mmlu-college_biology-neg
|
67 |
+
- cmcmaster/rheumatology-biologics-dataset
|
68 |
+
- HAERAE-HUB/QARV-KOEN-10M-Entangled
|
69 |
+
- Qutiba/LinuxCommands_Virsh_KVM_Docker_2
|
70 |
+
- MattCoddity/docker_ps
|
71 |
+
- adeocybersecurity/DockerCommand
|
72 |
---
|