distributed/llama-1b
1B
•
Updated
•
120k
distributed/optimized-gpt2-1b
Text Generation
•
1B
•
Updated
•
87
distributed/gpt2-1b-bs2048-nodt-1_1
distributed/optimized-gpt2-1b-vtestnet-v1
Text Generation
•
1B
•
Updated
•
80
distributed/optimized-gpt2-2b
Text Generation
•
2B
•
Updated
•
45
•
5
distributed/optimized-gpt2-500m
Text Generation
•
0.5B
•
Updated
•
12
distributed/optimized-gpt2-1b-stable-embeddings
Text Generation
•
1B
•
Updated
•
11
distributed/optimized-gpt2-2b-vtestnet-v1
Text Generation
•
2B
•
Updated
•
9
distributed/optimized-gpt2-2b-without-stable-embeddings
Text Generation
•
2B
•
Updated
•
29
distributed/optimized-gpt2-1b-vtestnet-v2
Text Generation
•
1B
•
Updated
•
19
distributed/optimized-gpt2-1b-v0.3.2
Updated
distributed/optimized-gpt2-1b-vtestnet-v3
distributed/optimized-gpt2-1b-vtestnet
distributed/optimized-gpt2-5b
Text Generation
•
5B
•
Updated
•
9
distributed/optimized-gpt2-250m
Text Generation
•
0.3B
•
Updated
•
9
distributed/optimized-gpt2-250m-v0.1.2
Text Generation
•
0.3B
•
Updated
•
40
distributed/optimized-gpt2-250m-convergence-test-v1
Text Generation
•
0.3B
•
Updated
•
9
distributed/optimized-gpt2-250m-convergence-test-v2
Text Generation
•
0.3B
•
Updated
•
44
•
1
distributed/optimized-gpt2-250m-v0.1.1
Text Generation
•
0.3B
•
Updated
•
10
distributed/gpt2-94m
Text Generation
•
0.1B
•
Updated
•
8
distributed/optimized-gpt2-124m
Text Generation
•
0.1B
•
Updated
•
15
distributed/gpt2-250m-convergence-test
Text Generation
•
0.1B
•
Updated
•
11
distributed/gpt2-1b
Text Generation
•
1B
•
Updated
•
8
distributed/gpt2-2b
Text Generation
•
2B
•
Updated
•
6
distributed/gpt2-5b
Feature Extraction
•
5B
•
Updated
•
10
distributed/gpt2-250m-convergence-test-v2
Text Generation
•
0.1B
•
Updated
•
9
distributed/gpt2-124m-convergence-test
Feature Extraction
•
0.1B
•
Updated
•
9
distributed/gpt2-124m
Feature Extraction
•
0.1B
•
Updated
•
10
distributed/gpt2-500m
Feature Extraction
•
0.5B
•
Updated
•
37