File size: 437 Bytes
1d031b5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
# Metadata describing one packaged model build and the settings it was
# produced with. Everything lives under the single `model_info` mapping.
model_info:
  name: anemll-DeepSeekR1-8B-ctx1024
  # Quoted so the value is always read as a string, never as a number.
  version: '0.1.1'
  # Literal block scalar: line breaks are preserved and the value ends with
  # a single trailing newline. The figures below repeat the corresponding
  # entries under `parameters`; keep the two in sync when editing.
  description: |
    Demonstrates running DeepSeekR1-8B on Apple Neural Engine
    Context length: 1024
    Batch size: 64
    Chunks: 8
  license: MIT
  author: Anemll
  framework: Core ML
  language: Python
  # Machine-readable build settings.
  parameters:
    context_length: 1024
    batch_size: 64
    # Plain scalar `none` is the *string* "none" in YAML, not a null value
    # (YAML null is spelled `null` or `~`).
    # NOTE(review): presumably means the embeddings carry no LUT
    # quantization - confirm against the consuming tool.
    lut_embeddings: none
    # NOTE(review): the two values below look like LUT quantization
    # bit-widths for the FFN and LM-head parts - confirm.
    lut_ffn: 6
    lut_lmhead: 6
    # Same count as "Chunks: 8" in the description above.
    num_chunks: 8
    # NOTE(review): presumably the filename prefix of the model artifacts -
    # verify against the loader.
    model_prefix: DeepSeek