* use ggml_*_split activations when possible * forward qkv |
||
|---|---|---|
| .. | ||
| fast | ||
| pooling | ||
| rope | ||
| attention.go | ||
| convolution.go | ||
| embedding.go | ||
| linear.go | ||
| normalization.go | ||
* use ggml_*_split activations when possible * forward qkv |
||
|---|---|---|
| .. | ||
| fast | ||
| pooling | ||
| rope | ||
| attention.go | ||
| convolution.go | ||
| embedding.go | ||
| linear.go | ||
| normalization.go | ||