| CMakeLists.txt |
|
1350 |
| llama-adapter.cpp |
.mem_size = |
14194 |
| llama-adapter.h |
|
1755 |
| llama-arch.cpp |
|
154367 |
| llama-arch.h |
|
13567 |
| llama-batch.cpp |
|
26576 |
| llama-batch.h |
|
5925 |
| llama-chat.cpp |
|
34400 |
| llama-chat.h |
|
1897 |
| llama-context.cpp |
|
97255 |
| llama-context.h |
|
9742 |
| llama-cparams.cpp |
|
100 |
| llama-cparams.h |
|
1019 |
| llama-grammar.cpp |
|
45005 |
| llama-grammar.h |
|
6135 |
| llama-graph.cpp |
|
63345 |
| llama-graph.h |
|
28140 |
| llama-hparams.cpp |
|
3697 |
| llama-hparams.h |
|
7175 |
| llama-impl.cpp |
|
6020 |
| llama-impl.h |
do nothing |
1809 |
| llama-io.cpp |
|
380 |
| llama-io.h |
|
788 |
| llama-kv-cache-unified-iswa.cpp |
|
9936 |
| llama-kv-cache-unified-iswa.h |
|
4152 |
| llama-kv-cache-unified.cpp |
.mem_size = |
78733 |
| llama-kv-cache-unified.h |
|
12745 |
| llama-kv-cells.h |
|
12133 |
| llama-memory-hybrid.cpp |
attn |
8485 |
| llama-memory-hybrid.h |
attn |
4479 |
| llama-memory-recurrent.cpp |
.mem_size = |
37759 |
| llama-memory-recurrent.h |
|
5759 |
| llama-memory.cpp |
|
1534 |
| llama-memory.h |
|
4184 |
| llama-mmap.cpp |
|
19049 |
| llama-mmap.h |
|
1428 |
| llama-model-loader.cpp |
|
56546 |
| llama-model-loader.h |
|
7550 |
| llama-model-saver.cpp |
|
14337 |
| llama-model-saver.h |
|
1052 |
| llama-model.cpp |
|
836169 |
| llama-model.h |
|
15991 |
| llama-quant.h |
|
13 |
| llama-sampling.cpp |
// Converts the `size` logits stored in `array` into log-probabilities, in place
// (log-softmax).
//
// array: pointer to `size` floats; each element x is overwritten with
//        (x - max) - log(sum_j exp(x_j - max)).
// size:  number of elements in `array`; the call is a no-op when it is 0.
//
// The maximum is subtracted before exponentiating so expf() cannot overflow.
// The result is formed directly in log space rather than as
// log(exp(x - max) / sum): the latter yields -inf whenever exp(x - max)
// underflows to zero, even though the true log-probability is finite.
static void llama_log_softmax(float * array, size_t size) {
    // std::max_element on an empty range returns the end pointer, which must
    // not be dereferenced.
    if (size == 0) {
        return;
    }

    const float max_l = *std::max_element(array, array + size);

    // The maximum element contributes exp(0) == 1, so for finite inputs
    // sum >= 1 and logf(sum) is finite.
    float sum = 0.f;
    for (size_t i = 0; i < size; ++i) {
        sum += expf(array[i] - max_l);
    }
    const float log_sum = logf(sum);

    for (size_t i = 0; i < size; ++i) {
        array[i] = (array[i] - max_l) - log_sum;
    }
}
|
85954 |
| llama-sampling.h |
|
754 |
| llama-vocab.cpp |
vocab |
149925 |
| llama-vocab.h |
|
5990 |
| llama.cpp |
.no_perf = |
19806 |
| unicode-data.cpp |
|
169029 |
| unicode-data.h |
|
630 |
| unicode.cpp |
0x0000 <= cpt && |
41913 |
| unicode.h |
|
2228 |