talk-llama : update to latest llama.cpp (improved performance)

This commit is contained in:
Georgi Gerganov
2023-04-10 22:59:13 +03:00
parent 69b8503935
commit ea36831459
4 changed files with 1324 additions and 845 deletions

View File

@@ -0,0 +1,12 @@
// Internal header to be included by llama.cpp and tests/benchmarks only.
#ifndef LLAMA_INTERNAL_H
#define LLAMA_INTERNAL_H
#include <string>
#include <utility>
#include <vector>
// Forward declarations: only pointers to these types are used in this header,
// so their full definitions are not needed here.
struct ggml_tensor;
struct llama_context;

// Returns a mutable reference to a list of (name, tensor pointer) pairs for the
// given context. Because the result is a non-const reference, callers can
// modify the list in place.
// NOTE(review): the returned reference presumably remains valid only while
// `ctx` is alive - confirm against the definition in llama.cpp.
std::vector<std::pair<std::string, ggml_tensor *>> & llama_internal_get_tensor_map(llama_context * ctx);
#endif // LLAMA_INTERNAL_H