llama : clean-up

ggerganov · ggerganov · commit fe28a7b9d8d0 · 2024-07-23T08:38:50.000+03:00
diff --git a/src/llama-impl.h b/src/llama-impl.h
@@ -3,24 +3,6 @@
 #define LLAMA_API_INTERNAL
 #include "llama.h"
 
-#ifdef __has_include
-    #if __has_include(<unistd.h>)
-        #include <unistd.h>
-        #if defined(_POSIX_MAPPED_FILES)
-            #include <sys/mman.h>
-            #include <fcntl.h>
-        #endif
-        #if defined(_POSIX_MEMLOCK_RANGE)
-            #include <sys/resource.h>
-        #endif
-    #endif
-#endif
-
-// bump if necessary
-#define LLAMA_MAX_NODES   8192
-#define LLAMA_MAX_LAYERS  512
-#define LLAMA_MAX_EXPERTS 160  // DeepSeekV2
-
 #ifdef __GNUC__
 #ifdef __MINGW32__
 #define LLAMA_ATTRIBUTE_FORMAT(...) __attribute__((format(gnu_printf, __VA_ARGS__)))
diff --git a/src/llama-sampling.h b/src/llama-sampling.h
@@ -18,8 +18,6 @@ struct llama_sampling {
     }
 };
 
-struct llama_sampling * llama_get_sampling(struct llama_context * ctx);
-
 //
 // internal API
 //
diff --git a/src/llama-vocab.h b/src/llama-vocab.h
@@ -62,7 +62,6 @@ struct llama_vocab {
 };
 
 const struct llama_vocab * llama_get_vocab(const struct llama_context * ctx);
-const struct llama_vocab * llama_get_vocab(const struct llama_model   * model);
 
 //
 // internal API
diff --git a/src/llama.cpp b/src/llama.cpp
@@ -36,6 +36,19 @@
 // TODO: replace with ggml API call
 #define QK_K 256
 
+#ifdef __has_include
+    #if __has_include(<unistd.h>)
+        #include <unistd.h>
+        #if defined(_POSIX_MAPPED_FILES)
+            #include <sys/mman.h>
+            #include <fcntl.h>
+        #endif
+        #if defined(_POSIX_MEMLOCK_RANGE)
+            #include <sys/resource.h>
+        #endif
+    #endif
+#endif
+
 #if defined(_WIN32)
     #define WIN32_LEAN_AND_MEAN
     #ifndef NOMINMAX
@@ -87,6 +100,11 @@
 #pragma warning(disable: 4244 4267) // possible loss of data
 #endif
 
+// bump if necessary
+#define LLAMA_MAX_NODES   8192
+#define LLAMA_MAX_LAYERS  512
+#define LLAMA_MAX_EXPERTS 160  // DeepSeekV2
+
 //
 // helpers
 //
@@ -16794,14 +16812,6 @@ const struct llama_vocab * llama_get_vocab(const struct llama_context * ctx) {
     return &ctx->model.vocab;
 }
 
-const struct llama_vocab * llama_get_vocab(const struct llama_model * model) {
-    return &model->vocab;
-}
-
-struct llama_sampling * llama_get_sampling(struct llama_context * ctx) {
-    return &ctx->sampling;
-}
-
 struct llama_grammar * llama_get_grammar(struct llama_context * ctx) {
     return &ctx->grammar;
 }
diff --git a/src/unicode.h b/src/unicode.h
@@ -4,6 +4,8 @@
 #include <string>
 #include <vector>
 
+// TODO: prefix all symbols with "llama_"
+
 struct codepoint_flags {
     enum {
         UNDEFINED       = 0x0001,

Original file line number	Diff line number	Diff line change
`@@ -18,8 +18,6 @@ struct llama_sampling {`
`18`	`18`	`}`
`19`	`19`	`};`
`20`	`20`
`21`		`-struct llama_sampling * llama_get_sampling(struct llama_context * ctx);`
`22`		`-`
`23`	`21`	`//`
`24`	`22`	`// internal API`
`25`	`23`	`//`