add arguments

tastelikefeet · tastelikefeet · commit a996e2f8d17e · 2025-03-28T11:45:20.000+08:00
diff --git a/README.md b/README.md
@@ -265,16 +265,24 @@ The [Hugging Face](https://huggingface.co) platform hosts a [number of LLMs](htt
 
 You can either manually download the GGUF file or directly use any `llama.cpp`-compatible models from Hugging Face by using this CLI argument: `-hf <user>/<model>[:quant]`
 
-llama.cpp also supports downloading and running models from [ModelScope](https://www.modelscope.cn/home), just add an env variable: `LLAMACPP_USE_MODELSCOPE=True` to your command with the same arguments(like `-hf <user>/<model>[:quant]`).
+llama.cpp also supports downloading and running models from [ModelScope](https://www.modelscope.cn/home). There are two ways to use ModelScope models:
+
+1. Add the environment variable `LLAMACPP_USE_MODELSCOPE=True` to your command and use the same arguments as for Hugging Face (e.g. `-hf <user>/<model>[:quant]`).
 
 ```shell
 LLAMACPP_USE_MODELSCOPE=True llama-cli -hf Qwen/QwQ-32B-GGUF
 ```
 
-Pay attention to change the model repo to the **existing repo** of ModelScope. If you want to use a private repo, please make sure you have the rights of the repo and run with the `--hf_token` argument:
+2. Use the ModelScope arguments instead of the Hugging Face ones: `-ms <user>/<model>[:quant] -msf xxx.gguf -mst xxx_token`
+
+```shell
+llama-cli -ms Qwen/QwQ-32B-GGUF
+```
+
+Make sure the model repo you specify is an **existing repo** on ModelScope. If you want to use a private repo, make sure you have access rights to it and run with the `--ms_token` argument:
 
 ```shell
-LLAMACPP_USE_MODELSCOPE=True llama-cli -hf Qwen/QwQ-32B-GGUF --hf_token xxx
+llama-cli -ms Qwen/QwQ-32B-GGUF --ms_token xxx
 ```
 
 > You can change the endpoint of ModelScope by using `MODELSCOPE_DOMAIN=xxx`(like MODELSCOPE_DOMAIN=www.modelscope.ai).
diff --git a/common/arg.cpp b/common/arg.cpp
@@ -34,6 +34,14 @@ common_arg & common_arg::set_env(const char * env) {
     return *this;
 }
 
+static void set_ms_env() { // sets LLAMACPP_USE_MODELSCOPE=True in this process's environment
+#ifdef _WIN32
+    SetEnvironmentVariableA("LLAMACPP_USE_MODELSCOPE", "True"); // Win32 API counterpart of the setenv() call below
+#else
+    setenv("LLAMACPP_USE_MODELSCOPE", "True", 1); // third argument 1: overwrite an existing value
+#endif
+}
+
 common_arg & common_arg::set_sparam() {
     is_sparam = true;
     return *this;
@@ -211,6 +219,10 @@ static bool common_params_parse_ex(int argc, char ** argv, common_params_context
     std::string arg;
     const std::string arg_prefix = "--";
     common_params & params = ctx_arg.params;
+    std::vector<std::string> ms_params = {
+        "-ms", "-msr", "--ms-repo",
+        "-msv", "-msrv", "--ms-repo-v"
+    };
 
     std::unordered_map<std::string, common_arg *> arg_to_options;
     for (auto & opt : ctx_arg.options) {
@@ -224,6 +236,18 @@ static bool common_params_parse_ex(int argc, char ** argv, common_params_context
         std::string value;
         if (opt.get_value_from_env(value)) {
             try {
+                for (auto msp: ms_params) {
+                    bool ms_arg = false;
+                    for (auto _arg: opt.args) {
+                        if (std::string(_arg) == msp) {
+                            ms_arg = true;
+                        }
+                    }
+                    if (ms_arg && !value.empty()) {
+                        set_ms_env();
+                        break;
+                    }
+                }
                 if (opt.handler_void && (value == "1" || value == "true")) {
                     opt.handler_void(params);
                 }
@@ -271,6 +295,15 @@ static bool common_params_parse_ex(int argc, char ** argv, common_params_context
             // arg with single value
             check_arg(i);
             std::string val = argv[++i];
+
+            for (auto msp: ms_params) {
+                // Check whether is modelscope params
+                if (msp == arg && !val.empty()) {
+                    set_ms_env();
+                    break;
+                }
+            }
+
             if (opt.handler_int) {
                 opt.handler_int(params, std::stoi(val));
                 continue;
@@ -1849,6 +1882,43 @@ common_params_context common_params_parser_init(common_params & params, llama_ex
             params.hf_token = value;
         }
     ).set_env("HF_TOKEN"));
+    add_opt(common_arg(
+        {"-ms", "-msr", "--ms-repo"}, "<user>/<model>[:quant]",
+        "ModelScope model repository; quant is optional, case-insensitive, default to Q4_K_M, or falls back to the first file in the repo if Q4_K_M doesn't exist.\n"
+        "example: unsloth/phi-4-GGUF:q4_k_m\n"
+        "(default: unused)",
+        [](common_params & params, const std::string & value) {
+            params.hf_repo = value;
+        }
+    ).set_env("LLAMA_ARG_MS_REPO"));
+    add_opt(common_arg(
+        {"-msf", "--ms-file"}, "FILE",
+        "ModelScope model file. If specified, it will override the quant in --ms-repo (default: unused)",
+        [](common_params & params, const std::string & value) {
+            params.hf_file = value;
+        }
+    ).set_env("LLAMA_ARG_MS_FILE"));
+    add_opt(common_arg(
+        {"-msv", "-msrv", "--ms-repo-v"}, "<user>/<model>[:quant]",
+        "ModelScope model repository for the vocoder model (default: unused)",
+        [](common_params & params, const std::string & value) {
+            params.vocoder.hf_repo = value;
+        }
+    ).set_env("LLAMA_ARG_MS_REPO_V"));
+    add_opt(common_arg(
+        {"-msfv", "--ms-file-v"}, "FILE",
+        "ModelScope model file for the vocoder model (default: unused)",
+        [](common_params & params, const std::string & value) {
+            params.vocoder.hf_file = value;
+        }
+    ).set_env("LLAMA_ARG_MS_FILE_V"));
+    add_opt(common_arg(
+        {"-mst", "--ms-token"}, "TOKEN",
+        "ModelScope access token (default: value from MS_TOKEN environment variable)",
+        [](common_params & params, const std::string & value) {
+            params.hf_token = value;
+        }
+    ).set_env("MS_TOKEN"));
     add_opt(common_arg(
         {"--context-file"}, "FNAME",
         "file to load context from (repeat to specify multiple files)",
diff --git a/common/common.cpp b/common/common.cpp
@@ -1229,8 +1229,6 @@ static bool common_download_file(const std::string & url, const std::string & pa
         return false;
     }
 
-    bool force_download = false;
-
     // Set the URL, allow to follow http redirection
     curl_easy_setopt(curl.get(), CURLOPT_URL, url.c_str());
     curl_easy_setopt(curl.get(), CURLOPT_FOLLOWLOCATION, 1L);
@@ -1329,6 +1327,7 @@ static bool common_download_file(const std::string & url, const std::string & pa
         curl_easy_setopt(curl.get(), CURLOPT_HEADERFUNCTION, static_cast<CURLOPT_HEADERFUNCTION_PTR>(header_callback));
         curl_easy_setopt(curl.get(), CURLOPT_HEADERDATA, &headers);
         if (!LLAMACPP_USE_MODELSCOPE_DEFINITION) {
+            bool force_download = false;
             bool was_perform_successful = curl_perform_with_retry(url, curl.get(), CURL_MAX_RETRY, CURL_RETRY_DELAY_SECONDS);
             if (!was_perform_successful) {
                 return false;