test-arg-parser.cpp 7.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197
  1. #include "arg.h"
  2. #include "common.h"
  3. #include <string>
  4. #include <vector>
  5. #include <sstream>
  6. #include <unordered_set>
  7. #undef NDEBUG
  8. #include <cassert>
  9. int main(void) {
  10. common_params params;
  11. printf("test-arg-parser: make sure there is no duplicated arguments in any examples\n\n");
  12. for (int ex = 0; ex < LLAMA_EXAMPLE_COUNT; ex++) {
  13. try {
  14. auto ctx_arg = common_params_parser_init(params, (enum llama_example)ex);
  15. std::unordered_set<std::string> seen_args;
  16. std::unordered_set<std::string> seen_env_vars;
  17. for (const auto & opt : ctx_arg.options) {
  18. // check for args duplications
  19. for (const auto & arg : opt.get_args()) {
  20. if (seen_args.find(arg) == seen_args.end()) {
  21. seen_args.insert(arg);
  22. } else {
  23. fprintf(stderr, "test-arg-parser: found different handlers for the same argument: %s", arg.c_str());
  24. exit(1);
  25. }
  26. }
  27. // check for env var duplications
  28. for (const auto & env : opt.get_env()) {
  29. if (seen_env_vars.find(env) == seen_env_vars.end()) {
  30. seen_env_vars.insert(env);
  31. } else {
  32. fprintf(stderr, "test-arg-parser: found different handlers for the same env var: %s", env.c_str());
  33. exit(1);
  34. }
  35. }
  36. // ensure shorter argument precedes longer argument
  37. if (opt.args.size() > 1) {
  38. const std::string first(opt.args.front());
  39. const std::string last(opt.args.back());
  40. if (first.length() > last.length()) {
  41. fprintf(stderr, "test-arg-parser: shorter argument should come before longer one: %s, %s\n",
  42. first.c_str(), last.c_str());
  43. assert(false);
  44. }
  45. }
  46. // same check for negated arguments
  47. if (opt.args_neg.size() > 1) {
  48. const std::string first(opt.args_neg.front());
  49. const std::string last(opt.args_neg.back());
  50. if (first.length() > last.length()) {
  51. fprintf(stderr, "test-arg-parser: shorter negated argument should come before longer one: %s, %s\n",
  52. first.c_str(), last.c_str());
  53. assert(false);
  54. }
  55. }
  56. }
  57. } catch (std::exception & e) {
  58. printf("%s\n", e.what());
  59. assert(false);
  60. }
  61. }
  62. auto list_str_to_char = [](std::vector<std::string> & argv) -> std::vector<char *> {
  63. std::vector<char *> res;
  64. for (auto & arg : argv) {
  65. res.push_back(const_cast<char *>(arg.data()));
  66. }
  67. return res;
  68. };
  69. std::vector<std::string> argv;
  70. printf("test-arg-parser: test invalid usage\n\n");
  71. // missing value
  72. argv = {"binary_name", "-m"};
  73. assert(false == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  74. // wrong value (int)
  75. argv = {"binary_name", "-ngl", "hello"};
  76. assert(false == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  77. // wrong value (enum)
  78. argv = {"binary_name", "-sm", "hello"};
  79. assert(false == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  80. // non-existence arg in specific example (--draft cannot be used outside llama-speculative)
  81. argv = {"binary_name", "--draft", "123"};
  82. assert(false == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_EMBEDDING));
  83. // negated arg
  84. argv = {"binary_name", "--no-mmap"};
  85. assert(false == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  86. printf("test-arg-parser: test valid usage\n\n");
  87. argv = {"binary_name", "-m", "model_file.gguf"};
  88. assert(true == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  89. assert(params.model.path == "model_file.gguf");
  90. argv = {"binary_name", "-t", "1234"};
  91. assert(true == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  92. assert(params.cpuparams.n_threads == 1234);
  93. argv = {"binary_name", "--verbose"};
  94. assert(true == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  95. assert(params.verbosity > 1);
  96. argv = {"binary_name", "-m", "abc.gguf", "--predict", "6789", "--batch-size", "9090"};
  97. assert(true == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  98. assert(params.model.path == "abc.gguf");
  99. assert(params.n_predict == 6789);
  100. assert(params.n_batch == 9090);
  101. // --draft cannot be used outside llama-speculative
  102. argv = {"binary_name", "--draft", "123"};
  103. assert(true == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_SPECULATIVE));
  104. assert(params.speculative.n_max == 123);
  105. // skip this part on windows, because setenv is not supported
  106. #ifdef _WIN32
  107. printf("test-arg-parser: skip on windows build\n");
  108. #else
  109. printf("test-arg-parser: test environment variables (valid + invalid usages)\n\n");
  110. setenv("LLAMA_ARG_THREADS", "blah", true);
  111. argv = {"binary_name"};
  112. assert(false == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  113. setenv("LLAMA_ARG_MODEL", "blah.gguf", true);
  114. setenv("LLAMA_ARG_THREADS", "1010", true);
  115. argv = {"binary_name"};
  116. assert(true == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  117. assert(params.model.path == "blah.gguf");
  118. assert(params.cpuparams.n_threads == 1010);
  119. printf("test-arg-parser: test negated environment variables\n\n");
  120. setenv("LLAMA_ARG_MMAP", "0", true);
  121. setenv("LLAMA_ARG_NO_PERF", "1", true); // legacy format
  122. argv = {"binary_name"};
  123. assert(true == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  124. assert(params.use_mmap == false);
  125. assert(params.no_perf == true);
  126. printf("test-arg-parser: test environment variables being overwritten\n\n");
  127. setenv("LLAMA_ARG_MODEL", "blah.gguf", true);
  128. setenv("LLAMA_ARG_THREADS", "1010", true);
  129. argv = {"binary_name", "-m", "overwritten.gguf"};
  130. assert(true == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_COMMON));
  131. assert(params.model.path == "overwritten.gguf");
  132. assert(params.cpuparams.n_threads == 1010);
  133. #endif // _WIN32
  134. printf("test-arg-parser: test curl-related functions\n\n");
  135. const char * GOOD_URL = "http://ggml.ai/";
  136. const char * BAD_URL = "http://ggml.ai/404";
  137. {
  138. printf("test-arg-parser: test good URL\n\n");
  139. auto res = common_remote_get_content(GOOD_URL, {});
  140. assert(res.first == 200);
  141. assert(res.second.size() > 0);
  142. std::string str(res.second.data(), res.second.size());
  143. assert(str.find("llama.cpp") != std::string::npos);
  144. }
  145. {
  146. printf("test-arg-parser: test bad URL\n\n");
  147. auto res = common_remote_get_content(BAD_URL, {});
  148. assert(res.first == 404);
  149. }
  150. {
  151. printf("test-arg-parser: test max size error\n");
  152. common_remote_params params;
  153. params.max_size = 1;
  154. try {
  155. common_remote_get_content(GOOD_URL, params);
  156. assert(false && "it should throw an error");
  157. } catch (std::exception & e) {
  158. printf(" expected error: %s\n\n", e.what());
  159. }
  160. }
  161. printf("test-arg-parser: all tests OK\n\n");
  162. }