| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| #include "gemma/common.h" |
|
|
| #include <stddef.h> |
| #include <string.h> |
|
|
| #include <algorithm> |
| #include <cctype> |
| #include <string> |
| #include <vector> |
|
|
| #include "hwy/base.h" |
| #include "hwy/contrib/thread_pool/thread_pool.h" |
|
|
| namespace gcpp { |
|
|
// Accepted model flag strings, all lowercase. Entry i belongs together with
// kModelTypes[i] and kModelTraining[i], so the three tables must be edited in
// lockstep.
constexpr const char* kModelFlags[] = {
    "2b-pt",
    "2b-it",
    "7b-pt",
    "7b-it",
    "9b-pt",
    "9b-it",
    "27b-pt",
    "27b-it",
    "gr2b-pt",
    "gr2b-it",
    "tiny",
};
| constexpr Model kModelTypes[] = { |
| Model::GEMMA_2B, Model::GEMMA_2B, |
| Model::GEMMA_7B, Model::GEMMA_7B, |
| Model::GEMMA_9B, Model::GEMMA_9B, |
| Model::GEMMA_27B, Model::GEMMA_27B, |
| Model::GRIFFIN_2B, Model::GRIFFIN_2B, |
| Model::GEMMA_TINY, |
| }; |
| constexpr ModelTraining kModelTraining[] = { |
| ModelTraining::GEMMA_PT, ModelTraining::GEMMA_IT, |
| ModelTraining::GEMMA_PT, ModelTraining::GEMMA_IT, |
| ModelTraining::GEMMA_PT, ModelTraining::GEMMA_IT, |
| ModelTraining::GEMMA_PT, ModelTraining::GEMMA_IT, |
| ModelTraining::GEMMA_PT, ModelTraining::GEMMA_IT, |
| ModelTraining::GEMMA_IT, |
| }; |
|
|
| constexpr size_t kNumModelFlags = std::end(kModelFlags) - std::begin(kModelFlags); |
| static_assert(kNumModelFlags == |
| std::end(kModelTypes) - std::begin(kModelTypes)); |
| static_assert(kNumModelFlags == |
| std::end(kModelTraining) - std::begin(kModelTraining)); |
|
|
| const char* ParseModelTypeAndTraining(const std::string& model_flag, |
| Model& model, ModelTraining& training) { |
| static char kErrorMessageBuffer[kNumModelFlags * 8 + 1024] = |
| "Invalid or missing model flag, need to specify one of "; |
| for (size_t i = 0; i + 1 < kNumModelFlags; i++) { |
| strcat(kErrorMessageBuffer, kModelFlags[i]); |
| strcat(kErrorMessageBuffer, ", "); |
| } |
| strcat(kErrorMessageBuffer, kModelFlags[kNumModelFlags - 1]); |
| strcat(kErrorMessageBuffer, "."); |
|
|
| std::string model_type_lc = model_flag; |
| std::transform(begin(model_type_lc), end(model_type_lc), begin(model_type_lc), |
| [](unsigned char c) { return std::tolower(c); }); |
|
|
| for (size_t i = 0; i < kNumModelFlags; i++) { |
| if (kModelFlags[i] == model_type_lc) { |
| model = kModelTypes[i]; |
| training = kModelTraining[i]; |
| HWY_ASSERT(std::string(ModelString(model, training)) == model_type_lc); |
| return nullptr; |
| } |
| } |
| return kErrorMessageBuffer; |
| } |
|
|
| const char* ModelString(Model model, ModelTraining training) { |
| for (size_t i = 0; i < kNumModelFlags; i++) { |
| if (kModelTypes[i] == model && kModelTraining[i] == training) |
| return kModelFlags[i]; |
| } |
| HWY_ABORT("Unknown model %d training %d\n", static_cast<int>(model), |
| static_cast<int>(training)); |
| } |
|
|
// Lowercase names of the supported types. StringFromType and ParseType treat
// the array index as the numeric value of the Type enum, so the order here
// must match that enum.
constexpr const char* kTypeStrings[] = {
    "f32",
    "bf16",
    "sfp",
};
|
|
| const char* StringFromType(Type type) { |
| return kTypeStrings[static_cast<size_t>(type)]; |
| } |
|
|
| const char* ParseType(const std::string& type_string, Type& type) { |
| constexpr size_t kNum = std::end(kTypeStrings) - std::begin(kTypeStrings); |
| static char kErrorMessageBuffer[kNum * 8 + 100] = |
| "Invalid or missing type, need to specify one of "; |
| for (size_t i = 0; i + 1 < kNum; i++) { |
| strcat(kErrorMessageBuffer, kTypeStrings[i]); |
| strcat(kErrorMessageBuffer, ", "); |
| } |
| strcat(kErrorMessageBuffer, kTypeStrings[kNum - 1]); |
| strcat(kErrorMessageBuffer, "."); |
| std::string type_lc = type_string; |
| std::transform(begin(type_lc), end(type_lc), begin(type_lc), |
| [](unsigned char c) { return std::tolower(c); }); |
| for (size_t i = 0; i < kNum; i++) { |
| if (kTypeStrings[i] == type_lc) { |
| type = static_cast<Type>(i); |
| HWY_ASSERT(std::string(StringFromType(type)) == type_lc); |
| return nullptr; |
| } |
| } |
| return kErrorMessageBuffer; |
| } |
|
|
| } |
|
|