} break;
case LLM_ARCH_MODERN_BERT:
{
- llm = std::make_unique<llm_build_modern_bert<true>>(*this, params);
+ llm = std::make_unique<llm_build_modern_bert>(*this, params);
} break;
case LLM_ARCH_NEO_BERT:
{
llm_build_mistral3(const llama_model & model, const llm_graph_params & params);
};
-template <bool iswa>
// Graph-building context used for the LLM_ARCH_MODERN_BERT architecture
// (created with std::make_unique in the architecture switch).
// Derives from llm_graph_context; all of the work happens in the constructor.
struct llm_build_modern_bert : public llm_graph_context {
// model  - the llama_model the graph is built for (queried per layer for the
//          RoPE frequency base via get_rope_freq_base).
// params - graph parameters, forwarded to the llm_graph_context base.
llm_build_modern_bert(const llama_model & model, const llm_graph_params & params);
};
#include "models.h"
-template <bool iswa>
-llm_build_modern_bert<iswa>::llm_build_modern_bert(const llama_model & model, const llm_graph_params & params) : llm_graph_context(params) {
+llm_build_modern_bert::llm_build_modern_bert(const llama_model & model, const llm_graph_params & params) : llm_graph_context(params) {
const int64_t n_embd_head = hparams.n_embd_head_v;
const int64_t n_embd_gqa = hparams.n_embd_v_gqa();
auto * inp_attn = build_attn_inp_no_cache();
for (int il = 0; il < n_layer; ++il) {
- float freq_base_l = 0.0f;
-
- if constexpr (iswa) {
- freq_base_l = model.get_rope_freq_base(cparams, il);
- } else {
- freq_base_l = freq_base;
- }
+ float freq_base_l = model.get_rope_freq_base(cparams, il);
cur = inpL;
res->t_embd = cur;
ggml_build_forward_expand(gf, cur);
}
-
-// Explicit template instantiations
-template struct llm_build_modern_bert<false>;
-template struct llm_build_modern_bert<true>;