@@ -4766,6 +4766,13 @@ export class NanoChatModel extends NanoChatPreTrainedModel {}
// NanoChat causal-LM class: an empty subclass of NanoChatPreTrainedModel, so it
// declares no members of its own. It is the class registered under the
// 'nanochat' key in MODEL_FOR_CAUSAL_LM_MAPPING_NAMES.
47664766export class NanoChatForCausalLM extends NanoChatPreTrainedModel { }
47674767//////////////////////////////////////////////////
47684768
4769+ //////////////////////////////////////////////////
4770+ // Apertus models
// Common parent of ApertusModel and ApertusForCausalLM. The body is empty, so
// everything it offers is inherited from PreTrainedModel.
4771+ export class ApertusPreTrainedModel extends PreTrainedModel { }
// Apertus model class: an empty subclass of ApertusPreTrainedModel. It is the
// class registered under the 'apertus' key in MODEL_MAPPING_NAMES_DECODER_ONLY.
4772+ export class ApertusModel extends ApertusPreTrainedModel { }
// Apertus causal-LM class: an empty subclass of ApertusPreTrainedModel. It is
// the class registered under the 'apertus' key in
// MODEL_FOR_CAUSAL_LM_MAPPING_NAMES.
4773+ export class ApertusForCausalLM extends ApertusPreTrainedModel { }
4774+ //////////////////////////////////////////////////
4775+
47694776//////////////////////////////////////////////////
47704777// Arcee models
// Empty subclass of PreTrainedModel for the Arcee family; declares no members
// of its own.
// NOTE(review): presumably the parent of ArceeModel / ArceeForCausalLM, whose
// declarations are not visible in this hunk — confirm.
47714778export class ArceePreTrainedModel extends PreTrainedModel { }
@@ -8259,6 +8266,7 @@ const MODEL_MAPPING_NAMES_DECODER_ONLY = new Map([
82598266 [ 'gpt_neox' , [ 'GPTNeoXModel' , GPTNeoXModel ] ] ,
82608267 [ 'codegen' , [ 'CodeGenModel' , CodeGenModel ] ] ,
82618268 [ 'llama' , [ 'LlamaModel' , LlamaModel ] ] ,
8269+ [ 'apertus' , [ 'ApertusModel' , ApertusModel ] ] ,
82628270 [ 'nanochat' , [ 'NanoChatModel' , NanoChatModel ] ] ,
82638271 [ 'arcee' , [ 'ArceeModel' , ArceeModel ] ] ,
82648272 [ 'lfm2' , [ 'Lfm2Model' , Lfm2Model ] ] ,
@@ -8372,6 +8380,7 @@ const MODEL_FOR_CAUSAL_LM_MAPPING_NAMES = new Map([
83728380 [ 'codegen' , [ 'CodeGenForCausalLM' , CodeGenForCausalLM ] ] ,
83738381 [ 'llama' , [ 'LlamaForCausalLM' , LlamaForCausalLM ] ] ,
83748382 [ 'nanochat' , [ 'NanoChatForCausalLM' , NanoChatForCausalLM ] ] ,
8383+ [ 'apertus' , [ 'ApertusForCausalLM' , ApertusForCausalLM ] ] ,
83758384 [ 'llama4_text' , [ 'Llama4ForCausalLM' , Llama4ForCausalLM ] ] ,
83768385 [ 'arcee' , [ 'ArceeForCausalLM' , ArceeForCausalLM ] ] ,
83778386 [ 'lfm2' , [ 'Lfm2ForCausalLM' , Lfm2ForCausalLM ] ] ,
0 commit comments