Skip to content

Commit 11a6bfc

Browse files
authored
Add support for Apertus (#1465)
1 parent 41d618b commit 11a6bfc

File tree

2 files changed

+10
-0
lines changed

2 files changed

+10
-0
lines changed

src/configs.js

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -111,6 +111,7 @@ function getNormalizedConfig(config) {
111111
case 'llama':
112112
case 'llama4_text':
113113
case 'nanochat':
114+
case 'apertus':
114115
case 'arcee':
115116
case 'lfm2':
116117
case 'smollm3':

src/models.js

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4766,6 +4766,13 @@ export class NanoChatModel extends NanoChatPreTrainedModel {}
47664766
export class NanoChatForCausalLM extends NanoChatPreTrainedModel {}
47674767
//////////////////////////////////////////////////
47684768

4769+
//////////////////////////////////////////////////
4770+
// Apertus models
4771+
/**
 * Base class for the Apertus model classes in this section.
 * It extends `PreTrainedModel` and declares no members of its own.
 */
export class ApertusPreTrainedModel extends PreTrainedModel {}
4772+
/**
 * Empty subclass of `ApertusPreTrainedModel`.
 * Registered under the `'apertus'` key in `MODEL_MAPPING_NAMES_DECODER_ONLY`.
 */
export class ApertusModel extends ApertusPreTrainedModel {}
4773+
/**
 * Empty subclass of `ApertusPreTrainedModel`.
 * Registered under the `'apertus'` key in `MODEL_FOR_CAUSAL_LM_MAPPING_NAMES`.
 */
export class ApertusForCausalLM extends ApertusPreTrainedModel {}
4774+
//////////////////////////////////////////////////
4775+
47694776
//////////////////////////////////////////////////
47704777
// Arcee models
47714778
export class ArceePreTrainedModel extends PreTrainedModel {}
@@ -8259,6 +8266,7 @@ const MODEL_MAPPING_NAMES_DECODER_ONLY = new Map([
82598266
['gpt_neox', ['GPTNeoXModel', GPTNeoXModel]],
82608267
['codegen', ['CodeGenModel', CodeGenModel]],
82618268
['llama', ['LlamaModel', LlamaModel]],
8269+
['apertus', ['ApertusModel', ApertusModel]],
82628270
['nanochat', ['NanoChatModel', NanoChatModel]],
82638271
['arcee', ['ArceeModel', ArceeModel]],
82648272
['lfm2', ['Lfm2Model', Lfm2Model]],
@@ -8372,6 +8380,7 @@ const MODEL_FOR_CAUSAL_LM_MAPPING_NAMES = new Map([
83728380
['codegen', ['CodeGenForCausalLM', CodeGenForCausalLM]],
83738381
['llama', ['LlamaForCausalLM', LlamaForCausalLM]],
83748382
['nanochat', ['NanoChatForCausalLM', NanoChatForCausalLM]],
8383+
['apertus', ['ApertusForCausalLM', ApertusForCausalLM]],
83758384
['llama4_text', ['Llama4ForCausalLM', Llama4ForCausalLM]],
83768385
['arcee', ['ArceeForCausalLM', ArceeForCausalLM]],
83778386
['lfm2', ['Lfm2ForCausalLM', Lfm2ForCausalLM]],

0 commit comments

Comments
 (0)