feat: GPT-OSS models Token Limits & Rates

This commit is contained in:
Danny Avila 2025-08-07 15:03:19 -04:00
parent b9f72f4869
commit d95d8032cc
No known key found for this signature in database
GPG key ID: BF31EEB2C5CA0956
4 changed files with 51 additions and 4 deletions

View file

@ -1,4 +1,4 @@
const { matchModelName } = require('../utils');
const { matchModelName } = require('../utils/tokens');
const defaultRate = 6;
/**
@ -147,6 +147,9 @@ const tokenValues = Object.assign(
codestral: { prompt: 0.3, completion: 0.9 },
'ministral-8b': { prompt: 0.1, completion: 0.1 },
'ministral-3b': { prompt: 0.04, completion: 0.04 },
// GPT-OSS models
'gpt-oss-20b': { prompt: 0.05, completion: 0.2 },
'gpt-oss-120b': { prompt: 0.15, completion: 0.6 },
},
bedrockValues,
);