Portkey-AI · VisargD · Apr 22, 2025 · Apr 12, 2025 · Apr 13, 2025 · Apr 21, 2025
diff --git a/src/globals.ts b/src/globals.ts
@@ -91,6 +91,7 @@ export const NEBIUS: string = 'nebius';
 export const RECRAFTAI: string = 'recraft-ai';
 export const MILVUS: string = 'milvus';
 export const REPLICATE: string = 'replicate';
+export const LEPTON: string = 'lepton'; // Provider identifier for Lepton; listed in VALID_PROVIDERS below.
 
 export const VALID_PROVIDERS = [
   ANTHROPIC,
@@ -147,6 +148,7 @@ export const VALID_PROVIDERS = [
   MILVUS,
   REPLICATE,
   POWERED_BY,
+  LEPTON,
 ];
 
 export const CONTENT_TYPES = {

diff --git a/src/providers/index.ts b/src/providers/index.ts
@@ -55,6 +55,7 @@ import NebiusConfig from './nebius';
 import RecraftAIConfig from './recraft-ai';
 import MilvusConfig from './milvus';
 import ReplicateConfig from './replicate';
+import LeptonConfig from './lepton';
 
 const Providers: { [key: string]: ProviderConfigs } = {
   openai: OpenAIConfig,
@@ -110,6 +111,7 @@ const Providers: { [key: string]: ProviderConfigs } = {
   'recraft-ai': RecraftAIConfig,
   milvus: MilvusConfig,
   replicate: ReplicateConfig,
+  lepton: LeptonConfig,
 };
 
 export default Providers;
diff --git a/src/providers/lepton/api.ts b/src/providers/lepton/api.ts
@@ -0,0 +1,32 @@
+import { ProviderAPIConfig } from '../types';
+
+const LEPTON_API_URL = 'https://api.lepton.ai';
+// Path on the Lepton host for each gateway function this provider serves.
+const LEPTON_ENDPOINTS = new Map<string, string>([
+  ['chatComplete', '/api/v1/chat/completions'],
+  ['complete', '/api/v1/completions'],
+  ['createTranscription', '/api/v1/audio/transcriptions'],
+]);
+
+/**
+ * Request wiring for the Lepton provider: the base URL, the headers sent with
+ * each request, and the endpoint path for each supported gateway function
+ * (chat completion, text completion and audio transcription).
+ */
+const LeptonAPIConfig: ProviderAPIConfig = {
+  getBaseURL: () => LEPTON_API_URL,
+  // Bearer auth on every request; transcription calls additionally declare a
+  // multipart form body through Content-Type.
+  headers: ({ providerOptions, fn }) => {
+    const bearer = `Bearer ${providerOptions.apiKey}`;
+    const requestHeaders: Record<string, string> =
+      fn === 'createTranscription'
+        ? { Authorization: bearer, 'Content-Type': 'multipart/form-data' }
+        : { Authorization: bearer };
+    return requestHeaders;
+  },
+  // Any function without a mapped path resolves to an empty string.
+  getEndpoint: ({ fn }) => LEPTON_ENDPOINTS.get(fn) ?? '',
+};
+
+export default LeptonAPIConfig;
diff --git a/src/providers/lepton/chatComplete.ts b/src/providers/lepton/chatComplete.ts
@@ -0,0 +1,214 @@
+import { LEPTON } from '../../globals';
+import {
+  ChatCompletionResponse,
+  ErrorResponse,
+  ProviderConfig,
+} from '../types';
+import { OpenAIErrorResponseTransform } from '../openai/utils';
+// Lepton chat responses are typed as the shared ChatCompletionResponse; no extra fields are declared.
+interface LeptonChatCompleteResponse extends ChatCompletionResponse {}
+// Chat-completion parameter table for Lepton: each accepted request field maps to a provider param of the same name; only `model` and `messages` are marked required.
+export const LeptonChatCompleteConfig: ProviderConfig = {
+  model: {
+    param: 'model',
+    required: true,
+  },
+  messages: {
+    param: 'messages',
+    required: true,
+  },
+  temperature: {
+    param: 'temperature',
+    default: 0.7, // NOTE(review): how default/min/max are applied is decided by the gateway's request builder, which is not visible here.
+    min: 0,
+    max: 2,
+  },
+  top_p: {
+    param: 'top_p',
+    default: 1,
+    min: 0,
+    max: 1,
+  },
+  n: {
+    param: 'n',
+    default: 1,
+  },
+  max_tokens: {
+    param: 'max_tokens',
+    default: 256,
+    min: 0,
+  },
+  stop: {
+    param: 'stop',
+  },
+  stream: {
+    param: 'stream',
+    default: false,
+  },
+  stream_options: {
+    param: 'stream_options',
+  },
+  presence_penalty: {
+    param: 'presence_penalty',
+    default: 0,
+    min: -2,
+    max: 2,
+  },
+  frequency_penalty: {
+    param: 'frequency_penalty',
+    default: 0,
+    min: -2,
+    max: 2,
+  },
+  logit_bias: {
+    param: 'logit_bias',
+  },
+  user: {
+    param: 'user',
+  },
+  tools: {
+    param: 'tools',
+  },
+  seed: {
+    param: 'seed',
+  },
+  logprobs: {
+    param: 'logprobs',
+    default: false,
+  },
+  top_logprobs: {
+    param: 'top_logprobs',
+    default: 0,
+  },
+  chat_template_kwargs: { // NOTE(review): this entry and those below are not part of the OpenAI chat schema; presumably Lepton extensions, confirm against Lepton's API reference.
+    param: 'chat_template_kwargs',
+  },
+  length_penalty: {
+    param: 'length_penalty',
+    default: 1,
+  },
+  repetition_penalty: {
+    param: 'repetition_penalty',
+    default: 1,
+  },
+  dry_multiplier: {
+    param: 'dry_multiplier',
+    default: 0,
+  },
+  dry_base: {
+    param: 'dry_base',
+    default: 1.75,
+  },
+  dry_allowed_length: {
+    param: 'dry_allowed_length',
+    default: 2,
+  },
+  do_early_stopping: {
+    param: 'do_early_stopping',
+    default: false,
+  },
+  beam_size: {
+    param: 'beam_size',
+    default: 1,
+  },
+  top_k: {
+    param: 'top_k',
+    default: 50,
+  },
+  min_p: {
+    param: 'min_p',
+    default: 0,
+  },
+  id: {
+    param: 'id',
+  },
+  require_audio: { // NOTE(review): the tts_* and audio_history_b64 entries below look like companions to this flag; confirm.
+    param: 'require_audio',
+    default: false,
+  },
+  tts_preset_id: {
+    param: 'tts_preset_id',
+    default: 'jessica',
+  },
+  tts_audio_format: {
+    param: 'tts_audio_format',
+    default: 'mp3',
+  },
+  tts_audio_bitrate: {
+    param: 'tts_audio_bitrate',
+    default: 64,
+  },
+  audio_history_b64: {
+    param: 'audio_history_b64',
+  },
+  for_quant_calibration: {
+    param: 'for_quant_calibration',
+    default: false,
+  },
+};
+
+// Minimal typed view of one JSON-parsed chunk of a streamed Lepton chat
+// completion, as consumed by the stream chunk transform in this module.
+interface LeptonStreamChunk {
+  id: string;
+  object: string;
+  created: number;
+  model: string;
+  choices: Array<{
+    index: number;
+    // Partial message payload: optional role and optional content.
+    delta: { role?: string | null; content?: string };
+    finish_reason: string | null;
+  }>;
+}
+
+/**
+ * Post-processes a non-streaming Lepton chat response. A payload carrying an
+ * `error` key on a non-200 status goes through the OpenAI error transform;
+ * anything else gets an enumerable `provider` property defined in place.
+ */
+export const LeptonChatCompleteResponseTransform: (
+  response: LeptonChatCompleteResponse | ErrorResponse,
+  responseStatus: number
+) => ChatCompletionResponse | ErrorResponse = (response, responseStatus) => {
+  const upstreamFailed = responseStatus !== 200;
+  if (upstreamFailed && 'error' in response) {
+    return OpenAIErrorResponseTransform(response, LEPTON);
+  }
+  const providerTag = { value: LEPTON, enumerable: true };
+  return Object.defineProperty(response, 'provider', providerTag);
+};
+
+/**
+ * Converts one SSE chunk of a Lepton chat stream into the gateway's chunk
+ * format, tagging it with the provider name.
+ *
+ * - `[DONE]` is re-emitted as-is.
+ * - Every entry of `choices` is forwarded, so an empty array (as in a
+ *   usage-only chunk) yields `choices: []` rather than an error log, and
+ *   `usage` is copied through when the upstream chunk carries it.
+ * - A payload that is not JSON, or has no `choices` array, is logged and
+ *   forwarded unchanged.
+ */
+export const LeptonChatCompleteStreamChunkTransform = (
+  responseChunk: string
+) => {
+  const chunk = responseChunk.trim().replace(/^data: /, '').trim();
+  if (chunk === '[DONE]') {
+    return `data: ${chunk}\n\n`;
+  }
+  try {
+    const parsedChunk: LeptonStreamChunk & { usage?: unknown } =
+      JSON.parse(chunk);
+    const { id, object, created, model, usage } = parsedChunk;
+    const provider = LEPTON;
+    const choices = parsedChunk.choices.map(
+      ({ index, delta, finish_reason }) => ({ index, delta, finish_reason })
+    );
+    // JSON.stringify omits `usage` when the upstream chunk did not carry one.
+    const payload = { id, object, created, model, provider, choices, usage };
+    return `data: ${JSON.stringify(payload)}\n\n`;
+  } catch (error) {
+    console.error('Error parsing Lepton stream chunk:', error);
+    return `data: ${chunk}\n\n`;
+  }
+};