diff --git a/src/proxy/middleware/response/index.ts b/src/proxy/middleware/response/index.ts index c79f3df..1858712 100644 --- a/src/proxy/middleware/response/index.ts +++ b/src/proxy/middleware/response/index.ts @@ -34,7 +34,7 @@ const isSupportedContentEncoding = ( return contentEncoding in DECODER_MAP; }; -class RetryableError extends Error { +export class RetryableError extends Error { constructor(message: string) { super(message); this.name = "RetryableError"; diff --git a/src/shared/key-management/aws/provider.ts b/src/shared/key-management/aws/provider.ts index f7077c7..a4136cd 100644 --- a/src/shared/key-management/aws/provider.ts +++ b/src/shared/key-management/aws/provider.ts @@ -37,7 +37,7 @@ export interface AwsBedrockKey extends Key, AwsBedrockKeyUsage { * Upon being rate limited, a key will be locked out for this many milliseconds * while we wait for other concurrent requests to finish. */ -const RATE_LIMIT_LOCKOUT = 300; +const RATE_LIMIT_LOCKOUT = 1000; /** * Upon assigning a key, we will wait this many milliseconds before allowing it * to be used again. This is to prevent the queue from flooding a key with too