Skip to main content

自定义定价 - SageMaker、Azure 等

为 SageMaker 补全(completion)模型注册自定义定价。

对于按秒计费,您只需注册 `input_cost_per_second`。

# !pip install boto3
import os

from litellm import completion, completion_cost

# AWS settings read from the environment; fill in real values before running.
os.environ["AWS_ACCESS_KEY_ID"] = ""
os.environ["AWS_SECRET_ACCESS_KEY"] = ""
os.environ["AWS_REGION_NAME"] = ""


def test_completion_sagemaker():
    """Call a SageMaker endpoint with a custom per-second price and print the cost.

    Passes ``input_cost_per_second`` to ``completion`` and then feeds the
    response to ``completion_cost``. Both the response and the computed cost
    are printed.

    Raises:
        Exception: wraps any error raised by the call or the cost
            calculation; the original error is kept as ``__cause__``.
    """
    try:
        print("testing sagemaker")
        response = completion(
            model="sagemaker/berri-benchmarking-Llama-2-70b-chat-hf-4",
            messages=[{"role": "user", "content": "Hey, how's it going?"}],
            input_cost_per_second=0.000420,
        )
        # Add any assertions here to check the response
        print(response)
        cost = completion_cost(completion_response=response)
        print(cost)
    except Exception as e:
        # Chain the original exception so its traceback is not lost.
        raise Exception(f"Error occurred: {e}") from e

按令牌计费(例如 Azure)

# !pip install boto3
import os

from litellm import completion, completion_cost

## Set environment variables
os.environ["AZURE_API_KEY"] = ""
os.environ["AZURE_API_BASE"] = ""
os.environ["AZURE_API_VERSION"] = ""


def test_completion_azure_model():
    """Call an Azure deployment with custom per-token prices and print the cost.

    Passes ``input_cost_per_token`` and ``output_cost_per_token`` to
    ``completion`` and then feeds the response to ``completion_cost``. Both
    the response and the computed cost are printed.

    Raises:
        Exception: wraps any error raised by the call or the cost
            calculation; the original error is kept as ``__cause__``.
    """
    try:
        print("testing azure custom pricing")
        # Azure call
        response = completion(
            model="azure/<your_deployment_name>",
            messages=[{"content": "Hello, how are you?", "role": "user"}],
            input_cost_per_token=0.005,
            output_cost_per_token=1,
        )
        # Add any assertions here to check the response
        print(response)
        cost = completion_cost(completion_response=response)
        print(cost)
    except Exception as e:
        # Chain the original exception so its traceback is not lost.
        raise Exception(f"Error occurred: {e}") from e


test_completion_azure_model()
优云智算