diff --git a/src/providers/cortex/trulens/providers/cortex/config/cortex_model_costs.json b/src/providers/cortex/trulens/providers/cortex/config/cortex_model_costs.json index c68a9ad8a..789c36a9c 100644 --- a/src/providers/cortex/trulens/providers/cortex/config/cortex_model_costs.json +++ b/src/providers/cortex/trulens/providers/cortex/config/cortex_model_costs.json @@ -1,17 +1,10 @@ { - "reka-core": 5.5, "mistral-large": 5.1, - "llama3.1-405b": 5, + "llama3.1-405b": 3, "mistral-large2": 1.95, - "llama3-70b": 1.21, "llama3.1-70b": 1.21, - "snowflake-arctic": 0.84, - "jamba-instruct": 0.83, - "llama2-chat-70b": 0.45, - "reka-flash": 0.45, - "mixtral-8x7b": 0.22, - "llama3-8b": 0.19, "llama3.1-8b": 0.19, "mistral-7b": 0.12, - "gemma-7b": 0.12 + "llama3.2-3b": 0.06, + "llama3.2-1b": 0.04 } diff --git a/src/providers/cortex/trulens/providers/cortex/endpoint.py b/src/providers/cortex/trulens/providers/cortex/endpoint.py index 8a543e180..37a20711f 100644 --- a/src/providers/cortex/trulens/providers/cortex/endpoint.py +++ b/src/providers/cortex/trulens/providers/cortex/endpoint.py @@ -26,6 +26,7 @@ def _compute_credits_consumed( if self._model_costs is None: # the credit consumption table needs to be kept up-to-date with # the latest cost information https://www.snowflake.com/legal-files/CreditConsumptionTable.pdf#page=9. + # Also refer to the latest model availability for the REST API: https://docs.snowflake.com/en/user-guide/snowflake-cortex/cortex-llm-rest-api#model-availability with open( os.path.join(