Gemini tests (#23)

Katsiarynka · web-flow · commit e83c839e8dbb · 2024-09-02T18:08:38.000+03:00
diff --git a/flow_prompt/ai_models/ai_model.py b/flow_prompt/ai_models/ai_model.py
@@ -31,6 +31,15 @@ def name(self) -> str:
     def price_per_prompt_1k_tokens(self) -> Decimal:
         return self._price_per_prompt_1k_tokens
 
+    def _decimal(self, value) -> Decimal:
+        return Decimal(value).quantize(Decimal(".00001"))  # quantize to five decimal places
+    
+    def get_prompt_price(self, count_tokens: int) -> Decimal:  # quantized cost of count_tokens prompt tokens
+        return self._decimal(self.price_per_prompt_1k_tokens * Decimal(count_tokens) / 1000)  # the rate is per 1k tokens
+    
+    def get_sample_price(self, prompt_sample, count_tokens: int) -> Decimal:  # prompt_sample is not used by this implementation
+        return self._decimal(self.price_per_sample_1k_tokens * Decimal(count_tokens) / 1000)  # the rate is per 1k tokens
+
     @property
     def price_per_sample_1k_tokens(self) -> Decimal:
         return self._price_per_sample_1k_tokens
diff --git a/flow_prompt/ai_models/claude/claude_model.py b/flow_prompt/ai_models/claude/claude_model.py
@@ -1,6 +1,7 @@
 from flow_prompt.ai_models.ai_model import AI_MODELS_PROVIDER, AIModel
 import logging
 
+from flow_prompt.ai_models.constants import C_200K
 from flow_prompt.responses import AIResponse
 from decimal import Decimal
 from enum import Enum
@@ -20,8 +21,6 @@
 logger = logging.getLogger(__name__)
 
 
-C_200K = 200000
-
 
 class FamilyModel(Enum):
     haiku = "Claude 3 Haiku"
@@ -30,8 +29,8 @@ class FamilyModel(Enum):
 
 
 DEFAULT_PRICING = {
-    "price_per_prompt_1k_tokens": Decimal(0.00025),
-    "price_per_sample_1k_tokens": Decimal(0.00125),
+    "price_per_prompt_1k_tokens": Decimal(0.003),
+    "price_per_sample_1k_tokens": Decimal(0.015),
 }
 
 CLAUDE_AI_PRICING = {
@@ -156,13 +155,17 @@ def name(self) -> str:
 
     @property
     def price_per_prompt_1k_tokens(self) -> Decimal:
-        return CLAUDE_AI_PRICING[self.family].get(self.max_tokens, DEFAULT_PRICING)[
+        """Prompt rate per 1k tokens for ``max_tokens``; unknown sizes use the family's first listed tier."""
+        tiers = CLAUDE_AI_PRICING[self.family]
+        return tiers.get(self.max_tokens, list(tiers.values())[0])[
             "price_per_prompt_1k_tokens"
         ]
 
     @property
     def price_per_sample_1k_tokens(self) -> Decimal:
-        return CLAUDE_AI_PRICING[self.family].get(self.max_tokens, DEFAULT_PRICING)[
+        """Sample rate per 1k tokens for ``max_tokens``; unknown sizes use the family's first listed tier."""
+        tiers = CLAUDE_AI_PRICING[self.family]
+        return tiers.get(self.max_tokens, list(tiers.values())[0])[
             "price_per_sample_1k_tokens"
         ]
 
diff --git a/flow_prompt/ai_models/constants.py b/flow_prompt/ai_models/constants.py
@@ -0,0 +1,9 @@
+
+C_4K = 4096
+C_8K = 8192
+C_16K = 16384
+C_32K = 32768
+
+C_128K = 128_000
+C_200K = 200_000
+C_1M = 1_000_000
diff --git a/flow_prompt/ai_models/gemini/constants.py b/flow_prompt/ai_models/gemini/constants.py
diff --git a/flow_prompt/ai_models/gemini/gemini_model.py b/flow_prompt/ai_models/gemini/gemini_model.py
@@ -1,6 +1,7 @@
 from flow_prompt.ai_models.ai_model import AI_MODELS_PROVIDER, AIModel
 import logging
 
+from flow_prompt.ai_models.constants import C_1M, C_128K
 from flow_prompt.responses import AIResponse
 from decimal import Decimal
 from enum import Enum
@@ -9,22 +10,27 @@
 from dataclasses import dataclass
 
 from flow_prompt.ai_models.gemini.responses import GeminiAIResponse
-from flow_prompt.ai_models.gemini.constants import FLASH, PRO
+
 from flow_prompt.ai_models.utils import get_common_args
 from openai.types.chat import ChatCompletionMessage as Message
 from flow_prompt.responses import Prompt
 from flow_prompt.exceptions import RetryableCustomError, ConnectionLostError
 import google.generativeai as genai
 
+
 logger = logging.getLogger(__name__)
 
 
-C_128K = 127_000
+FLASH = "gemini-1.5-flash"
+PRO = "gemini-1.5-pro"
+PRO_1_0 = "gemini-1.0-pro"
+
 
 
 class FamilyModel(Enum):
     flash = "Gemini 1.5 Flash"
     pro = "Gemini 1.5 Pro"
+    pro_1_0 = "Gemini 1.0 Pro"
 
 
 DEFAULT_PRICING = {
@@ -35,14 +41,28 @@ class FamilyModel(Enum):
 GEMINI_AI_PRICING = {
     FamilyModel.flash.value: {
         C_128K: {
-            "price_per_prompt_1k_tokens": Decimal(0.00035),
-            "price_per_sample_1k_tokens": Decimal(0.00105),
+            "price_per_prompt_1k_tokens": Decimal(0.000075),  # $0.075 per 1M tokens
+            "price_per_sample_1k_tokens": Decimal(0.0003),  # $0.30 per 1M tokens
+        },
+        C_1M: {
+            "price_per_prompt_1k_tokens": Decimal(0.00015),  # $0.15 per 1M tokens
+            "price_per_sample_1k_tokens": Decimal(0.0006),  # $0.60 per 1M tokens
+        }
+    },
+    FamilyModel.pro_1_0.value: {
+        C_1M: {
+            "price_per_prompt_1k_tokens": Decimal(0.0005),
+            "price_per_sample_1k_tokens": Decimal(0.0015),
         }
     },
     FamilyModel.pro.value: {
         C_128K: {
             "price_per_prompt_1k_tokens": Decimal(0.0035),
             "price_per_sample_1k_tokens": Decimal(0.0105),
+        },
+        C_1M: {
+            "price_per_prompt_1k_tokens": Decimal(0.007),
+            "price_per_sample_1k_tokens": Decimal(0.021),
         }
     },
 }
@@ -51,13 +71,17 @@ class FamilyModel(Enum):
 @dataclass(kw_only=True)
 class GeminiAIModel(AIModel):
     model: str
+    max_tokens: int = C_1M
     gemini_model: genai.GenerativeModel = None
     provider: AI_MODELS_PROVIDER = AI_MODELS_PROVIDER.GEMINI
     family: str = None
 
     def __post_init__(self):
+        self.model = self.model.lower()
         if FLASH in self.model:
             self.family = FamilyModel.flash.value
+        elif PRO_1_0 in self.model:
+            self.family = FamilyModel.pro_1_0.value
         elif PRO in self.model:
             self.family = FamilyModel.pro.value
         else:
@@ -129,18 +153,6 @@ def call(self, messages: t.List[dict], max_tokens: int, client_secrets: dict = {
     def name(self) -> str:
         return self.model
 
-    @property
-    def price_per_prompt_1k_tokens(self) -> Decimal:
-        return GEMINI_AI_PRICING[self.family].get(self.max_tokens, DEFAULT_PRICING)[
-            "price_per_prompt_1k_tokens"
-        ]
-
-    @property
-    def price_per_sample_1k_tokens(self) -> Decimal:
-        return GEMINI_AI_PRICING[self.family].get(self.max_tokens, DEFAULT_PRICING)[
-            "price_per_sample_1k_tokens"
-        ]
-
     def get_params(self) -> t.Dict[str, t.Any]:
         return {
             "model": self.model,
@@ -152,3 +164,19 @@ def get_metrics_data(self) -> t.Dict[str, t.Any]:
             "model": self.model,
             "max_tokens": self.max_tokens,
         }
+
+    def get_prompt_price(self, count_tokens: int) -> Decimal:
+        """Price ``count_tokens`` prompt tokens at the smallest tier whose limit covers them."""
+        for limit, tier in sorted(GEMINI_AI_PRICING[self.family].items()):
+            if count_tokens <= limit:  # a prompt of exactly `limit` tokens still belongs to this tier
+                logger.info("Prompt price for %s tokens is %s", count_tokens, tier["price_per_prompt_1k_tokens"] * Decimal(count_tokens) / 1000)
+                return self._decimal(tier["price_per_prompt_1k_tokens"] * Decimal(count_tokens) / 1000)
+        return self._decimal(self.price_per_prompt_1k_tokens * Decimal(count_tokens) / 1000)  # larger than every tier
+
+    def get_sample_price(self, prompt_sample, count_tokens: int) -> Decimal:
+        """Price ``count_tokens`` sample tokens at the tier selected by the prompt size ``prompt_sample``."""
+        for limit, tier in sorted(GEMINI_AI_PRICING[self.family].items()):
+            if prompt_sample <= limit:  # the tier depends on the prompt size, not on the sample size
+                logger.info("Sample price for %s tokens is %s", count_tokens, tier["price_per_sample_1k_tokens"] * Decimal(count_tokens) / 1000)
+                return self._decimal(tier["price_per_sample_1k_tokens"] * Decimal(count_tokens) / 1000)
+        return self._decimal(self.price_per_sample_1k_tokens * Decimal(count_tokens) / 1000)  # prompt exceeds every tier
diff --git a/flow_prompt/ai_models/openai/openai_models.py b/flow_prompt/ai_models/openai/openai_models.py
@@ -7,6 +7,7 @@
 from openai import OpenAI
 
 from flow_prompt.ai_models.ai_model import AI_MODELS_PROVIDER, AIModel
+from flow_prompt.ai_models.constants import C_128K, C_16K, C_32K, C_4K
 from flow_prompt.ai_models.openai.responses import OpenAIResponse
 from flow_prompt.ai_models.utils import get_common_args
 from flow_prompt.exceptions import ConnectionLostError
@@ -16,11 +17,6 @@
 
 from .utils import raise_openai_exception
 
-C_4K = 4096
-C_8K = 8192
-C_128K = 127_000
-C_16K = 16384
-C_32K = 32768
 M_DAVINCI = "davinci"
 
 logger = logging.getLogger(__name__)
diff --git a/flow_prompt/prompt/flow_prompt.py b/flow_prompt/prompt/flow_prompt.py
@@ -200,14 +200,7 @@ def calculate_budget_for_text(self, user_prompt: UserPrompt, text: str) -> int:
             return 0
         return len(user_prompt.encoding.encode(text))
 
-    def _decimal(self, value) -> Decimal:
-        return Decimal(value).quantize(Decimal(".00001"))
-
     def get_price(
         self, attempt: AttemptToCall, sample_budget: int, prompt_budget: int
     ) -> Decimal:
-        return self._decimal(
-            prompt_budget * attempt.ai_model.price_per_prompt_1k_tokens / 1000
-        ) + self._decimal(
-            sample_budget * attempt.ai_model.price_per_sample_1k_tokens / 1000
-        )
+        return attempt.ai_model.get_prompt_price(prompt_budget) + attempt.ai_model.get_sample_price(prompt_budget, sample_budget)  # total = prompt + sample; the prompt size is passed too because a model may pick its sample rate from it
diff --git a/pyproject.toml b/pyproject.toml
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "flow-prompt"
-version = "0.1.22a1"
+version = "0.1.26"
 description = ""
 authors = ["Flow-prompt Engineering Team <engineering@flow-prompt.com>"]
 readme = "README.md"
diff --git a/tests/ai_models/test_gemini.py b/tests/ai_models/test_gemini.py