valory-xyz · 0xArdi · Feb 7, 2024 · Jan 31, 2024 · Feb 6, 2024 · Feb 6, 2024
diff --git a/.github/workflows/common_checks.yaml b/.github/workflows/common_checks.yaml
@@ -17,9 +17,10 @@ jobs:
         os: [ ubuntu-latest, macos-latest, windows-latest ]
         python-version: [ "3.10" ]
         poetry-version: ["1.3.2"]
-
     timeout-minutes: 10
-
+    defaults:
+      run:
+        shell: bash
     steps:
     - uses: actions/checkout@v3
     - uses: actions/setup-python@v4
@@ -33,6 +34,10 @@ jobs:
         virtualenvs-in-project: false
         virtualenvs-path: ~/my-custom-path
         installer-parallel: true
+    # Resolve the dependencies first so an unlockable pyproject.toml fails on its own step.
+    - name: Check if dependencies can be locked
+      run: poetry lock
+    - name: Install requirements with Poetry
+      run: poetry install --all-extras --no-interaction -vvv
 
   copyright_and_dependencies_check:
     continue-on-error: False

diff --git a/.pylintrc b/.pylintrc
@@ -0,0 +1,58 @@
+[MASTER]
+ignore-patterns=.*_pb2.py,contract_dispatcher.py,test_abci_messages.py,test_tendermint_messages.py
+ignore=packages/valory/protocols/abci,packages/valory/connections/abci/gogoproto
+
+[MESSAGES CONTROL]
+disable=C0103,R0801,C0301,C0201,C0204,C0209,W1203,C0302,R1735,R1729,W0511,E0611
+
+# See here for more options: https://www.codeac.io/documentation/pylint-configuration.html
+# R1735: use-dict-literal
+# R1729: use-a-generator
+# C0103: invalid-name
+# C0201: consider-iterating-dictionary
+# W1203: logging-fstring-interpolation
+# C0204: bad-mcs-classmethod-argument
+# C0209: consider-using-f-string
+# C0301: http://pylint-messages.wikidot.com/messages:c0301 > Line too long
+# C0302: http://pylint-messages.wikidot.com/messages:c0302 > Too many lines in module
+# R0801: similar lines
+# E0611: no-name-in-module
+
+[IMPORTS]
+ignored-modules=pandas,numpy,aea_cli_ipfs,compose,multidict,gql,anthropic,tiktoken
+
+[DESIGN]
+# min-public-methods=1
+max-public-methods=58
+# max-returns=10
+# max-bool-expr=7
+max-args=6
+# max-locals=31
+# max-statements=80
+max-parents=10
+max-branches=36
+max-attributes=8
+
+[REFACTORING]
+# max-nested-blocks=6
+
+[SPELLING]
+# uncomment to enable
+# spelling-dict=en_US
+
+# List of comma separated words that should not be checked.
+spelling-ignore-words=nocover,pragma,params,noqa,kwargs,str,async,json,boolean,config,pytest,args,url,tx,jsonschema,traceback,api,nosec
+
+[SIMILARITIES]
+
+# Minimum lines number of a similarity.
+min-similarity-lines=10
+
+# Ignore comments when computing similarities.
+ignore-comments=yes
+
+# Ignore docstrings when computing similarities.
+ignore-docstrings=yes
+
+# Ignore imports when computing similarities.
+ignore-imports=no
diff --git a/packages/packages.json b/packages/packages.json
@@ -2,18 +2,18 @@
     "dev": {
         "connection/valory/websocket_client/0.1.0": "bafybeiflmystocxaqblhpzqlcop2vkhsknpzjx2jomohomaxamwskeokzm",
         "skill/valory/contract_subscription/0.1.0": "bafybeicyugrkx5glat4p4ezwf6i7oduh26eycfie6ftd4uxrknztzl3ik4",
-        "agent/valory/mech/0.1.0": "bafybeigpvlyzu2d6xjf2ij4gvmtefrcn5rmmzp237mpsb7ejdpuzskvspu",
-        "skill/valory/mech_abci/0.1.0": "bafybeicekwscm72ujrwc5vzbgnshoxjna7a4vluugiylh4gq7r4yaskuly",
+        "agent/valory/mech/0.1.0": "bafybeiepdstu23qid2pcrugkpwtibh7jhlshmnmclwwbgjmefio27cp4im",
+        "skill/valory/mech_abci/0.1.0": "bafybeieimp7xzxcnbzsuunf2xkcy5juulhmzsmkq2v3sw3o3lgssb53cnu",
         "contract/valory/agent_mech/0.1.0": "bafybeiepxumywg6z2zapqzc3bg3iey23cmlgjzxisqox5j74o5i2texr5e",
-        "service/valory/mech/0.1.0": "bafybeiag3d54b7spafsicjx64ymh5hpmtwoggecnshrdndf67zjtlcksum",
+        "service/valory/mech/0.1.0": "bafybeifzkrmgejdce5nvp7s63dpvthde6wn6etolesh4dmf5pno7jplzcy",
         "protocol/valory/acn_data_share/0.1.0": "bafybeih5ydonnvrwvy2ygfqgfabkr47s4yw3uqxztmwyfprulwfsoe7ipq",
-        "skill/valory/task_submission_abci/0.1.0": "bafybeidned5sysejuakraqa4ssmc76chqnvyu7qqg4aywzddsayyooqflm",
-        "skill/valory/task_execution/0.1.0": "bafybeid7kneedwb3hu2nlsjusxgkfq4mvnsobxsbuqpfwkxnaeor6ffbpi",
+        "skill/valory/task_submission_abci/0.1.0": "bafybeib4m2bwgchloqss3wotsx4rz7qqkwydaesiqkls2zq7zbtp6jtpsi",
+        "skill/valory/task_execution/0.1.0": "bafybeicthrgfdv6q56htrsradow445smojjk2zqqizm4cdxyfxfor22vyy",
         "contract/valory/agent_registry/0.1.0": "bafybeiargayav6yiztdnwzejoejstcx4idssch2h4f5arlgtzj3tgsgfmu",
         "protocol/valory/websocket_client/0.1.0": "bafybeih43mnztdv3v2hetr2k3gezg7d3yj4ur7cxdvcyaqhg65e52s5sf4",
         "skill/valory/websocket_client/0.1.0": "bafybeidwntmkk4b2ixq5454ycbkknclqx7a6vpn7aqpm2nw3duszqrxvta",
         "contract/valory/hash_checkpoint/0.1.0": "bafybeieys27hidb5m267jwqsxdgorf5v37o6lvrfy2oga557stjn4xgoaa",
-        "skill/valory/subscription_abci/0.1.0": "bafybeick4zicydp42ieum74wekcz25uim3uyt7vugzjgfzsriqhswlxfti"
+        "skill/valory/subscription_abci/0.1.0": "bafybeigaxq7m2dqv2huhg5jvb4jx3rysqwvvjj2xhojow3t3zzuwq2k4ie"
     },
     "third_party": {
         "skill/valory/transaction_settlement_abci/0.1.0": "bafybeiaefgqbs7zsn5xe5kdwrujj7ivygkn3ujpw6crnvi3knvxw75qmja",

diff --git a/packages/valory/agents/mech/aea-config.yaml b/packages/valory/agents/mech/aea-config.yaml
@@ -38,12 +38,12 @@ skills:
 - valory/abstract_abci:0.1.0:bafybeiflcfufixmsrhobf56bn5745m2iipcfqyulwk2qegtnagb3kvaaxi
 - valory/abstract_round_abci:0.1.0:bafybeiaqcl7h2famylusiffigwem7tevkcsyocdu5xd42jkmgq6kvowzgq
 - valory/contract_subscription:0.1.0:bafybeicyugrkx5glat4p4ezwf6i7oduh26eycfie6ftd4uxrknztzl3ik4
-- valory/mech_abci:0.1.0:bafybeicekwscm72ujrwc5vzbgnshoxjna7a4vluugiylh4gq7r4yaskuly
+- valory/mech_abci:0.1.0:bafybeieimp7xzxcnbzsuunf2xkcy5juulhmzsmkq2v3sw3o3lgssb53cnu
 - valory/registration_abci:0.1.0:bafybeic2ynseiak7jpta7jfwuqwyp453b4p7lolr4wihxmpn633uekv5am
 - valory/reset_pause_abci:0.1.0:bafybeidzajbe3erygeh2xbd6lrjv7nsptznjuzrt24ykgvhgotdeyhfnba
-- valory/subscription_abci:0.1.0:bafybeick4zicydp42ieum74wekcz25uim3uyt7vugzjgfzsriqhswlxfti
-- valory/task_execution:0.1.0:bafybeid7kneedwb3hu2nlsjusxgkfq4mvnsobxsbuqpfwkxnaeor6ffbpi
-- valory/task_submission_abci:0.1.0:bafybeidned5sysejuakraqa4ssmc76chqnvyu7qqg4aywzddsayyooqflm
+- valory/subscription_abci:0.1.0:bafybeigaxq7m2dqv2huhg5jvb4jx3rysqwvvjj2xhojow3t3zzuwq2k4ie
+- valory/task_execution:0.1.0:bafybeicthrgfdv6q56htrsradow445smojjk2zqqizm4cdxyfxfor22vyy
+- valory/task_submission_abci:0.1.0:bafybeib4m2bwgchloqss3wotsx4rz7qqkwydaesiqkls2zq7zbtp6jtpsi
 - valory/termination_abci:0.1.0:bafybeie4zvjfxvdu7qrulmur3chpjz3kpj5m4bjsxvpk4gvj5zbyyayfaa
 - valory/transaction_settlement_abci:0.1.0:bafybeiaefgqbs7zsn5xe5kdwrujj7ivygkn3ujpw6crnvi3knvxw75qmja
 - valory/websocket_client:0.1.0:bafybeidwntmkk4b2ixq5454ycbkknclqx7a6vpn7aqpm2nw3duszqrxvta
@@ -196,7 +196,7 @@ models:
     args:
       agent_mech_contract_addresses: ${list:["0xFf82123dFB52ab75C417195c5fDB87630145ae81"]}
       task_deadline: ${float:240.0}
-      file_hash_to_tools_json: ${list:[["bafybeifp6tn3ovhuz4oipy67ijfdm4y7t2o7en3xuggn6kh5wbwokxmczu",["claude-prediction-offline","claude-prediction-online"]],["bafybeiaodddyn4eruafqg5vldkkjfglj7jg76uvyi5xhi2cysktlu4w6r4",["openai-gpt-3.5-turbo-instruct","openai-gpt-3.5-turbo","openai-gpt-4"]],["bafybeiafdm3jctiz6wwo3rmo3vdubk7j7l5tumoxi5n5rc3x452mtkgyua",["stabilityai-stable-diffusion-v1-5","stabilityai-stable-diffusion-xl-beta-v2-2-2","stabilityai-stable-diffusion-512-v2-1","stabilityai-stable-diffusion-768-v2-1"]],["bafybeidpbnqbruzqlq424qt3i5dcvyqmcimshjilftabnrroujmjhdmteu",["transfer-native"]],["bafybeiglhy5epaytvt5qqdx77ld23ekouli53qrf2hjyebd5xghlunidfi",["prediction-online","prediction-offline"]]]}
+      file_hash_to_tools_json: ${list:[["bafybeicziwfw7nb7gaxso357hrvtdlv6f23grm2c2rlfngpz4vbvoz2bke",["openai-gpt-3.5-turbo-instruct","openai-gpt-3.5-turbo","openai-gpt-4"]],["bafybeibaalr745aqajcaijykactx2nmg3jviefvnvpuk5kkxlt2yeedc2q",["stabilityai-stable-diffusion-v1-5","stabilityai-stable-diffusion-xl-beta-v2-2-2","stabilityai-stable-diffusion-512-v2-1","stabilityai-stable-diffusion-768-v2-1"]],["bafybeideuyqn4uslp4ccanzd5tjladzotyi6tiwfxbouecw5ufzgyi4ryy",["transfer-native"]],["bafybeig7yntvhhfufaadhd43zr4loivpit43kwfgban72w43xz4u3tansi",["prediction-offline","prediction-online","prediction-online-summarized-info"]],["bafybeiautzxe3faq53ceogfjtfbml5373wvqpsk77c4k3hjivloblivuxy",["prediction-online-sme","prediction-offline-sme"]],["bafybeifp6tn3ovhuz4oipy67ijfdm4y7t2o7en3xuggn6kh5wbwokxmczu",["claude-prediction-online","claude-prediction-offline"]],["bafybeievl777e2425q7zy6qkt26luu2i6xzp4q6pquykntx2yzivy3iwum",["deepmind-optimization-strong","deepmind-optimization"]],["bafybeihsyxhchqgtdwsd53z4a2lswt6ri4fre2yg2bpjo36kwboilsp7ai",["prediction-sentence-embedding-conservative","prediction-sentence-embedding-bold"]],["bafybeial5a56vsowqu4suynnmv5pkt5iebkxtmpgrae57qzi7s6tg4vq6e",["prediction-online-sum-url-content"]]]}
       api_keys_json: ${list:[["openai", "dummy_api_key"],["stabilityai", "dummy_api_key"],["google_api_key",
         "dummy_api_key"],["google_engine_id", "dummy_api_key"]]}
       polling_interval: ${float:30.0}

diff --git a/packages/valory/services/mech/service.yaml b/packages/valory/services/mech/service.yaml
@@ -7,7 +7,7 @@ license: Apache-2.0
 fingerprint:
   README.md: bafybeif7ia4jdlazy6745ke2k2x5yoqlwsgwr6sbztbgqtwvs3ndm2p7ba
 fingerprint_ignore_patterns: []
-agent: valory/mech:0.1.0:bafybeigpvlyzu2d6xjf2ij4gvmtefrcn5rmmzp237mpsb7ejdpuzskvspu
+agent: valory/mech:0.1.0:bafybeiepdstu23qid2pcrugkpwtibh7jhlshmnmclwwbgjmefio27cp4im
 number_of_agents: 4
 deployment:
   agent:

diff --git a/packages/valory/skills/mech_abci/skill.yaml b/packages/valory/skills/mech_abci/skill.yaml
@@ -23,10 +23,10 @@ skills:
 - valory/abstract_round_abci:0.1.0:bafybeiaqcl7h2famylusiffigwem7tevkcsyocdu5xd42jkmgq6kvowzgq
 - valory/registration_abci:0.1.0:bafybeic2ynseiak7jpta7jfwuqwyp453b4p7lolr4wihxmpn633uekv5am
 - valory/reset_pause_abci:0.1.0:bafybeidzajbe3erygeh2xbd6lrjv7nsptznjuzrt24ykgvhgotdeyhfnba
-- valory/task_submission_abci:0.1.0:bafybeidned5sysejuakraqa4ssmc76chqnvyu7qqg4aywzddsayyooqflm
+- valory/task_submission_abci:0.1.0:bafybeib4m2bwgchloqss3wotsx4rz7qqkwydaesiqkls2zq7zbtp6jtpsi
 - valory/termination_abci:0.1.0:bafybeie4zvjfxvdu7qrulmur3chpjz3kpj5m4bjsxvpk4gvj5zbyyayfaa
 - valory/transaction_settlement_abci:0.1.0:bafybeiaefgqbs7zsn5xe5kdwrujj7ivygkn3ujpw6crnvi3knvxw75qmja
-- valory/subscription_abci:0.1.0:bafybeick4zicydp42ieum74wekcz25uim3uyt7vugzjgfzsriqhswlxfti
+- valory/subscription_abci:0.1.0:bafybeigaxq7m2dqv2huhg5jvb4jx3rysqwvvjj2xhojow3t3zzuwq2k4ie
 behaviours:
   main:
     args: {}

diff --git a/packages/valory/skills/subscription_abci/skill.yaml b/packages/valory/skills/subscription_abci/skill.yaml
@@ -166,7 +166,7 @@ dependencies:
   googlesearch-python:
     version: ==1.2.3
   openai:
-    version: ==0.27.2
+    version: ==1.11.0
   py-multibase:
     version: ==1.0.3
   py-multicodec:

diff --git a/packages/valory/skills/task_execution/behaviours.py b/packages/valory/skills/task_execution/behaviours.py
@@ -48,6 +48,7 @@
 from packages.valory.protocols.ipfs.dialogues import IpfsDialogue
 from packages.valory.protocols.ledger_api import LedgerApiMessage
 from packages.valory.skills.task_execution.models import Params
+from packages.valory.skills.task_execution.utils.benchmarks import TokenCounterCallback
 from packages.valory.skills.task_execution.utils.ipfs import (
     ComponentPackageLoader,
     get_ipfs_file_hash,
@@ -291,8 +292,16 @@ def _handle_done_task(self, task_result: Any) -> None:
         }
         if task_result is not None:
             # task succeeded
-            deliver_msg, prompt, transaction = task_result
-            response = {**response, "result": deliver_msg, "prompt": prompt}
+            deliver_msg, prompt, transaction, counter_callback = task_result
+            cost_dict = {}
+            if counter_callback is not None:
+                cost_dict = cast(TokenCounterCallback, counter_callback).cost_dict
+            response = {
+                **response,
+                "result": deliver_msg,
+                "prompt": prompt,
+                "cost_dict": cost_dict,
+            }
             self._done_task["transaction"] = transaction
 
         self.context.logger.info(f"Task result for request {req_id}: {task_result}")
@@ -371,6 +380,7 @@ def _prepare_task(self, task_data: Dict[str, Any]) -> None:
         task_data["tool_py"] = tool_py
         task_data["callable_method"] = callable_method
         task_data["api_keys"] = self.params.api_keys
+        task_data["counter_callback"] = TokenCounterCallback()
         future = self._submit_task(tool_task.execute, **task_data)
         executing_task = cast(Dict[str, Any], self._executing_task)
         executing_task["timeout_deadline"] = time.time() + self.params.task_deadline

diff --git a/packages/valory/skills/task_execution/skill.yaml b/packages/valory/skills/task_execution/skill.yaml
@@ -7,11 +7,12 @@ license: Apache-2.0
 aea_version: '>=1.0.0, <2.0.0'
 fingerprint:
   __init__.py: bafybeidqhvvlnthkbnmrdkdeyjyx2f2ab6z4xdgmagh7welqnh2v6wczx4
-  behaviours.py: bafybeifa72egwarcmfneqmo3ak6wfygjc3i7hplxl6ptafb263vuaey3fm
+  behaviours.py: bafybeihprwot27csugwpoimsqcwprxu5bstqpvanot3nkmfgvhbr66ww4y
   dialogues.py: bafybeid4zxalqdlo5mw4yfbuf34hx4jp5ay5z6chm4zviwu4cj7fudtwca
   handlers.py: bafybeidbt5ezj74cgfogk3w4uw4si2grlnk5g54veyumw7g5yh6gdscywu
   models.py: bafybeihgclxctyltuehj2f4fzj26edptqugrrm4phd6ovuulezrqot6qo4
   utils/__init__.py: bafybeiccdijaigu6e5p2iruwo5mkk224o7ywedc7nr6xeu5fpmhjqgk24e
+  utils/benchmarks.py: bafybeihdutp44ds4cupszbd34gsmcw6fsdda2tzkh5b27fpg65ejbpdvdm
   utils/ipfs.py: bafybeidinbdqkidix44ibz5hug7inkcbijooag53gr5mtbaa72tk335uqq
   utils/task.py: bafybeieuziu7owtk543z3umgmayhjh67klftk7vrhz24l6rlaii5lvkqh4
 fingerprint_ignore_patterns: []
@@ -99,11 +100,15 @@ dependencies:
   googlesearch-python:
     version: ==1.2.3
   openai:
-    version: ==0.27.2
+    version: ==1.11.0
   py-multibase:
     version: ==1.0.3
   py-multicodec:
     version: ==0.2.1
   pyyaml:
     version: <=6.0.1,>=3.10
+  tiktoken:
+    version: ==0.5.1
+  anthropic:
+    version: ==0.3.11
 is_abstract: false
diff --git a/packages/valory/skills/task_execution/utils/benchmarks.py b/packages/valory/skills/task_execution/utils/benchmarks.py
@@ -0,0 +1,105 @@
+# -*- coding: utf-8 -*-
+# ------------------------------------------------------------------------------
+#
+#   Copyright 2024 Valory AG
+#
+#   Licensed under the Apache License, Version 2.0 (the "License");
+#   you may not use this file except in compliance with the License.
+#   You may obtain a copy of the License at
+#
+#       http://www.apache.org/licenses/LICENSE-2.0
+#
+#   Unless required by applicable law or agreed to in writing, software
+#   distributed under the License is distributed on an "AS IS" BASIS,
+#   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#   See the License for the specific language governing permissions and
+#   limitations under the License.
+#
+# ------------------------------------------------------------------------------
+"""Benchmarking for tools."""
+
+import logging
+from typing import Any, Dict, Union
+
+import anthropic
+import tiktoken
+from tiktoken import Encoding
+
+
+PRICE_NUM_TOKENS = 1000  # TOKEN_PRICES entries are applied per this many tokens
+
+
+def encoding_for_model(model: str) -> Encoding:
+    """Look up the tiktoken encoding associated with the given model name."""
+    model_encoding = tiktoken.encoding_for_model(model)
+    return model_encoding
+
+
+def count_tokens(text: str, model: str) -> int:
+    """Return how many tokens the given text occupies for the given model."""
+    if "claude" not in model:
+        # Every other model is tokenized through its tiktoken encoding.
+        return len(encoding_for_model(model).encode(text))
+
+    return anthropic.Anthropic().count_tokens(text)
+
+
+class TokenCounterCallback:
+    """Callback that accumulates token usage and dollar cost across generations."""
+
+    # Price in dollars per PRICE_NUM_TOKENS tokens, by model and token direction.
+    TOKEN_PRICES = {
+        "gpt-3.5-turbo": {"input": 0.001, "output": 0.002},
+        "gpt-4": {"input": 0.03, "output": 0.06},
+        "gpt-4-turbo": {"input": 0.01, "output": 0.03},
+        "claude-2": {"input": 0.008, "output": 0.024},
+    }
+
+    def __init__(self) -> None:
+        """Initialize the callback with every counter at zero."""
+        self.cost_dict: Dict[str, Union[int, float]] = {
+            "input_tokens": 0,
+            "output_tokens": 0,
+            "total_tokens": 0,
+            "input_cost": 0,
+            "output_cost": 0,
+            "total_cost": 0,
+        }
+
+    @staticmethod
+    def token_to_cost(tokens: int, model: str, tokens_type: str) -> float:
+        """
+        Convert a number of tokens into a cost in dollars.
+
+        :param tokens: the number of tokens.
+        :param model: the model name, a key of `TOKEN_PRICES`.
+        :param tokens_type: the price to apply, "input" or "output".
+        :return: the cost of the given tokens.
+        """
+        price = TokenCounterCallback.TOKEN_PRICES[model][tokens_type]
+        return tokens / PRICE_NUM_TOKENS * price
+
+    def calculate_cost(self, tokens_type: str, model: str, **kwargs: Any) -> None:
+        """
+        Add the tokens and cost of one side of a generation to `cost_dict`.
+
+        :param tokens_type: the side to account for, "input" or "output".
+        :param model: the model name, a key of `TOKEN_PRICES`.
+        :param kwargs: either `<tokens_type>_prompt` (text that gets tokenized)
+            or `<tokens_type>_tokens` (a ready token count); the prompt wins.
+        """
+        prompt_key = f"{tokens_type}_prompt"
+        token_key = f"{tokens_type}_tokens"
+        if prompt_key in kwargs:
+            tokens = count_tokens(kwargs[prompt_key], model)
+        elif token_key in kwargs:
+            tokens = kwargs[token_key]
+        else:
+            # Nothing to account for on this side: leave the counters untouched
+            # instead of falling through with `tokens` unbound.
+            logging.warning(f"No {token_key} or {prompt_key} found.")
+            return
+        self.cost_dict[token_key] += tokens
+        self.cost_dict[f"{tokens_type}_cost"] += self.token_to_cost(
+            tokens, model, tokens_type
+        )
+
+    def __call__(self, model: str, **kwargs: Any) -> None:
+        """
+        Record the token usage and cost of one generation.
+
+        :param model: the model name, must be a key of `TOKEN_PRICES`.
+        :param kwargs: prompts and/or token counts, forwarded to `calculate_cost`.
+        :raises ValueError: if the model has no entry in `TOKEN_PRICES`.
+        """
+        if model not in TokenCounterCallback.TOKEN_PRICES:
+            raise ValueError(f"Model {model} not supported.")
+        try:
+            self.calculate_cost("input", model, **kwargs)
+            self.calculate_cost("output", model, **kwargs)
+            self.cost_dict["total_tokens"] = (
+                self.cost_dict["input_tokens"] + self.cost_dict["output_tokens"]
+            )
+            self.cost_dict["total_cost"] = (
+                self.cost_dict["input_cost"] + self.cost_dict["output_cost"]
+            )
+        except Exception as e:
+            # Any failure while counting is logged rather than propagated.
+            logging.error(f"Error in TokenCounterCallback: {e}")
diff --git a/packages/valory/skills/task_submission_abci/skill.yaml b/packages/valory/skills/task_submission_abci/skill.yaml
@@ -171,7 +171,7 @@ dependencies:
   googlesearch-python:
     version: ==1.2.3
   openai:
-    version: ==0.27.2
+    version: ==1.11.0
   py-multibase:
     version: ==1.0.3
   py-multicodec: