Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat: add ofv_market_resolver tool #245

Closed
wants to merge 2 commits into from
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
20 changes: 20 additions & 0 deletions packages/gnosis/customs/ofv_market_resolver/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,20 @@
# -*- coding: utf-8 -*-
# ------------------------------------------------------------------------------
#
# Copyright 2023-2024 Valory AG
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# ------------------------------------------------------------------------------

"""This module contains the bet amount per threshold strategy."""
29 changes: 29 additions & 0 deletions packages/gnosis/customs/ofv_market_resolver/component.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,29 @@
name: ofv_market_resolver
author: gnosis
version: 0.1.0
type: custom
description: Tool for resolving markets using
license: Apache-2.0
aea_version: '>=1.0.0, <2.0.0'
fingerprint:
__init__.py: bafybeibbn67pnrrm4qm3n3kbelvbs3v7fjlrjniywmw2vbizarippidtvi
ofv_market_resolver.py: bafybeibwi4ybaw6epwbqmdc3ulgkhqp7f5n6vfdmna7vclqrnt6zz64ejy
fingerprint_ignore_patterns: []
entry_point: omen_buy_sell.py
callable: run
dependencies:
pydantic:
version: '>=1.9.0,<3'
prediction-market-agent-tooling:
version: '>=0.39.0,<0.40.0'
langchain:
version: ==0.1.20
langchain-core:
version: ==0.1.52
langchain-openai:
version: ==0.1.6
langchain_community:
version: ==0.2.1
openai:
version: ==1.30.2
openfactverification: {}
280 changes: 280 additions & 0 deletions packages/gnosis/customs/ofv_market_resolver/ofv_market_resolver.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,280 @@
# -*- coding: utf-8 -*-
# ------------------------------------------------------------------------------
#
# Copyright 2024 Valory AG
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# ------------------------------------------------------------------------------
"""This module contains the ofv market resolver."""
import functools

import openai
from factcheck import FactCheck
from factcheck.utils.multimodal import modal_normalization
import json
from langchain_openai import ChatOpenAI
from typing import Annotated, Any, Dict, Optional, Tuple, Callable
from pydantic import BaseModel, BeforeValidator


MechResponse = Tuple[str, Optional[str], Optional[Dict[str, Any]], Any, Any]

def with_key_rotation(func: Callable):
@functools.wraps(func)
def wrapper(*args, **kwargs) -> MechResponse:
# this is expected to be a KeyChain object,
# although it is not explicitly typed as such
api_keys = kwargs["api_keys"]
retries_left: Dict[str, int] = api_keys.max_retries()

def execute() -> MechResponse:
"""Retry the function with a new key."""
try:
result = func(*args, **kwargs)
return result + (api_keys,)
except openai.RateLimitError as e:
# try with a new key again
if retries_left["openai"] <= 0 and retries_left["openrouter"] <= 0:
raise e
retries_left["openai"] -= 1
retries_left["openrouter"] -= 1
api_keys.rotate("openai")
api_keys.rotate("openrouter")
return execute()
except Exception as e:
return str(e), "", None, None, api_keys

mech_response = execute()
return mech_response

return wrapper


DEFAULT_OPENAI_MODEL = "gpt-4-0125-preview"
ALLOWED_TOOLS = ["ofv_market_resolver"]
ALLOWED_MODELS = [DEFAULT_OPENAI_MODEL]

Factuality = Annotated[
bool | None,
BeforeValidator(lambda v: None if v in ("Nothing to check.", "non-factual") else v),
]


class FactCheckClaimDetails(BaseModel):
claim: str
factuality: Factuality
correction: str | None
reference_url: str


class FactCheckResult(BaseModel):
factuality: Factuality
claims_details: list[FactCheckClaimDetails] | None


def factcheck(
statement: str,
model: str = DEFAULT_OPENAI_MODEL,
openai_api_key: str | None = None,
serper_api_key: str | None = None,
) -> FactCheckResult:
api_config = {
"OPENAI_API_KEY": openai_api_key,
"SERPER_API_KEY": serper_api_key,
}
factcheck = FactCheck(
default_model=model,
api_config=api_config,
retriever="serper",
num_seed_retries=5,
)
content = modal_normalization("string", statement)
res = factcheck.check_response(content)

return FactCheckResult.model_validate(res)


def rewrite_as_sentence(
question: str,
model: str = DEFAULT_OPENAI_MODEL,
openai_api_key: str | None = None,
) -> str:
"""
Rewrites the question into a sentence, example:
`Will former Trump Organization CFO Allen Weisselberg be sentenced to jail by 15 April 2024?`
->
`Former Trump Organization CFO Allen Weisselberg was sentenced to jail by 15 April 2024.`
"""
llm = ChatOpenAI(
model=model,
temperature=0.0,
api_key=openai_api_key,
)

prompt = f"""
Rewrite the question into a simple annoucment sentence stating a fact or prediction like it is already known.
Make future tense into past tense.
For future questions that ask if something will happen "by" some date, rewrite it to "before" that date or any time sooner.
For future questions that ask if something will happen "on" some date, rewrite it to "on" that date.
If the question is both "on" and "by" some date, rewrite it as "before or any time sooner than" that date.
If the question is about exact date, keep it exact.
If the question is about a date range, keep it a range.
Always keep the same meaning.
Never negate the sentence into opposite meaning of the question.
Question: {question}
Sentence:
"""
completion = str(llm.invoke(prompt, max_tokens=512).content)

return completion


# TODO: This could be imported from prediction-market-agent-tooling, but given the conflict in the langchain versions,
# it would require changes in other mechs of this repository.
def is_predictable_binary(
question: str,
model: str = DEFAULT_OPENAI_MODEL,
openai_api_key: str | None = None,
) -> bool:
"""
Evaluate if the question is actually answerable.
"""
llm = ChatOpenAI(
model=model,
temperature=0.0,
api_key=openai_api_key,
)

prompt = f"""Main signs about a fully qualified question (sometimes referred to as a "market"):
- The market's question needs to be specific, without use of pronouns.
- The market's question needs to have a clear future event.
- The market's question needs to have a clear time frame.
- The event in the market's question doesn't have to be ultra-specific, it will be decided by a crowd later on.
- If the market's question contains date, but without an year, it's okay.
- If the market's question contains year, but without an exact date, it's okay.
- The market's question can not be about itself or refer to itself.
- The answer is probably Google-able, after the event happened.
- The potential asnwer can be only "Yes" or "No".
Follow a chain of thought to evaluate if the question is fully qualified:
First, write the parts of the following question:
"{question}"
Then, write down what is the future event of the question, what it refers to and when that event will happen if the question contains it.
Then, explain why do you think it is or isn't fully qualified.
Finally, write your final decision, write `decision: ` followed by either "yes it is fully qualified" or "no it isn't fully qualified" about the question. Don't write anything else after that. You must include "yes" or "no".
"""
completion = str(llm.invoke(prompt, max_tokens=512).content)

try:
decision = completion.lower().rsplit("decision", 1)[1]
except IndexError as e:
raise ValueError(
f"Invalid completion in is_predictable for `{question}`: {completion}"
) from e

if "yes" in decision:
is_predictable = True
elif "no" in decision:
is_predictable = False
else:
raise ValueError(
f"Invalid completion in is_predictable for `{question}`: {completion}"
)

return is_predictable


def build_run_result(
has_occurred: bool | None,
is_determinable: bool | None,
is_valid: bool | None,
) -> Tuple[str, Optional[str], Optional[Dict[str, Any]], Any]:
return (
json.dumps(
{
"has_occurred": has_occurred,
"is_determinable": is_determinable,
"is_valid": is_valid,
}
),
"",
None,
None,
)


def most_common_fact_result(results: list[FactCheckResult]) -> FactCheckResult:
"""
Given a list of fact check results, return the first `FactCheckResult` in the list with `factuality` being the most common.
"""
factualities = [fact.factuality for fact in results]
most_common_fact = max(set(factualities), key=factualities.count)
first_most_common_fact = [
fact for fact in results if fact.factuality == most_common_fact
][0]
return first_most_common_fact


@with_key_rotation
def run(
prompt: str,
api_keys: Any,
n_fact_runs: int = 3,
**kwargs: Any, # Just to ignore any other arguments passed to the resolver by the universal benchmark script.
) -> Tuple[str, Optional[str], Optional[Dict[str, Any]], Any]:
"""
Run the prediction market resolver based on Open Fact Verifier.
"""
assert (
n_fact_runs > 0 and n_fact_runs % 2 != 0
), "n_fact_runs must be greater than 0 and an odd number"
market_question = prompt # `prompt` argument name is for compatibility with the original resolver.
openai_api_key = api_keys["openai"]
serper_api_key = api_keys["serperapi"]

# Check if the question is reasonable to look for an answer.
is_answerable = is_predictable_binary(
market_question, openai_api_key=openai_api_key
)
if not is_answerable:
print(
f"Question `{market_question}` is not answerable, skipping fact checking."
)
return build_run_result(
has_occurred=None, is_determinable=is_answerable, is_valid=None
)

# Rewrite the question (which was about a future) into a sentence (which is about the past).
market_sentence = rewrite_as_sentence(
market_question, openai_api_key=openai_api_key
)
print(f"Question `{market_question}` rewritten into `{market_sentence}`.")
# Fact-check the sentence.
factresults = [
factcheck(
market_sentence,
openai_api_key=openai_api_key,
serper_api_key=serper_api_key,
)
for _ in range(n_fact_runs)
]
factresult = most_common_fact_result(factresults)
print(
f"Fact check result for `{market_sentence}` is `{factresult.factuality}`, because {factresult.claims_details}."
)

return build_run_result(
has_occurred=factresult.factuality,
is_determinable=is_answerable,
is_valid=factresult.factuality is not None,
)
1 change: 1 addition & 0 deletions packages/packages.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,6 +30,7 @@
"custom/gnosis/omen_tools/0.1.0": "bafybeibnjcgvy4l2libl34qz3aqfietjrevhxsbtisttuyfnelp3rfjlge",
"custom/victorpolisetty/dalle_request/0.1.0": "bafybeicgjdvgamkgjebdrowrxdil3aghsbcm7epup6aqidikvjpmvomn6q",
"custom/jhehemann/prediction_sentence_embeddings/0.1.0": "bafybeifivchm3pxiofu7y7a6gzfijfzgptvehcmd6auqsfsro7unaewbo4",
"custom/gnosis/ofv_market_resolver/0.1.0": "bafybeihshd446f4cqn34ef23mhkzauctyn3yl34t6p5kjvz4cn4mboj244",
"protocol/valory/acn_data_share/0.1.0": "bafybeih5ydonnvrwvy2ygfqgfabkr47s4yw3uqxztmwyfprulwfsoe7ipq",
"protocol/valory/websocket_client/0.1.0": "bafybeifjk254sy65rna2k32kynzenutujwqndap2r222afvr3zezi27mx4",
"contract/valory/agent_mech/0.1.0": "bafybeiah6b5epo2hlvzg5rr2cydgpp2waausoyrpnoarf7oa7bw33rex34",
Expand Down
Loading
Loading