diff --git a/prompting/baseminer/run.py b/prompting/baseminer/run.py index 3327a09..1c360ec 100644 --- a/prompting/baseminer/run.py +++ b/prompting/baseminer/run.py @@ -51,7 +51,7 @@ def run(self): # --- Check for registration. if not self.subtensor.is_hotkey_registered( netuid=self.config.netuid, - hotkey=self.wallet.hotkey.ss58_address, + hotkey_ss58=self.wallet.hotkey.ss58_address, ): bt.logging.error( f"Wallet: {self.wallet} is not registered on netuid {self.config.netuid}" diff --git a/prompting/validators/__init__.py b/prompting/validators/__init__.py index 24575cc..6855712 100644 --- a/prompting/validators/__init__.py +++ b/prompting/validators/__init__.py @@ -27,7 +27,7 @@ from . import event from . import dataset -__version__ = "2.1.0" +__version__ = "2.1.1" version_split = __version__.split(".") __spec_version__ = ( (1000 * int(version_split[0])) diff --git a/prompting/validators/forward.py b/prompting/validators/forward.py index 8dfcd1e..5ea5c94 100644 --- a/prompting/validators/forward.py +++ b/prompting/validators/forward.py @@ -241,11 +241,11 @@ async def forward(self): best_summary = summarization_event["best"] exclude = summarization_event["uids"] - prompt_context = "### SUMMARY CONTEXT:\n" + best_summary + best_summary_context = "### SUMMARY CONTEXT:\n" + best_summary for k in range(self.config.neuron.num_followup_steps): # Get a followup question, given the summarized context. - qg_task = create_qg_task(base_text=prompt_context, index=k) + qg_task = create_qg_task(base_text=best_summary_context, index=k) qg_event = await run_step( self, task=qg_task, @@ -257,9 +257,11 @@ async def forward(self): # Adds the best question to the prompt context. best_question = qg_event["best"] - prompt_context += f"\n### QUESTION {k}:\n{best_question}" + best_question_prompt = ( + best_summary_context + f"\n### QUESTION {k}:\n{best_question}" + ) - qa_task = create_qa_task(prompt_context, index=k) + qa_task = create_qa_task(best_question_prompt, index=k) qa_event = await run_step( self, task=qa_task, @@ -268,9 +270,6 @@ async def forward(self): exclude=exclude, ) - best_answer = qa_event["best"] - prompt_context += f"\n### ANSWER {k}:\n{best_answer}" - exclude += qa_event["uids"] self.blacklist.question_blacklist.append(qg_event["best"]) diff --git a/prompting/validators/reward/config.py b/prompting/validators/reward/config.py index ecf9160..7583924 100644 --- a/prompting/validators/reward/config.py +++ b/prompting/validators/reward/config.py @@ -39,8 +39,8 @@ class DefaultRewardFrameworkConfig: Note: All the weights should add up to 1.0. """ - dpo_model_weight: float = 0.425 - rlhf_model_weight: float = 0.15 - reciprocate_model_weight: float = 0.425 + dpo_model_weight: float = 0.6 + rlhf_model_weight: float = 0 + reciprocate_model_weight: float = 0.4 dahoas_model_weight: float = 0 prompt_model_weight: float = 0 diff --git a/prompting/validators/tasks.py b/prompting/validators/tasks.py index e161d7b..ccf63de 100644 --- a/prompting/validators/tasks.py +++ b/prompting/validators/tasks.py @@ -102,7 +102,8 @@ def compose_prompt(self) -> str: prompt_template = textwrap.dedent( """\ Read the preceding context delimited with triple backticks carefully. - Your task is to provide a step-by-step answer to the last question found in the text, elaborating on your thought process: + Your task is to provide a clear and direct answer to the last question found in the text. + Maintain an objective tone by sticking to factual information and logical deductions without personal opinions or emotional language: '''{base_text}''' The following criteria must be respected: diff --git a/run.sh b/run.sh index 6519cc1..1d46108 100755 --- a/run.sh +++ b/run.sh @@ -5,7 +5,7 @@ script="neurons/validators/validator.py" autoRunLoc=$(readlink -f "$0") proc_name="text_prompt_validators_main_process" args=() -version_location="./prompting/__init__.py" +version_location="./prompting/validators/__init__.py" version="__version__" old_args=$@ @@ -229,7 +229,7 @@ if [ "$?" -eq 1 ]; then if [ -d "./.git" ]; then # check value on github remotely - latest_version=$(check_variable_value_on_github "opentensor/validators" "openvalidators/__init__.py" "__version__ ") + latest_version=$(check_variable_value_on_github "opentensor/text-prompting" "prompting/validators/__init__.py" "__version__ ") # If the file has been updated if version_less_than $current_version $latest_version; then