Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 7 additions & 2 deletions neurons/miners/huggingface/miner.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,10 +17,11 @@
import time
import bittensor as bt
from prompting.miners import HuggingFaceMiner
from deprecated import deprecated


# This is the main function, which runs the miner.
if __name__ == "__main__":
@deprecated(version="2.4.1+", reason="Class is deprecated, use openai miner for reference on example miner.")
def main():
with HuggingFaceMiner() as miner:
while True:
miner.log_status()
Expand All @@ -29,3 +30,7 @@
if miner.should_exit:
bt.logging.warning("Ending miner...")
break


# Only start the miner loop when this file is executed as a script; importing
# the module (e.g. to reuse `main`) must not launch it.
if __name__ == "__main__":
    main()
41 changes: 26 additions & 15 deletions prompting/base/prompting_miner.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,7 +23,7 @@
from prompting.protocol import StreamPromptingSynapse
from prompting.base.miner import BaseStreamMinerNeuron
from datetime import datetime

from typing import List, Dict

class BaseStreamPromptingMiner(BaseStreamMinerNeuron):
"""
Expand Down Expand Up @@ -159,27 +159,38 @@ def init_wandb(self):

def log_event(
self,
synapse: StreamPromptingSynapse,
timing: float,
prompt: str,
completion: str,
system_prompt: str,
messages,
accumulated_chunks: List[str] = [],
accumulated_chunks_timings: List[float] = [],
extra_info: dict = {},
):
if not getattr(self, "wandb_run", None):
self.init_wandb()


dendrite_uid = self.metagraph.hotkeys.index(synapse.dendrite.hotkey)
step_log = {
"epoch_time": timing,
# "block": self.last_epoch_block,
"prompt": prompt,
"completion": completion,
"system_prompt": system_prompt,
"uid": self.metagraph.hotkeys.index(self.wallet.hotkey.ss58_address),
"stake": self.metagraph.S[self.uid].item(),
"trust": self.metagraph.T[self.uid].item(),
"incentive": self.metagraph.I[self.uid].item(),
"consensus": self.metagraph.C[self.uid].item(),
"dividends": self.metagraph.D[self.uid].item(),
# TODO: add block to logs in the future in a way that doesn't impact performance
# "block": self.block,
"messages": messages,
"accumulated_chunks": accumulated_chunks,
"accumulated_chunks_timings": accumulated_chunks_timings,
"validator_uid": dendrite_uid,
"validator_ip": synapse.dendrite.ip,
"validator_coldkey": self.metagraph.coldkeys[dendrite_uid],
"validator_hotkey": self.metagraph.hotkeys[dendrite_uid],
"validator_stake": self.metagraph.S[dendrite_uid].item(),
"validator_trust": self.metagraph.T[dendrite_uid].item(),
"validator_incentive": self.metagraph.I[dendrite_uid].item(),
"validator_consensus": self.metagraph.C[dendrite_uid].item(),
"validator_dividends": self.metagraph.D[dendrite_uid].item(),
"miner_stake": self.metagraph.S[self.uid].item(),
"miner_trust": self.metagraph.T[self.uid].item(),
"miner_incentive": self.metagraph.I[self.uid].item(),
"miner_consensus": self.metagraph.C[self.uid].item(),
"miner_dividends": self.metagraph.D[self.uid].item(),
**extra_info,
}

Expand Down
3 changes: 1 addition & 2 deletions prompting/miners/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,5 +4,4 @@
from .phrase import PhraseMiner

# Real miners
from .hf_miner import HuggingFaceMiner
from .openai_miner import OpenAIMiner
from .openai_miner import OpenAIMiner
3 changes: 2 additions & 1 deletion prompting/miners/hf_miner.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,8 +28,9 @@

# import base miner class which takes care of most of the boilerplate
from prompting.base.prompting_miner import BaseStreamPromptingMiner
from deprecated import deprecated


@deprecated(version="2.4.1+", reason="Class is deprecated, use openai miner for reference on example miner.")
class HuggingFaceMiner(BaseStreamPromptingMiner):
"""
Base miner which runs zephyr (https://huggingface.co/HuggingFaceH4/zephyr-7b-beta)
Expand Down
169 changes: 169 additions & 0 deletions prompting/miners/langchain_miner.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,169 @@
# The MIT License (MIT)
# Copyright © 2024 Yuma Rao

# Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated
# documentation files (the “Software”), to deal in the Software without restriction, including without limitation
# the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software,
# and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

# The above copyright notice and this permission notice shall be included in all copies or substantial portions of
# the Software.

# THE SOFTWARE IS PROVIDED “AS IS”, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO
# THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
# OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
# DEALINGS IN THE SOFTWARE.

import time
import os
import bittensor as bt
import argparse
from starlette.types import Send
from functools import partial
from typing import Dict, Awaitable

# Bittensor Miner Template:
from prompting.base.prompting_miner import BaseStreamPromptingMiner
from prompting.protocol import StreamPromptingSynapse

# import base miner class which takes care of most of the boilerplate

from prompting.miners.utils import OpenAIUtils

from langchain.prompts import ChatPromptTemplate
from langchain_core.output_parsers import StrOutputParser
from langchain.chat_models import ChatOpenAI
from dotenv import load_dotenv, find_dotenv
from langchain_core.runnables.base import RunnableSequence
from deprecated import deprecated

@deprecated(version="2.4.1+", reason="Class is deprecated, use openai miner for reference on example miner.")
class LangchainMiner(BaseStreamPromptingMiner, OpenAIUtils):
    """Langchain-based miner which uses OpenAI's API as the LLM.

    This miner does not use any tools or external APIs when processing
    requests - it relies entirely on the model's own representation and world
    model. In some cases, this can produce lower quality results.

    You should also install the dependencies for this miner, which can be
    found in the requirements.txt file in this directory.
    """

    @classmethod
    def add_args(cls, parser: argparse.ArgumentParser):
        """Register command line arguments by delegating to the parent classes.

        No miner-specific arguments are added here.
        """
        super().add_args(parser)

    def __init__(self, config=None):
        """Build the chat model from the neuron config and the environment.

        The OpenAI key is read from the ``OPENAI_API_KEY`` environment
        variable after loading the nearest ``.env`` file, if one is found.
        """
        super().__init__(config=config)

        bt.logging.info(f"Initializing with model {self.config.neuron.model_id}...")

        if self.config.wandb.on:
            # NOTE(review): the tag reads "openai_miner" although this is the
            # langchain miner - confirm whether that is intentional.
            self.identity_tags = ("openai_miner",) + (self.config.neuron.model_id,)

        load_dotenv(find_dotenv())
        api_key = os.environ.get("OPENAI_API_KEY")

        # Set openai key and other args
        self.model = ChatOpenAI(
            api_key=api_key,
            model_name=self.config.neuron.model_id,
            max_tokens=self.config.neuron.max_tokens,
            temperature=self.config.neuron.temperature,
        )

        self.system_prompt = self.config.neuron.system_prompt
        self.accumulated_total_tokens = 0
        self.accumulated_prompt_tokens = 0
        self.accumulated_completion_tokens = 0
        self.accumulated_total_cost = 0

    def forward(self, synapse: StreamPromptingSynapse) -> Awaitable:
        """Stream the model's answer to the last message of ``synapse``.

        Args:
            synapse: Incoming request; its last role/message pair is used as
                the user input and ``synapse.timeout`` bounds the streaming.

        Returns:
            The streaming response created by
            ``synapse.create_streaming_response`` around the token streamer.
        """

        async def _forward(
            self,
            message: str,
            init_time: float,
            timeout_threshold: float,
            chain: RunnableSequence,
            chain_formatter: Dict[str, str],
            send: Send,
        ):
            buffer = []
            # Every chunk handed to `send`, and the seconds elapsed since
            # `init_time` when it was produced (used for wandb logging).
            accumulated_chunks = []
            accumulated_chunks_timings = []
            timeout_reached = False

            try:
                # Langchain built in streaming. 'astream' also available for async
                for token in chain.stream(chain_formatter):
                    buffer.append(token)

                    if time.time() - init_time > timeout_threshold:
                        bt.logging.debug("⏰ Timeout reached, stopping streaming")
                        timeout_reached = True
                        break

                    if len(buffer) == self.config.neuron.streaming_batch_size:
                        joined_buffer = "".join(buffer)
                        accumulated_chunks.append(joined_buffer)
                        accumulated_chunks_timings.append(time.time() - init_time)
                        bt.logging.debug(f"Streamed tokens: {joined_buffer}")

                        await send(
                            {
                                "type": "http.response.body",
                                "body": joined_buffer.encode("utf-8"),
                                "more_body": True,
                            }
                        )
                        buffer = []

                # Don't send the last buffer of data if timeout.
                if buffer and not timeout_reached:
                    joined_buffer = "".join(buffer)
                    # Record the tail as well, otherwise the logged completion
                    # is missing everything after the last full batch.
                    accumulated_chunks.append(joined_buffer)
                    accumulated_chunks_timings.append(time.time() - init_time)
                    await send(
                        {
                            "type": "http.response.body",
                            "body": joined_buffer.encode("utf-8"),
                            "more_body": False,
                        }
                    )

            except Exception as e:
                bt.logging.error(f"Error in forward: {e}")
                if self.config.neuron.stop_on_forward_exception:
                    self.should_exit = True

            finally:
                synapse_latency = time.time() - init_time
                if self.config.wandb.on:
                    # Matches the current `log_event` signature, which takes
                    # the synapse, the messages and the streamed chunks
                    # instead of prompt/completion/system_prompt.
                    self.log_event(
                        synapse=synapse,
                        timing=synapse_latency,
                        messages=synapse.messages,
                        accumulated_chunks=accumulated_chunks,
                        accumulated_chunks_timings=accumulated_chunks_timings,
                        extra_info={"system_prompt": self.system_prompt},
                    )

        bt.logging.debug(f"📧 Message received, forwarding synapse: {synapse}")

        prompt = ChatPromptTemplate.from_messages(
            [("system", self.system_prompt), ("user", "{input}")]
        )
        chain = prompt | self.model | StrOutputParser()

        role = synapse.roles[-1]
        message = synapse.messages[-1]

        chain_formatter = {"role": role, "input": message}

        init_time = time.time()
        timeout_threshold = synapse.timeout

        # `send` is supplied later by the streaming response; everything else
        # is bound now.
        token_streamer = partial(
            _forward,
            self,
            message,
            init_time,
            timeout_threshold,
            chain,
            chain_formatter,
        )
        return synapse.create_streaming_response(token_streamer)
Loading