Spaces:

macrocosm-os
/

prompting-dashboard

Sleeping

App Files Files Community

steffenc commited on Apr 4, 2024

Commit

82b3169

1 Parent(s): 2e2d80e

Add server

Browse files

Files changed (1) hide show

server.py +243 -0

server.py ADDED Viewed

	@@ -0,0 +1,243 @@

+import os
+import re
+import asyncio
+import json
+import traceback
+import bittensor as bt
+from collections import Counter
+from neurons.validator import Validator
+from prompting.dendrite import DendriteResponseEvent
+from prompting.protocol import PromptingSynapse
+from prompting.utils.uids import get_random_uids
+from prompting.rewards import DateRewardModel, FloatDiffModel
+from aiohttp import web
+from aiohttp.web_response import Response
+"""
+# test
+```
+curl -X POST http://0.0.0.0:10000/chat/ -H "api_key: hello" -d '{"k": 5, "timeout": 3, "roles": ["user"], "messages": ["hello world"]}'
+curl -X POST http://0.0.0.0:10000/chat/ -H "api_key: hey-michal" -d '{"k": 5, "timeout": 3, "roles": ["user"], "messages": ["on what exact date did the 21st century begin?"]}'
+```
+TROUBLESHOOT
+check if port is open
+```
+sudo ufw allow 10000/tcp
+sudo ufw allow 10000/tcp
+```
+# run
+```
+EXPECTED_ACCESS_KEY="hey-michal" pm2 start app.py --interpreter python3 --name app -- --neuron.model_id mock --wallet.name sn1 --wallet.hotkey v1 --netuid 1 --neuron.tasks math --neuron.task_p 1 --neuron.device cpu
+```
+"""
+EXPECTED_ACCESS_KEY = os.environ.get('EXPECTED_ACCESS_KEY')
+validator = None
+reward_models = {
+    'date_qa': DateRewardModel(),
+    'math': FloatDiffModel(),
+}
+def completion_is_valid(completion: str):
+    """
+    Get the completion statuses from the completions.
+    """
+    patt = re.compile(r'I\'m sorry|unable to|I cannot|I can\'t|I am unable|I am sorry|I can not|don\'t know|not sure|don\'t understand')
+    if not len(re.findall(r'\w+',completion)) or patt.search(completion):
+        return False
+    return True
+def ensemble_result(completions: list, task_name: str, prefer: str = 'longest'):
+    """
+    Ensemble completions from multiple models.
+    # TODO: Measure agreement
+    # TODO: Figure out how to mitigate the cabal effect (large groups will appear to be more credible)
+    # TODO: Reward pipeline
+    """
+    if not completions:
+        return None
+    answer = None
+    if task_name in ('qa', 'summarization'):
+        # No special handling for QA or summarization
+        supporting_completions = completions
+    elif task_name == 'date_qa':
+        # filter the completions to be the ones that contain valid dates and if there are multiple dates, select the most common one (with support > 1)
+        dates = list(map(reward_models[task_name].parse_dates_from_text, completions))
+        bt.logging.info(f"Unprocessed dates: {dates}")
+        valid_date_indices = [i for i, d in enumerate(dates) if d]
+        valid_completions = [completions[i] for i in valid_date_indices]
+        valid_dates = [dates[i] for i in valid_date_indices]
+        dates = [f"{d[0].strftime('%-d %B')} {d[1]}" for d in valid_dates]
+        if not dates:
+            return None
+        counter = Counter(dates)
+        most_common, count = counter.most_common()[0]
+        answer = most_common
+        if count == 1:
+            supporting_completions = valid_completions
+        else:
+            supporting_completions = [c for i, c in enumerate(valid_completions) if dates[i]==most_common]
+    elif task_name == 'math':
+        # filter the completions to be the ones that contain valid numbers and if there are multiple values, select the most common one (with support > 1)
+        # TODO: use the median instead of the most common value
+        vals = list(map(reward_models[task_name].extract_number, completions))
+        vals = [val for val in vals if val]
+        if not vals:
+            return None
+        most_common, count = Counter(dates).most_common()[0]
+        bt.logging.info(f"Most common value: {most_common}, count: {count}")
+        answer = most_common
+        if count == 1:
+            supporting_completions = completions
+        else:
+            supporting_completions = [c for i, c in enumerate(completions) if vals[i]==most_common]
+    bt.logging.info(f"Supporting completions: {supporting_completions}")
+    if prefer == 'longest':
+        preferred_completion = sorted(supporting_completions, key=len)[-1]
+    elif prefer == 'shortest':
+        preferred_completion = sorted(supporting_completions, key=len)[0]
+    elif prefer == 'most_common':
+        preferred_completion = max(set(supporting_completions), key=supporting_completions.count)
+    else:
+        raise ValueError(f"Unknown ensemble preference: {prefer}")
+    return {
+        'completion': preferred_completion,
+        'accepted_answer': answer,
+        'support': len(supporting_completions),
+        'support_indices': [completions.index(c) for c in supporting_completions],
+        'method': f'Selected the {prefer.replace("_", " ")} completion'
+    }
+def guess_task_name(challenge: str):
+    categories = {
+        'summarization': re.compile('summar|quick rundown|overview'),
+        'date_qa': re.compile('exact date|tell me when|on what date|on what day|was born?|died?'),
+        'math': re.compile('math|solve|solution| sum |problem|geometric|vector|calculate|degrees|decimal|factorial'),
+    }
+    for task_name, patt in categories.items():
+        if patt.search(challenge):
+            return task_name
+    return 'qa'
+async def chat(request: web.Request) -> Response:
+    """
+    Chat endpoint for the validator.
+    Required headers:
+    - api_key: The access key for the validator.
+    Required body:
+    - roles: The list of roles to query.
+    - messages: The list of messages to query.
+    Optional body:
+    - k: The number of nodes to query.
+    - exclude: The list of nodes to exclude from the query.
+    - timeout: The timeout for the query.
+    """
+    bt.logging.info(f'chat()')
+    # Check access key
+    access_key = request.headers.get("api_key")
+    if EXPECTED_ACCESS_KEY is not None and access_key != EXPECTED_ACCESS_KEY:
+        bt.logging.error(f'Invalid access key: {access_key}')
+        return Response(status=401, reason="Invalid access key")
+    try:
+        request_data = await request.json()
+    except ValueError:
+        bt.logging.error(f'Invalid request data: {request_data}')
+        return Response(status=400)
+    bt.logging.info(f'Request data: {request_data}')
+    k = request_data.get('k', 10)
+    exclude = request_data.get('exclude', [])
+    timeout = request_data.get('timeout', 10)
+    prefer = request_data.get('prefer', 'longest')
+    try:
+        # Guess the task name of current request
+        task_name = guess_task_name(request_data['messages'][-1])
+        # Get the list of uids to query for this step.
+        uids = get_random_uids(validator, k=k, exclude=exclude or []).to(validator.device)
+        axons = [validator.metagraph.axons[uid] for uid in uids]
+        # Make calls to the network with the prompt.
+        bt.logging.info(f'Calling dendrite')
+        responses = await validator.dendrite(
+            axons=axons,
+            synapse=PromptingSynapse(roles=request_data['roles'], messages=request_data['messages']),
+            timeout=timeout,
+        )
+        bt.logging.info(f"Creating DendriteResponseEvent:\n {responses}")
+        # Encapsulate the responses in a response event (dataclass)
+        response_event = DendriteResponseEvent(responses, uids)
+        # convert dict to json
+        response = response_event.__state_dict__()
+        response['completion_is_valid'] = valid = list(map(completion_is_valid, response['completions']))
+        valid_completions = [response['completions'][i] for i, v in enumerate(valid) if v]
+        response['task_name'] = task_name
+        response['ensemble_result'] = ensemble_result(valid_completions, task_name=task_name, prefer=prefer)
+        bt.logging.info(f"Response:\n {response}")
+        return Response(status=200, reason="I can't believe it's not butter!", text=json.dumps(response))
+    except Exception:
+        bt.logging.error(f'Encountered in {chat.__name__}:\n{traceback.format_exc()}')
+        return Response(status=500, reason="Internal error")
+class ValidatorApplication(web.Application):
+    def __init__(self, *a, **kw):
+        super().__init__(*a, **kw)
+        # TODO: Enable rewarding and other features
+validator_app = ValidatorApplication()
+validator_app.add_routes([web.post('/chat/', chat)])
+bt.logging.info("Starting validator application.")
+bt.logging.info(validator_app)
+def main(run_aio_app=True, test=False) -> None:
+    loop = asyncio.get_event_loop()
+    # port = validator.metagraph.axons[validator.uid].port
+    port = 10000
+    if run_aio_app:
+        try:
+            web.run_app(validator_app, port=port, loop=loop)
+        except KeyboardInterrupt:
+            bt.logging.info("Keyboard interrupt detected. Exiting validator.")
+        finally:
+            pass
+if __name__ == "__main__":
+    validator = Validator()
+    main()