Update app.py
app.py CHANGED

@@ -14,6 +14,9 @@ intents.messages = True
 # Set up the inference API client
 hf_client = InferenceClient("meta-llama/Meta-Llama-3-70B-Instruct", token=os.getenv("HF_TOKEN"))
 
+# Variable that stores the conversation history
+conversation_history = []
+
 class MyClient(discord.Client):
     def __init__(self, *args, **kwargs):
         super().__init__(*args, **kwargs)
@@ -26,7 +29,7 @@ class MyClient(discord.Client):
             logging.info('Ignoring my own message.')
             return
 
-        logging.debug(f'Receiving message: {message.content}')
+        logging.debug(f'Receiving message: {message.content}')
         response = await generate_response(message.content)
         await message.channel.send(response)
 
@@ -40,22 +43,25 @@ async def generate_response(user_input):
     You must answer in Korean.
     """
 
-    #
-
-
+    # Manage the conversation history
+    global conversation_history
+    conversation_history.append({"role": "user", "content": user_input})
+
+    messages = [{"role": "system", "content": f"{system_prefix} {system_message}"}] + conversation_history
 
     # Use a wrapper to run the synchronous call asynchronously; changed to stream=True
     loop = asyncio.get_event_loop()
     response = await loop.run_in_executor(None, lambda: hf_client.chat_completion(
-        messages, max_tokens=200, stream=True, temperature=0.9, top_p=0.9))
+        messages, max_tokens=200, stream=True, temperature=0.9, top_p=0.9))
 
     # Logic added to handle the streaming response
     full_response = ""
     for part in response:
         full_response += part.choices[0].delta.content.strip()
 
-
+    conversation_history.append({"role": "assistant", "content": full_response})
 
+    logging.debug(f'Model response: {full_response}')
     return full_response
 
 # Create and run the Discord bot instance
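For readers following the change outside the diff view, below is a minimal, self-contained sketch of the updated generate_response flow: append the user turn to the shared conversation_history, build the message list, run the blocking chat_completion call in an executor with stream=True, and accumulate the streamed deltas. The None-guard on delta.content and the MAX_HISTORY cap are illustrative assumptions and not part of this commit (the guard stands in for the .strip() call in the diff, which would raise on a None delta and also drops spacing between streamed tokens); system_message and system_prefix are placeholders for prompt strings defined elsewhere in app.py.

import asyncio
import logging
import os

from huggingface_hub import InferenceClient

hf_client = InferenceClient("meta-llama/Meta-Llama-3-70B-Instruct", token=os.getenv("HF_TOKEN"))

conversation_history = []
MAX_HISTORY = 20  # illustrative cap so the prompt does not grow without bound (not in the commit)

system_message = "..."  # placeholder for the system prompt defined elsewhere in app.py
system_prefix = "..."   # placeholder for the system prefix defined elsewhere in app.py

async def generate_response(user_input):
    global conversation_history
    conversation_history.append({"role": "user", "content": user_input})
    conversation_history = conversation_history[-MAX_HISTORY:]  # trim old turns (assumption)

    messages = [{"role": "system", "content": f"{system_prefix} {system_message}"}] + conversation_history

    # Offload the synchronous chat_completion call to a worker thread, as the commit does
    loop = asyncio.get_event_loop()
    response = await loop.run_in_executor(None, lambda: hf_client.chat_completion(
        messages, max_tokens=200, stream=True, temperature=0.9, top_p=0.9))

    # Collect the streamed deltas; the final chunk's delta.content can be None, hence the guard
    # (note: this loop still runs on the event loop, mirroring app.py)
    full_response = ""
    for part in response:
        delta = part.choices[0].delta.content
        if delta:
            full_response += delta

    conversation_history.append({"role": "assistant", "content": full_response})
    logging.debug(f'Model response: {full_response}')
    return full_response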
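The hunk headers mention intents.messages = True and class MyClient, but the surrounding bot wiring sits outside this diff. A hypothetical skeleton of that scaffolding, built from standard discord.py calls and the on_message body shown in the diff context, could look like this; the DISCORD_TOKEN variable name and the on_ready handler are assumptions, and generate_response is the coroutine modified by this commit.

import os
import logging
import discord

logging.basicConfig(level=logging.DEBUG)

# Intents as referenced in the first hunk header
intents = discord.Intents.default()
intents.messages = True

class MyClient(discord.Client):
    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)

    async def on_ready(self):
        # Assumption: a simple readiness log; not shown in the diff
        logging.info(f'Logged in as {self.user}')

    async def on_message(self, message):
        # Ignore the bot's own messages, as in the diff context above
        if message.author == self.user:
            logging.info('Ignoring my own message.')
            return

        logging.debug(f'Receiving message: {message.content}')
        response = await generate_response(message.content)
        await message.channel.send(response)

# Create and run the Discord bot instance
if __name__ == "__main__":
    client = MyClient(intents=intents)
    client.run(os.getenv("DISCORD_TOKEN"))  # token env var name is an assumption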