Spaces:

Dovakiins
/

qwerrwe

Build error

winglian commited on Mar 5, 2024

Commit

2598c9f

unverified ·

1 Parent(s): decb66e

allow the sharegpt handler to also better handle datasets destined for openai finetuning (#1361)

* allow the sharegpt handler to also better handle datasets destined for openai finetuning

* make sure to support system role

Files changed (1) hide show

src/axolotl/prompt_strategies/sharegpt.py CHANGED Viewed

@@ -82,7 +82,7 @@ class SimpleShareGPTPromptTokenizingStrategy(ShareGPTPromptTokenizingStrategy):
     basic sharegpt strategy to grab conversations from the sample row
     """
-    _strict = True
     @property
     def strict(self):
@@ -96,10 +96,25 @@ class SimpleShareGPTPromptTokenizingStrategy(ShareGPTPromptTokenizingStrategy):
         conversations = prompt["conversations"]
         if self.strict:
             return conversations
-        # remap roles - allow for assistant turn
-        role_map = {"human": "human", "assistant": "gpt", "gpt": "gpt"}
         turns = [
-            {"from": role_map[t["from"]], "value": t["value"]} for t in conversations
         ]
         return turns

     basic sharegpt strategy to grab conversations from the sample row
     """
+    _strict = False
     @property
     def strict(self):
         conversations = prompt["conversations"]
         if self.strict:
             return conversations
+        role_key = "from"
+        if "role" in conversations[0].keys():
+            role_key = "role"
+        value_key = "value"
+        if "text" in conversations[0].keys():
+            value_key = "text"
+        elif "content" in conversations[0].keys():
+            value_key = "content"
+        # remap roles - allow for assistant turn"
+        role_map = {
+            "user": "human",
+            "human": "human",
+            "assistant": "gpt",
+            "gpt": "gpt",
+            "system": "system",
+        }
         turns = [
+            {"from": role_map[t[role_key]], "value": t[value_key]}
+            for t in conversations
         ]
         return turns