Selaa lähdekoodia

Change model to llama3.1 and add system message support to convert.py

kevin 1 vuosi sitten
vanhempi
commit
4e67618bd7
2 muutettua tiedostoa jossa 16 lisäystä ja 8 poistoa
  1. 10 5
      convert.py
  2. 6 3
      main.py

+ 10 - 5
convert.py

@@ -2,9 +2,14 @@ import pandas as pd
 import json
 import jsonlines
 from io import BytesIO, StringIO
-def alpaca_to_chatgpt(jsf):
+
+
+def alpaca_to_chatgpt(jsf, sys_m=None):
     res = []
-    SYSTEM_MESSAGE = "Please respond professionally and in a friendly manner, using the same language as the original request."
+    if sys_m is not None:
+        SYSTEM_MESSAGE = sys_m
+    else:
+        SYSTEM_MESSAGE = "Please respond professionally and in a friendly manner, using the same language as the original request."
     js = None
     if isinstance(jsf, str):
         js = json.loads(jsf)
@@ -27,9 +32,9 @@ def alpaca_to_chatgpt(jsf):
         writer.write(j)
     return fp
 
-def csv_to_jsonl(csvf):
+
+def csv_to_jsonl(csvf, sys_m=None):
     df = pd.read_csv(BytesIO(csvf))
     df.fillna("", inplace=True)
     json_string = df.to_json(orient="records")
-    return alpaca_to_chatgpt(json_string)
-
+    return alpaca_to_chatgpt(json_string, sys_m)

+ 6 - 3
main.py

@@ -380,18 +380,21 @@ def gpt():
 @app.route('/train', methods=['POST'])
 def train():
     prev_model = "gpt-3.5-turbo"
+    instructions = None
     if 'job_id' in request.form:
         return train_with_id(job_id=request.form['job_id'])
     elif 'train_file' in request.files:
         train_file = request.files['train_file']
         app.logger.info({"filename": train_file.filename})
+        if 'instructions' in request.form:
+            instructions = request.form['instructions']
         openai_file = None
         if train_file.filename.split('.')[1] == 'jsonl':
             openai_file = train_file.stream.read()
         elif train_file.filename.split('.')[1] == 'csv':
-            openai_file = csv_to_jsonl(train_file.stream.read())
+            openai_file = csv_to_jsonl(train_file.stream.read(), instructions)
         elif train_file.filename.split('.')[1] == 'json':
-            openai_file = alpaca_to_chatgpt(train_file)
+            openai_file = alpaca_to_chatgpt(train_file, instructions)
         if 'prev_model' in request.form:
             prev_model = request.form['prev_model']
         app.logger.info(f"Previous model: {prev_model}")
@@ -596,7 +599,7 @@ def llama():
     content = content + " Jawab dengan Bahasa Indonesia"
     try:
         json_request = {
-            "model": "llama3",
+            "model": "llama3.1",
             "prompt": content,
             "stream": False
         }