|
| 1 | +from transformers import AutoTokenizer |
| 2 | +import transformers |
| 3 | +import torch |
| 4 | +import re |
| 5 | +import json |
| 6 | +import csv |
| 7 | +import templates |
| 8 | +import subprocess |
| 9 | + |
# Hugging Face model id for the chat-tuned Llama-2 7B checkpoint.
model = "meta-llama/Llama-2-7b-chat-hf"

# Dataset of evaluation samples loaded below (context/question/label records).
JSON_filename = 'PARARULE_plus_step2_People_sample.json'
# Scratch file the generated pyDatalog code is written to before execution.
PY_filename = 'pyDatalog_processing.py'
| 14 | + |
| 15 | + |
def remove_spaces(text):
    """Collapse runs of spaces to one and trim space padding from every line."""
    collapsed = re.sub(r' {2,}', ' ', text)
    # (?m) makes ^/$ match at each line, same as flags=re.MULTILINE.
    return re.sub(r'(?m)^ +| +$', '', collapsed)
| 22 | + |
# Prompt templates keyed by experiment name. remove_spaces() lets the
# triple-quoted literal stay readable here while the prompt sent to the
# model is compact. Fix: a stray fullwidth ideographic comma "、" left
# over in the first sentence was being sent to the model verbatim.
template = {
    "Llama2_baseline": remove_spaces("""Based on the closed world assumption, please help me complete a multi-step logical reasoning task (judge true or not). Please help me answer whether the question is correct or not based on the facts and rules formed by these natural language propositions.
    You should just return me one number as the final answer (1 for true and 0 for wrong) and providing reasoning process simply. The Propositions and Questions are as follows: \n""")
}
| 27 | + |
# Load the tokenizer for the chat model and build a half-precision
# text-generation pipeline, letting accelerate place layers across
# the available devices.
tokenizer = AutoTokenizer.from_pretrained(model)
_pipeline_kwargs = dict(
    model=model,
    torch_dtype=torch.float16,
    device_map="auto",
)
pipeline = transformers.pipeline("text-generation", **_pipeline_kwargs)
| 35 | + |
def extract_string(input_string):
    """Extract the code span from the first 'import' through the last ')'.

    Returns the stripped substring, or None when either boundary is absent.
    """
    start = input_string.find('import')
    if start == -1:
        return None
    end = input_string.rfind(')', start)
    if end == -1:
        return None
    return input_string[start:end + 1].strip()
| 48 | + |
| 49 | + |
def batch_process(text):
    """Generate one sampled completion for *text* and return its full text."""
    completions = pipeline(
        text,
        do_sample=True,
        top_k=10,
        num_return_sequences=1,
        eos_token_id=tokenizer.eos_token_id,
        max_length=2048,
    )
    first = completions[0]
    return first['generated_text']
| 60 | + |
| 61 | + |
# All eight evaluation splits: Animal then People, reasoning depths 2-5.
json_files = [
    f"../PARARULE_plus_step{depth}_{domain}_sample.json"
    for domain in ("Animal", "People")
    for depth in range(2, 6)
]
| 73 | + |
# Load the evaluation samples once at module level.
with open(JSON_filename) as sample_file:
    data = json.load(sample_file)
| 76 | + |
| 77 | + |
| 78 | +# # Open the CSV file for writing |
| 79 | +# with open("Llama2-7B-ChatLogic.csv", "w", newline="", encoding="utf-8") as csv_file: |
| 80 | +# csv_writer = csv.writer(csv_file) |
| 81 | +# csv_writer.writerow(["step", "return", "label"]) # Write header |
| 82 | +# |
| 83 | +# for json_file in json_files: |
| 84 | +# step = '_'.join(json_file.split("_")[2:4]) |
| 85 | +# with open(json_file, "r", encoding="utf-8") as f: |
| 86 | +# data = json.load(f) |
| 87 | +# for entry in data: |
| 88 | +# context = entry["context"] |
| 89 | +# question = entry["question"] |
| 90 | +# label = entry["label"] |
| 91 | +# # Replace this with your actual function call |
| 92 | +# responses = batch_process(f"Instructions: ```{template['Llama2_baseline']}```Propositions: ```{context}```\nQuestion: ```{question}```") |
| 93 | +# |
| 94 | +# csv_writer.writerow([step, responses, label]) |
| 95 | + |
correct_num = 0  # number of samples whose executed answer matches the gold label


def _write_and_run(code_text):
    """Write *code_text* to PY_filename and execute it, returning its stdout.

    Raises subprocess.CalledProcessError when the generated script exits
    non-zero (caught by the best-effort handler in the main loop).
    """
    with open(PY_filename, 'w') as script_file:
        script_file.write("{}".format(code_text))
    return subprocess.check_output(['python', PY_filename], universal_newlines=True)


def _repair_until_valid(code_text, output, max_attempts=3):
    """Ask the LLM to repair *code_text* until its output is '0' or '1'.

    Re-runs the rewritten script after each repair round; gives up after
    *max_attempts* rounds and returns the last (code_text, output) pair.
    """
    attempts = 0
    while output.strip() not in ('0', '1'):
        code_text = extract_string(batch_process(f"""{templates.templates['adjustment_agent']}, and here is the generated code: {code_text}, and the error message: {output}"""))
        print("reprocessing...")
        output = _write_and_run(code_text)
        print("New output:" + output)
        attempts += 1
        if attempts == max_attempts:
            break
    return code_text, output


# NOTE(review): range(0, 1) evaluates only the first sample — presumably a
# debugging limit; widen to range(len(data)) for a full run.
for i in range(0, 1):
    try:
        # Step 1: translate the propositions + question into pyDatalog code.
        result_string = extract_string(batch_process(f"""{templates.templates['agent_engineer']}, Here are the propositions: {data[i]['context']} and the Question:{data[i]['question']},
        {templates.templates['no_extra_content']}"""))

        # Step 2: translate the generated code back into natural language.
        propositions_generated = batch_process(f"""{templates.templates["agent_engineer_neg"]}, and the following is the generated code: {result_string}""")

        # Step 3: compare the round-tripped propositions with the originals
        # (zero-shot chain-of-thought), then condense the verdict to 0/1.
        tag = batch_process(f"""{templates.templates['check_error_part1']}, and the original Propositions:{data[i]['context']}, and Question:{data[i]['question']}, the generated Propositions and Questions: {propositions_generated}""")
        tag_final = batch_process(f"""{templates.templates['check_error_part2']}, the following is the analysis processing: {tag}""")

        if "1" in tag_final:
            # Round-trip check passed: execute the generated code as-is.
            output = _write_and_run(result_string)
        else:
            print("enter the regeneration part")
            # Check failed: regenerate the code using the reported differences.
            result_string = extract_string(batch_process(f"""{templates.templates['regeneration']},The original propositions are:{data[i]['context']}, and Question:{data[i]['question']}, and the following is the generated code: {result_string}, and the differences: {tag_final}"""))
            output = _write_and_run(result_string)

        # Self-repair loop shared by both branches (previously duplicated verbatim).
        result_string, output = _repair_until_valid(result_string, output)

        # Bug fix: the original incremented correct_num whenever the output
        # was *invalid* (neither '0' nor '1') and then crashed on int(),
        # silently counting failed runs as correct. Only a valid answer that
        # matches the gold label counts now.
        answer = output.strip()
        if answer in ('0', '1') and int(answer) == data[i]['label']:
            correct_num += 1
    except Exception:
        # Best-effort evaluation: any failure (LLM call, file write,
        # subprocess error) skips this sample rather than aborting the run.
        continue
print(correct_num)
0 commit comments