
Commit 555e427

Plotter fixes
1 parent e767409 commit 555e427

14 files changed (+205, -893 lines)

netconfeval/common/model_configs.py (+5)

@@ -118,6 +118,11 @@ def _build_mistral_lite_prompt(messages):
             'seed': 5000,
         }
     },
+    'gpt-3.5-0613': {
+        'model_name': 'gpt-3.5-turbo-0613',
+        'type': 'openai',
+        'args': {}
+    },
     'gpt-4': {
         'model_name': 'gpt-4',
         'type': 'openai',
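
The new entry mirrors the neighbouring OpenAI entries. As a rough sketch of how an 'openai'-type entry is typically consumed (assuming a LangChain-style chat wrapper; the actual dispatch lives elsewhere in netconfeval and may differ):

    # Hypothetical wiring, not the repository's code; requires OPENAI_API_KEY in the environment.
    from langchain.chat_models import ChatOpenAI

    entry = {
        'model_name': 'gpt-3.5-turbo-0613',
        'type': 'openai',
        'args': {},
    }

    if entry['type'] == 'openai':
        llm = ChatOpenAI(model_name=entry['model_name'], **entry['args'])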

netconfeval/foundation/langchain/chat_models/hf.py (+3, -1)

@@ -40,7 +40,7 @@ def _parse_chat_history(history: List[BaseMessage]) -> list[str]:
 class ChatHF(BaseChatModel):
     model_name: str
     max_length: int
-    temperature: float
+    temperature: float | None
     use_quantization: bool
     text_pipeline: Any
     prompt_func: Any
@@ -51,6 +51,8 @@ class ChatHF(BaseChatModel):
     # and then add it to the path For example: export LD_LIBRARY_PATH="/opt/cuda/11.8.0/targets/x86_64-linux/lib/:$LD_LIBRARY_PATH"
     # And then run `python -m bitsandbytes`
 
+    #TODO: add parameter, plot by model name
+
     def __init__(self, **kwargs: Any) -> None:
         super().__init__(**kwargs)
         self.model_name = kwargs.get('model_name', None)
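
Widening the annotation to float | None lets the wrapper represent "no temperature set" explicitly, so code that forwards it to the Hugging Face pipeline needs a None guard. A minimal self-contained sketch (the helper name and kwargs are assumptions, not the repository's code):

    from typing import Any, Optional

    def build_generate_kwargs(max_length: int, temperature: Optional[float]) -> dict[str, Any]:
        # Only enable sampling when a temperature was actually provided.
        kwargs: dict[str, Any] = {"max_length": max_length}
        if temperature is not None:
            kwargs["temperature"] = temperature
            kwargs["do_sample"] = True
        return kwargs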

netconfeval/step_1_formal_spec_conflict_detection.py (+2, -2)

@@ -69,7 +69,7 @@ def main(args: argparse.Namespace) -> None:
         os.path.abspath(
             os.path.join(
                 args.results_path,
-                f"log-{args.model}-{'_'.join(policy_types)}-conflict-{results_time}.log"
+                f"log-{args.model}{"-combined" if args.combined else ""}-{'_'.join(policy_types)}-conflict-{results_time}.log"
             )
         )
     )
@@ -100,7 +100,7 @@ def main(args: argparse.Namespace) -> None:
     max_n_requirements = max(args.batch_size) * n_policy_types
     w = None
 
-    filename = f"result-{args.model}-{'_'.join(policy_types)}-conflict-{results_time}.csv"
+    filename = f"result-{args.model}-{'_'.join(policy_types)}-conflict{"-combined" if args.combined else ""}-{results_time}.csv"
 
     with open(os.path.join(args.results_path, filename), 'w') as f:
         for it in range(0, args.n_runs):
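
Note: both added lines reuse double quotes inside a double-quoted f-string, which is only valid on Python 3.12+ (PEP 701) and is a SyntaxError on earlier interpreters. A version-agnostic spelling with the same behaviour, shown only as a sketch:

    def result_filename(model: str, policy_types: list[str], combined: bool, results_time: float) -> str:
        # Pre-3.12-compatible equivalent of the added f-string: no nested double quotes.
        combined_suffix = "-combined" if combined else ""
        return f"result-{model}-{'_'.join(policy_types)}-conflict{combined_suffix}-{results_time}.csv"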

netconfeval/step_1_function_call.py (+1, -1)

@@ -139,7 +139,7 @@ def main(args: argparse.Namespace) -> None:
         os.path.abspath(
             os.path.join(
                 args.results_path,
-                f"log-{args.model}-{'_'.join(policy_types)}-function_{'adhoc' if args.adhoc else 'native'}-{results_time}.log"
+                f"log-{args.model}-{'adhoc' if args.adhoc else 'native'}-{'_'.join(policy_types)}-function-{results_time}.log"
             )
         )
     )

plots/step_1_graph_conflict.py renamed to plot/step_1_plot_formal_spec_conflict_detection.py (+38, -10)

@@ -13,25 +13,53 @@
 import matplotlib.pyplot as plt
 import numpy as np
 from sortedcontainers import SortedSet
-from src.utils import strtobool
+# TODO: change the location of "combined" in experiments
+# TODO: add model_selection
+
+def strtobool(val: str) -> bool:
+    """Convert a string representation of truth to true or false.
+
+    Args:
+        val (str): The value to convert. True values are 'y', 'yes', 't', 'true', 'on', and '1';
+            false values are 'n', 'no', 'f', 'false', 'off', and '0'.
+
+    Returns:
+        bool: The value converted to bool.
+
+    Raises:
+        ValueError: If the specified value is not a valid representation of truth.
+    """
+    val = val.lower()
+    if val in ('y', 'yes', 't', 'true', 'on', '1'):
+        return True
+    elif val in ('n', 'no', 'f', 'false', 'off', '0'):
+        return False
+    else:
+        raise ValueError(f"Invalid truth value `{val}`.")
+
 
 model2plot = {
-    "gpt-4-turbo": {
+    "gpt-4-1106": {
         "label": "GPT-4-Turbo",
         "color": "#377eb8",
         "marker": "o"
     },
-    "gpt-4": {
+    "gpt-4-": {
         "label": "GPT-4",
-        "color": "#e41a1c",
+        "color": "#a65628",
         "marker": "s"
     },
-    "gpt-3.5-turbo": {
+    "gpt-3.5-0613": {
         "label": "GPT-3.5-Turbo",
-        "color": "#4daf4a",
+        "color": "#984ea3",
         "marker": ">"
     },
-    "gpt-4-combined": {
+    # "gpt-4-turbo-function": {
+    #     "label": "gpt-4-turbo-function",
+    #     "color": "#e41a1c",
+    #     "marker": "1"
+    # },
+    "gpt-4-1106-combined": {
         "label": "GPT-4 (Combined)",
         "color": "#984ea3",
         "marker": "<"
@@ -141,7 +169,7 @@ def plot_by_requirements(results_path: str, figures_path: str, requirements: Sor
     model_list = model2plot.keys()
     for model_name in model_list:
         results_files_list = glob.glob(
-            os.path.join(".", results_path, f"result-{model_name}-{requirements_str}-conflict-*.csv"))
+            os.path.join("../", results_path, f"result-{model_name}-{requirements_str}-conflict-*.csv"))
 
         if len(results_files_list) == 0:
             continue
@@ -158,7 +186,7 @@ def plot_by_requirements(results_path: str, figures_path: str, requirements: Sor
         print(model2result[model_name]["accuracy"], model2result[model_name]["precision"],
               model2result[model_name]["recall"], model2result[model_name]["f1_score"])
 
-    base_figures_path = os.path.join(".", figures_path)
+    base_figures_path = os.path.join(figures_path)
     os.makedirs(base_figures_path, exist_ok=True)
 
     for param in ["accuracy", "precision", "recall", "f1_score"]:
@@ -220,4 +248,4 @@ def main(args: argparse.Namespace) -> None:
 
 
 if __name__ == "__main__":
-    main(parse_args())
+    main(parse_args())
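
Inlining strtobool removes the import from src.utils, presumably so the renamed script runs standalone from plot/. A typical (assumed) use is as an argparse type converter for boolean flags; the flag name below is hypothetical:

    import argparse

    parser = argparse.ArgumentParser()
    parser.add_argument('--combined', type=strtobool, default=False)   # uses the strtobool defined above
    print(parser.parse_args(['--combined', 'yes']))                    # Namespace(combined=True)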

plots/step_1_heat_map.py renamed to plot/step_1_plot_formal_spec_conflict_heatmap.py (+30, -10)

@@ -1,10 +1,14 @@
+import argparse
 import csv
+import glob
 
 import matplotlib
 import numpy as np
 import seaborn as sns
 from matplotlib import pyplot as plt
-
+import sys
+import os
+sys.path.append(os.path.join(os.path.dirname(os.path.abspath(__file__)), ".."))
 
 
 def heatmap(data_loc: str, fig_path: str) -> None:
     results = [[0] * 34 for i in range(34)]
@@ -50,17 +54,33 @@ def heatmap(data_loc: str, fig_path: str) -> None:
     fig.savefig(fig_path, format="pdf", bbox_inches='tight')
 
 
-if __name__ == "__main__":
+def main(args: argparse.Namespace) -> None:
     matplotlib.rc('font', size=10)
     matplotlib.rcParams['hatch.linewidth'] = 0.3
     matplotlib.rcParams['pdf.fonttype'] = 42
     matplotlib.rcParams['ps.fonttype'] = 42
 
-    heatmap(
-        "evaluation/result_conflict/result_distance/result-gpt-3.5-turbo-loadbalancing_reachability_waypoint-conflict-1700742765.7879624.csv",
-        "evaluation/result_conflict/result_distance/heatmap-gpt-3.5.pdf"
-    )
-    heatmap(
-        "evaluation/result_conflict/result_distance/result-gpt-4-turbo-loadbalancing_reachability_waypoint-conflict-1700747740.0543778.csv",
-        "evaluation/result_conflict/result_distance/heatmap-gpt-4.pdf"
-    )
+    results_files_list = glob.glob(os.path.join("../", args.results_path, f"*.csv"))
+    base_figures_path = os.path.join("../plot", args.figures_path)
+    os.makedirs(base_figures_path, exist_ok=True)
+
+    for file in results_files_list:
+        heatmap(
+            file,
+            os.path.join(base_figures_path, "heatmap-gpt-3.5.pdf")
+        )
+    # heatmap(
+    #     "evaluation/result_conflict/result_distance/result-gpt-4-turbo-loadbalancing_reachability_waypoint-conflict-1700747740.0543778.csv",
+    #     "evaluation/result_conflict/result_distance/heatmap-gpt-4.pdf"
+    # )
+
+
+def parse_args() -> argparse.Namespace:
+    parser = argparse.ArgumentParser()
+    parser.add_argument('--results_path', type=str, required=False, default="result")
+    parser.add_argument('--figures_path', type=str, required=True)
+
+    return parser.parse_args()
+
+
+if __name__ == "__main__":
+    main(parse_args())
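
With the new CLI, every CSV found under ../<results_path> is rendered, although as committed each iteration writes to the same heatmap-gpt-3.5.pdf path. The relative paths assume the script is launched from inside plot/; a small illustration of how the two arguments resolve (the --figures_path value is hypothetical):

    import os

    results_path = "result"               # argparse default above
    figures_path = "figures_conflict"     # hypothetical --figures_path value
    print(os.path.join("../", results_path, "*.csv"))   # ../result/*.csv
    print(os.path.join("../plot", figures_path))        # ../plot/figures_conflict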

plots/step_1_graph_model_compare_ad_hoc.py renamed to plot/step_1_plot_formal_spec_translation.py (+50, -38)

@@ -10,34 +10,6 @@
 import numpy as np
 from sortedcontainers import SortedSet
 
-model2plot = {
-    # "gpt-3.5-finetuned": {
-    #     "label": "GPT-3.5-FT",
-    #     "color": "#a65628",
-    #     "marker": "s"
-    # },
-    "gpt-3.5-1106-function": {
-        "label": "GPT-3.5-function",
-        "color": "#984ea3",
-        "marker": ">"
-    },
-    "gpt-4-turbo-function": {
-        "label": "gpt-4-turbo-function",
-        "color": "#e41a1c",
-        "marker": "1"
-    },
-    # "gpt-4": {
-    #     "label": "GPT-4",
-    #     "color": "#ffff33",
-    #     "marker": "+"
-    # },
-    "codellama-7b-instruct": {
-        "label": "CL-7B-Instruct",
-        "color": "#ff7f00",
-        "marker": "<"
-    },
-}
-
 
 def extract_result(file_path: str, model_name: str) -> (dict, dict):
     average = {}
@@ -112,15 +84,15 @@ def extract_result(file_path: str, model_name: str) -> (dict, dict):
     return to_plot_accuracy, to_plot_cost
 
 
-def plot_by_requirements(results_path: str, figures_path: str, requirements: SortedSet) -> None:
+def plot_by_requirements(results_path: str, figures_path: str, requirements: SortedSet, model2plot) -> None:
+    # print(model2plot)
+    # exit()
     model2result = {}
     requirements_str = "_".join(requirements)
 
     for model_name in model2plot.keys():
-        # if include not in model_name or 'function' in model_name:
-        #     continue
 
-        results_files_list = glob.glob(os.path.join(".", results_path, f"result-{model_name}-ad-hoc-{requirements_str}-*.csv"))
+        results_files_list = glob.glob(os.path.join("../", results_path, f"result-{model_name}-{requirements_str}-*.csv"))
         if results_files_list:
             results_file = results_files_list.pop()
@@ -130,7 +102,7 @@ def plot_by_requirements(results_path: str, figures_path: str, requirements: Sor
             model2result[model_name]["accuracy"], model2result[model_name]["cost"] = extract_result(results_file,
                                                                                                      model_name)
 
-    base_figures_path = os.path.join(".", figures_path)
+    base_figures_path = os.path.join("../plot", figures_path)
     os.makedirs(base_figures_path, exist_ok=True)
 
     # Accuracy
@@ -161,6 +133,9 @@ def plot_by_requirements(results_path: str, figures_path: str, requirements: Sor
     plt.ylim([-0.1, 1.2])
     plt.yticks(np.arange(0, 1.2, 0.25))
     plt.xscale('log', base=10)
+
+    # print(model2result)
+    # exit()
     x_ticks = list(model2result.values())[0]["accuracy"]["x"]
     plt.xticks(x_ticks)
     ax.xaxis.set_major_formatter(matplotlib.ticker.ScalarFormatter())
@@ -215,7 +190,7 @@ def parse_args() -> argparse.Namespace:
     parser = argparse.ArgumentParser()
     parser.add_argument('--results_path', type=str, required=False, default="result")
    parser.add_argument('--figures_path', type=str, required=True)
-    # parser.add_argument('--include', type=str, choices=['gpt', 'codellama'])
+    parser.add_argument("--models", type=str, choices=["gpt", "codellama"])
 
     return parser.parse_args()
 
@@ -226,11 +201,48 @@ def main(args: argparse.Namespace) -> None:
     matplotlib.rcParams['pdf.fonttype'] = 42
     matplotlib.rcParams['ps.fonttype'] = 42
 
-    plot_by_requirements(args.results_path, args.figures_path, SortedSet({"reachability"}))
-    plot_by_requirements(args.results_path, args.figures_path, SortedSet({"reachability", "waypoint"}))
+    if args.models == "gpt":
+        model2plot = {
+            "gpt-4-1106": {
+                "label": "GPT-4-Turbo",
+                "color": "#377eb8",
+                "marker": "o"
+            },
+            "gpt-3.5-finetuned": {
+                "label": "GPT-3.5-FT",
+                "color": "#a65628",
+                "marker": "s"
+            },
+            "gpt-3.5-0613": {
+                "label": "GPT-3.5-Turbo",
+                "color": "#984ea3",
+                "marker": ">"
+            },
+        }
+    if args.models == "codellama":
+        model2plot = {
+            "codellama-13b-instruct": {
+                "label": "CL-13B-Instruct",
+                "color": "#ff7f00",
+                "marker": "<"
+            },
+            "codellama-7b-instruct-finetuned": {
+                "label": "CL-7B-Instruct-FT (QLoRA)",
+                "color": "#4daf4a",
+                "marker": ">"
+            },
+            "codellama-7b-instruct": {
+                "label": "CL-7B-Instruct",
+                "color": "#f781bf",
+                "marker": "^"
+            },
+        }
+
+    # plot_by_requirements(args.results_path, args.figures_path, SortedSet({"reachability"}), model2plot)
+    # plot_by_requirements(args.results_path, args.figures_path, SortedSet({"reachability", "waypoint"}), model2plot)
     plot_by_requirements(args.results_path, args.figures_path,
-                         SortedSet({"loadbalancing", "reachability", "waypoint"}))
+                         SortedSet({"loadbalancing", "reachability", "waypoint"}), model2plot)
 
 
 if __name__ == "__main__":
-    main(parse_args())
+    main(parse_args())
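
The module-level model2plot dictionary now gets built inside main() from the new --models switch. A minimal reproduction of that dispatch (dictionaries truncated); note that if --models is omitted, args.models is None, neither branch runs, and model2plot is unbound when it is later passed to plot_by_requirements:

    import argparse

    parser = argparse.ArgumentParser()
    parser.add_argument("--models", type=str, choices=["gpt", "codellama"])
    args = parser.parse_args(["--models", "gpt"])

    if args.models == "gpt":
        model2plot = {"gpt-4-1106": {"label": "GPT-4-Turbo"}}                    # truncated
    if args.models == "codellama":
        model2plot = {"codellama-13b-instruct": {"label": "CL-13B-Instruct"}}    # truncated

    print(model2plot)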

plots/step_1_graph_function_call_adhoc.py renamed to plot/step_1_plot_function_call_ad_hoc.py (+8, -8)

@@ -10,22 +10,22 @@
 from sortedcontainers import SortedSet
 
 model2plot = {
-    "gpt-3.5-1106-function-ad-hoc": {
+    "gpt-3.5-1106-adhoc": {
         "label": "GPT-3.5-Turbo",
         "color": "#984ea3",
         "marker": ">"
     },
-    "gpt-4-turbo-function": {
+    "gpt-4-1106-native": {
         "label": "GPT-4-Turbo (Native)",
         "color": "#e41a1c",
         "marker": "s"
     },
-    "gpt-4-turbo-ad-hoc": {
+    "gpt-4-turbo-adhoc": {
         "label": "GPT-4-Turbo (Ad-hoc)",
         "color": "#377eb8",
         "marker": "o"
     },
-    "codellama-7b-instruct-ad-hoc": {
+    "codellama-7b-instruct-adhoc": {
         "label": "CL-7B-Instruct",
         "color": "#f781bf",
         "marker": "^"
@@ -84,7 +84,7 @@ def plot_by_requirements(results_path: str, figures_path: str, requirements: Sor
 
     for model_name in model2plot.keys():
         results_files_list = glob.glob(
-            os.path.join(".", results_path, f"result-{model_name}-{requirements_str}-*.csv")
+            os.path.join("../", results_path, f"result-{model_name}-{requirements_str}-*.csv")
         )
         if results_files_list:
             results_file = results_files_list.pop()
@@ -150,10 +150,10 @@ def main(args: argparse.Namespace) -> None:
     matplotlib.rcParams['pdf.fonttype'] = 42
     matplotlib.rcParams['ps.fonttype'] = 42
 
-    plot_by_requirements(args.results_path, args.figures_path, SortedSet({"reachability"}))
-    plot_by_requirements(args.results_path, args.figures_path, SortedSet({"reachability", "waypoint"}))
+    # plot_by_requirements(args.results_path, args.figures_path, SortedSet({"reachability"}))
+    # plot_by_requirements(args.results_path, args.figures_path, SortedSet({"reachability", "waypoint"}))
     plot_by_requirements(args.results_path, args.figures_path, SortedSet({"loadbalancing", "reachability", "waypoint"}))
 
 
 if __name__ == "__main__":
-    main(parse_args())
+    main(parse_args())
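
The renamed dictionary keys have to line up with the result CSV naming scheme used by the glob above. For example, assuming the default results_path of "result" and the three-policy requirement set:

    import os

    model_name = "gpt-4-1106-native"
    requirements_str = "_".join(sorted(["loadbalancing", "reachability", "waypoint"]))
    print(os.path.join("../", "result", f"result-{model_name}-{requirements_str}-*.csv"))
    # ../result/result-gpt-4-1106-native-loadbalancing_reachability_waypoint-*.csv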
