The minimum number of answers required is stored on the config, which is a global (shared) class, so it must be reset to 0 after being overridden (e.g. after `self.config.response_num_required = 4`) if the same config is used elsewhere.

BigBigboss02 · BigBigboss02 · commit fbe36e7631bc · 2025-02-12T16:47:49.000Z
result = evaluation_function(response, answer, self.config)
        self.config.response_num_required = 0
diff --git a/app/evaluation.py b/app/evaluation.py
@@ -19,7 +19,7 @@ def __init__(self, mode='gpt', llama_version='3_1_8B', temperature=0.01, max_new
         self.huggingfacehub_api_token = os.getenv("HUGGINGFACE_AUTHORIZATION")
         self.endpoint_3_1_8B = os.getenv("LLAMA3_1_8B_ENDPOINT")
 
-        self.response_num_required = 3
+        self.response_num_required = 0 #initialise it with 0
 
 def setup_llm(config):
     """Initialize the LLM model (GPT-4o or LLaMA 3) based on the given configuration."""
@@ -145,6 +145,7 @@ def evaluation_function(response, answer, config=None):
     #check if student is inputting enough answers
     if len(response) < config.response_num_required:
         is_correct = False
+    
     return {
         "is_correct": is_correct,
         "result": {
@@ -160,8 +161,8 @@ def evaluation_function(response, answer, config=None):
 if __name__ == "__main__":
     custom_config = Config()
     print(evaluation_function(
-        ["Density","Density","Density"], #response
-        ["Density","Viscosity","Length","Density","Gravity","Viscosity","Length"], #answer
+        ["speed"], #response
+        ["velocity"], #answer
         custom_config
     ))
     
diff --git a/app/evaluation_tests.py b/app/evaluation_tests.py
@@ -42,13 +42,14 @@ def test_partial_match(self):
 
         self.config.response_num_required = 4
         result = evaluation_function(response, answer, self.config)
+        self.config.response_num_required = 0
         self.assertFalse(result.get("is_correct"))
 
 
     def test_synonyms_match(self):
         """Test if abbriviations are correctly identified."""
-        response = ['speed']
-        answer = ['velocity']
+        response = ['velocity']
+        answer = ['speed']
         result = evaluation_function(response, answer, self.config)
 
         self.assertTrue(result.get("is_correct"))