Add keyphrases parameter

cc1619 · cc1619 · commit 71df3469a250 · 2023-04-24T04:58:12.000+03:00
diff --git a/app/evaluation.py b/app/evaluation.py
@@ -49,7 +49,31 @@ def evaluation_function(response, answer, params):
     #             "feedback": f"Cannot determine if the answer is correct. Please provide more details about '{keyword}"
     #         }
 
-
+    # params of the form {'keyphrases': ['phrase1', 'phrase2', ...]}
+    if params is not None and "keyphrases" in params:
+        keyphrases = params["keyphrases"]
+        for keyphrase in keyphrases:
+            response_tokens = preprocess_tokens(response)
+            keyphrase_tokens = preprocess_tokens(keyphrase)
+            window_size = len(keyphrase_tokens)
+            i = 0
+            found = False
+            while i + window_size <= len(response_tokens):
+                response_substring = " ".join(response_tokens[i:i+window_size])
+                score = sentence_similarity_mean_w2v(response_substring, keyphrase)
+                i += 1
+                if score > 0.75:
+                    found = True
+                    continue
+            if not found:
+                return {
+                    "is_correct": False,
+                    "result": {
+                        "similarity_value": w2v_similarity,
+                        "Problematic_word": keyphrase
+                    },
+                    "feedback": f"Cannot determine if the answer is correct. Could not identify '{keyphrase}"
+                }
 
     if w2v_similarity > 0.75:
         return {
@@ -151,6 +175,8 @@ def sentence_similarity_mean_w2v(response: str, answer: str):
     answer = preprocess_tokens(answer)
     response_embeddings = [w2v[word] for word in response if w2v.has_index_for(word)]
     answer_embeddings = [w2v[word] for word in answer if w2v.has_index_for(word)]
+    if len(response_embeddings) == 0 or len(answer_embeddings) == 0:
+        return 0
     response_vector = np.mean(response_embeddings, axis=0)
     answer_vector = np.mean(answer_embeddings, axis=0)
     return float(np.dot(response_vector, answer_vector) / (np.linalg.norm(response_vector) * np.linalg.norm(answer_vector)))
@@ -159,6 +185,6 @@ def sentence_similarity_mean_w2v(response: str, answer: str):
 if __name__ == "__main__":
     pass
     # print(time.process_time())
-    # print(evaluation_function("density, velocity,", "Density, Velocity, Viscosity, Length", None))
+    # print(evaluation_function("density, velocity,Visc", "Density, Velocity, Viscosity, Length", {'keyphrases': ['Density', 'Velocity', 'Viscosity', 'Length']}))
     # print(evaluation_function("test", "test", None))
     # print(time.process_time())
diff --git a/app/evaluation_tests.py b/app/evaluation_tests.py
@@ -54,13 +54,41 @@ def test_reynolds_number_is_incorrect(self):
         incorrect_responses = [
             'density,,,',
             'rho,u,mu,L',
-            #'density,velocity,visc,',
         ]
 
         for response in incorrect_responses:
             result = evaluation_function(response, answer, params)
 
             self.assertEqual(result.get("is_correct"), False, msg=f'Response: {response}')
 
+    def test_reynolds_number_is_incorrect_with_keyphrase(self):
+        answer, params = 'Density, Velocity, Viscosity, Length', {'keyphrases': ['density', 'velocity', 'viscosity', 'length']}
+        incorrect_responses = [
+            'density,velocity,visc,',
+        ]
+
+        for response in incorrect_responses:
+            result = evaluation_function(response, answer, params)
+
+            self.assertEqual(result.get("is_correct"), False, msg=f'Response: {response}')
+
+    navier_stokes_answer = "The density of the film is uniform and constant, therefore the flow is incompressible. " \
+                           "Since we have incompressible flow, uniform viscosity, Newtonian fluid, " \
+                           "the most appropriate set of equations for the solution of the problem is the " \
+                           "Navier-Stokes equations. The Navier-Stokes equations in Cartesian coordinates are used."
+    # TODO: add Navier-Stokes responses (test_navier_stokes_equation below has no active cases yet)
+
+    def test_navier_stokes_equation(self):
+        answer, params = self.navier_stokes_answer, dict()
+        correct_responses = [
+            #'Navier-stokes. Continuum, const and uniform density and viscosity so incompressible, newtonian. Fits all '
+            #'requirements for navier stokes'
+        ]
+
+        for response in correct_responses:
+            result = evaluation_function(response, answer, params)
+            print(result)
+            self.assertEqual(result.get("is_correct"), True, msg=f'Response: {response}')
+
 if __name__ == "__main__":
     unittest.main()