diff --git a/src/ragas/metrics/_answer_relevance.py b/src/ragas/metrics/_answer_relevance.py index 03b6ea4f9..15085e968 100644 --- a/src/ragas/metrics/_answer_relevance.py +++ b/src/ragas/metrics/_answer_relevance.py @@ -139,15 +139,13 @@ async def _ascore(self, row: t.Dict, callbacks: Callbacks) -> float: assert self.llm is not None, "LLM is not set" prompt_input = ResponseRelevanceInput(response=row["response"]) - tasks = [ - self.question_generation.generate( - data=prompt_input, - llm=self.llm, - callbacks=callbacks, - ) - for _ in range(self.strictness) - ] - responses = await asyncio.gather(*tasks) + + responses = await self.question_generation.generate_multiple( + data=prompt_input, + llm=self.llm, + callbacks=callbacks, + n=self.strictness + ) return self._calculate_score(responses, row)