ENCOA-305

2025-01-05 14:09:49 +00:00
parent 4fc58523bc
commit b4d4afd83a
2 changed files with 73 additions and 6 deletions
--- a/ielts_be/dtos/listening.py
+++ b/ielts_be/dtos/listening.py
@@ -30,7 +30,7 @@ class ConversationPayload(BaseModel):
    name: str
    gender: str
    text: str
-    voice: str
+    voice: Optional[str] = None
 class Dialog(BaseModel):
    conversation: Optional[List[ConversationPayload]] = Field(default_factory=list)
--- a/ielts_be/services/impl/exam/listening/init.py
+++ b/ielts_be/services/impl/exam/listening/init.py
@@ -1,7 +1,7 @@
 import asyncio
 from logging import getLogger
 import random
-from typing import Dict, Any
+from typing import Dict, Any, Union
 from starlette.datastructures import UploadFile
@@ -111,6 +111,15 @@ class ListeningService(IListeningService):
        return dialog
    async def generate_mp3(self, dto: Dialog) -> bytes:
        """Turn a dialog into audio via the configured text-to-speech backend.

        If any segment of ``dto.conversation`` has no voice set, the dialog is
        first passed through ``_get_conversation_voices`` (with unique voices
        requested) so the missing voices get filled in.

        :param dto: dialog whose conversation segments are to be synthesized.
        :return: whatever ``self._tts.text_to_speech`` produces for the dialog
            (annotated as bytes).
        """
        has_unvoiced_segment = any(part.voice is None for part in dto.conversation)
        if has_unvoiced_segment:
            # Only touch the dialog when at least one speaker still lacks a voice.
            dto = self._get_conversation_voices(dto, True)

        return await self._tts.text_to_speech(dto)
    async def create_instructions(self, text: str) -> bytes:
@@ -263,7 +272,13 @@ class ListeningService(IListeningService):
        )
        return {"dialog": response["monologue"]}
-    def _get_conversation_voices(self, response: Dict, unique_voices_across_segments: bool):
+    # TODO: This was refactored from the previous ielts-be. I don't know why there is a distinction between
    #   section 1 and section 3; I think it would make sense to keep only the section 1 logic. I'm only bringing this
    #   up because there would need to be a refactor of the POST /api/listening/media endpoint, which IMO is pointless.
    # https://bitbucket.org/ecropdev/ielts-be/src/676f660f3e80220e3db0418dbeef0b1c0f257edb/helper/exercises.py?at=release%2Fmongodb-migration
    """
    def generate_listening_1_conversation(topic: str):
        ...
        chosen_voices = []
        name_to_voice = {}
        for segment in response['conversation']:
@@ -273,18 +288,70 @@ class ListeningService(IListeningService):
                    voice = name_to_voice[name]
                else:
                    voice = None
                    while voice is None:
                        if segment['gender'].lower() == 'male':
                            available_voices = MALE_NEURAL_VOICES
                        else:
                            available_voices = FEMALE_NEURAL_VOICES
                        chosen_voice = random.choice(available_voices)['Id']
                        if chosen_voice not in chosen_voices:
                            voice = chosen_voice
                            chosen_voices.append(voice)
                    name_to_voice[name] = voice
                segment['voice'] = voice
        return response
    def generate_listening_3_conversation(topic: str):
        ...
        name_to_voice = {}
        for segment in response['conversation']:
            if 'voice' not in segment:
                name = segment['name']
                if name in name_to_voice:
                    voice = name_to_voice[name]
                else:
                    if segment['gender'].lower() == 'male':
                        voice = random.choice(MALE_NEURAL_VOICES)['Id']
                    else:
                        voice = random.choice(FEMALE_NEURAL_VOICES)['Id']
                    name_to_voice[name] = voice
                segment['voice'] = voice
        return response
    """
    def _get_conversation_voices(self, response: Union[Dict, Dialog], unique_voices_across_segments: bool):
        """Assign a voice to every conversation segment that does not have one yet.

        Works on either a ``Dialog`` model (attribute access, a segment is
        unvoiced when ``segment.voice is None``) or a plain dict (key access, a
        segment is unvoiced when it has no ``'voice'`` key). Segments are
        modified in place and the same ``response`` object is returned.

        All segments sharing a speaker name receive the same voice. Voices that
        are already present on some segments are respected: they are reused for
        the same speaker's unvoiced segments and, in unique mode, are treated
        as already taken.

        :param response: the dialog (model or dict with a ``'conversation'``
            list) whose segments should receive voices.
        :param unique_voices_across_segments: when True ("section 1"
            behaviour) each new speaker gets a voice no other speaker uses, as
            far as the pool allows; when False ("section 3" behaviour) each new
            speaker simply gets a random voice for their gender.
        :return: ``response``, with voices filled in.
        """
        # Cap on random draws per speaker in unique mode. Without a cap the
        # search never terminates once every voice for a gender is taken.
        max_attempts = 100

        is_model = isinstance(response, Dialog)
        conversation = response.conversation if is_model else response['conversation']

        def needs_voice(segment):
            return (segment.voice is None) if is_model else ('voice' not in segment)

        chosen_voices = []
        name_to_voice = {}

        # First pass: remember voices that were supplied up front, so a speaker
        # keeps the same voice throughout and new speakers avoid those voices.
        for segment in conversation:
            if needs_voice(segment):
                continue
            preset_voice = segment.voice if is_model else segment['voice']
            if preset_voice is None:
                continue
            preset_name = segment.name if is_model else segment.get('name')
            if preset_name is not None:
                name_to_voice.setdefault(preset_name, preset_voice)
            if preset_voice not in chosen_voices:
                chosen_voices.append(preset_voice)

        # Second pass: fill in the missing voices.
        for segment in conversation:
            if not needs_voice(segment):
                continue

            name = segment.name if is_model else segment['name']
            if name in name_to_voice:
                voice = name_to_voice[name]
            else:
                gender = segment.gender if is_model else segment['gender']
                voice = self._get_random_voice(gender)
                # section 1
                if unique_voices_across_segments:
                    attempts = 1
                    while voice in chosen_voices and attempts < max_attempts:
                        voice = self._get_random_voice(gender)
                        attempts += 1
                    # If the cap was hit the last draw is kept, i.e. a voice is
                    # reused rather than looping forever.
                    chosen_voices.append(voice)
                # section 3: the first random draw is used as-is.
                name_to_voice[name] = voice

            if is_model:
                segment.voice = voice
            else:
                segment['voice'] = voice
        return response
    @staticmethod