Skip to content

Commit 3805cac

Browse files
authored
fix: fix TransliterationPlugin for changing English to Hindi date-time mappings for Deepgram ASR (#218)
* fix: fix TransliterationPlugin for changing English to Hindi date-time mappings for Deepgram ASR
* update: bind spaCy to a version for stability
1 parent 32aeba5 commit 3805cac

File tree

4 files changed

+612
-577
lines changed

4 files changed

+612
-577
lines changed

dialogy/plugins/text/transliteration_plugin/__init__.py

+14-18
Original file line numberDiff line numberDiff line change
@@ -117,37 +117,33 @@ def map_to_hindi(self, transcript: str) -> str:
117117
]
118118
return ' '.join(translated_words)
119119

120-
def modify_utterances(self, utterances: List[List[Dict[str, str]]]) -> List[List[Dict[str, str]]]:
120+
def modify_transcripts(self, transcripts: List[str]) -> List[str]:
121121
"""
122-
Modifies utterances by transliterating date/time words.
122+
Modifies transcripts by transliterating date/time words.
123123
124124
Args:
125-
utterances: List of ASR transcripts with confidence scores
125+
transcripts: List of transcripts to process
126126
127127
Returns:
128-
Modified utterances with transliterated text
128+
Modified transcripts with transliterated text
129129
"""
130-
if not utterances or not utterances[0]:
131-
return utterances
130+
if not transcripts:
131+
return transcripts
132132

133-
for transcript in utterances[0]:
134-
if 'transcript' in transcript:
135-
transcript['transcript'] = self.map_to_hindi(transcript['transcript'])
136-
137-
return utterances
133+
return [self.map_to_hindi(transcript) for transcript in transcripts]
138134

139135
async def utility(self, input_: Input, output: Output) -> Any:
140136
"""
141-
Plugin utility method that processes the input utterances.
137+
Plugin utility method that processes the input transcripts.
142138
143139
Args:
144-
input_: Input object containing utterances
140+
input_: Input object containing transcripts
145141
output: Output object for results
146142
147143
Returns:
148-
Modified utterances with transliterated text
144+
Modified transcripts with transliterated text
149145
"""
150-
logger.debug(f"Input utterances for transliteration:\n{input_.utterances}")
151-
modified_utterances = self.modify_utterances(input_.utterances)
152-
logger.debug(f"Transliterated utterances:\n{modified_utterances}")
153-
return modified_utterances
146+
logger.debug(f"Input transcripts for transliteration:\n{input_.transcripts}")
147+
modified_transcripts = self.modify_transcripts(input_.transcripts)
148+
logger.debug(f"Transliterated transcripts:\n{modified_transcripts}")
149+
return modified_transcripts

0 commit comments

Comments
 (0)