WIP: parakeet

This commit is contained in:
root
2026-05-18 23:07:34 -03:00
parent 2e4aeb3b6f
commit db76ac34f0
10 changed files with 549 additions and 654 deletions

View File

@@ -15,17 +15,24 @@
from __future__ import annotations
import logging
from functools import partial
from pathlib import Path
from gi.repository import GLib, Gtk
from gajim.common import app
from gajim.plugins import GajimPlugin
from gajim.plugins.plugins_i18n import _
from .gtk.config_dialog import *
from .gtk.config_dialog import Configuration, STTVoiceMessagesConfigDialog
from .gtk.sttbox import STTBox
from .models.model_settings import *
from .models.model_settings import OnnxAsrSettings
log = logging.getLogger('gajim.p.stt_voice_messages')
_FOCUS_LOSS_UNLOAD_SECONDS = 30
class STTVoiceMessagesPlugin(GajimPlugin):
def init(self) -> None:
@@ -33,42 +40,64 @@ class STTVoiceMessagesPlugin(GajimPlugin):
self.config_default_values = {
'auto_transcribe': (False, ''),
'model': ('model_openaiwhisper', ''),
'model_openaiwhisper': (
OpenAIWhisperSettings(
model_size='tiny',
translate_to_english=False),
''),
'model_faster-whisper': (
FasterWhisperSettings(
model_size='tiny',
translate_to_english=False),
'')
'model_id': ('nemo-parakeet-tdt-0.6b-v3', ''),
'model_path': ('', ''),
}
self._config = Configuration(self)
self._config.check_available_moduls()
self.config_dialog = partial(STTVoiceMessagesConfigDialog, self._config)
self.gui_extension_points = {
'preview_audio': (self._on_preview_audio_created, None),
}
self._audio_file: str = ''
self._preview_audio_widget = None
self._stt_box = None
self._active_handler_id = 0
self._focus_unload_source = None
def activate(self) -> None:
if app.window is not None and self._active_handler_id == 0:
self._active_handler_id = app.window.connect(
'notify::is-active', self._on_window_active_changed)
def deactivate(self) -> None:
if self._focus_unload_source is not None:
GLib.source_remove(self._focus_unload_source)
self._focus_unload_source = None
if self._active_handler_id != 0 and app.window is not None:
app.window.disconnect(self._active_handler_id)
self._active_handler_id = 0
if self._config.is_available:
self._config.unload_model()
def _on_window_active_changed(self,
window: Gtk.Window,
_pspec: object,
) -> None:
if window.is_active():
if self._focus_unload_source is not None:
GLib.source_remove(self._focus_unload_source)
self._focus_unload_source = None
elif self._focus_unload_source is None:
self._focus_unload_source = GLib.timeout_add_seconds(
_FOCUS_LOSS_UNLOAD_SECONDS, self._on_focus_unload_fired)
def _on_focus_unload_fired(self) -> bool:
self._focus_unload_source = None
if self._config.is_available:
self._config.unload_model()
return GLib.SOURCE_REMOVE
def _on_preview_audio_created(self,
preview_audio_widget: Gtk.Box,
drawing_box: Gtk.Box,
control_box: Gtk.Box,
audio_file: Path
) -> None:
self._preview_audio_widget = preview_audio_widget
self._drawing_box = drawing_box;
self._control_box = control_box;
self._audio_file = audio_file.as_posix()
self._create_stt_box()
def _create_stt_box(self) -> None:
assert self._preview_audio_widget is not None
self._stt_box = STTBox(self._preview_audio_widget,
self.config,
self._audio_file)
self._preview_audio_widget.pack_end(self._stt_box, False, False, 0)
self._stt_box = STTBox(self._config, self._audio_file)
self._control_box.append(self._stt_box.button)
self._drawing_box.append(self._stt_box)