Upgrade default Whisper model: small/medium → large-v3 for much better Slovenian/Slavic transcription accuracy
This commit is contained in:
parent
4bc5ac6756
commit
69fb2f5ce8
@ -240,7 +240,7 @@ def process_job(job_id):
|
|||||||
# lang: če None ali 'auto', pusti analyze.py auto-detect
|
# lang: če None ali 'auto', pusti analyze.py auto-detect
|
||||||
if job.get("lang") and job["lang"] not in ("auto", ""):
|
if job.get("lang") and job["lang"] not in ("auto", ""):
|
||||||
cmd += ["--lang", job["lang"]]
|
cmd += ["--lang", job["lang"]]
|
||||||
cmd += ["--model", job.get("whisper_model", "small")]
|
cmd += ["--model", job.get("whisper_model", "large-v3")]
|
||||||
|
|
||||||
proc = subprocess.run(cmd, capture_output=True, text=True)
|
proc = subprocess.run(cmd, capture_output=True, text=True)
|
||||||
srt_from_claude = None # Pot do SRT iz Claude-popravljenega transcript-a
|
srt_from_claude = None # Pot do SRT iz Claude-popravljenega transcript-a
|
||||||
@ -334,7 +334,7 @@ def process_job(job_id):
|
|||||||
cmd += ["--lang", chosen_lang]
|
cmd += ["--lang", chosen_lang]
|
||||||
if job.get("no_subs"):
|
if job.get("no_subs"):
|
||||||
cmd += ["--no-subs"]
|
cmd += ["--no-subs"]
|
||||||
cmd += ["--model", job.get("whisper_model", "small")]
|
cmd += ["--model", job.get("whisper_model", "large-v3")]
|
||||||
|
|
||||||
# DEBUG: zapiši natanko kakšen ukaz se izvede
|
# DEBUG: zapiši natanko kakšen ukaz se izvede
|
||||||
update_job(job_id, debug_clip_cmd=" ".join(cmd))
|
update_job(job_id, debug_clip_cmd=" ".join(cmd))
|
||||||
@ -391,7 +391,7 @@ class YouTubeJobIn(BaseModel):
|
|||||||
duration: Optional[float] = 30
|
duration: Optional[float] = 30
|
||||||
no_subs: bool = False
|
no_subs: bool = False
|
||||||
subtitle_style: str = "reels"
|
subtitle_style: str = "reels"
|
||||||
whisper_model: str = "small"
|
whisper_model: str = "large-v3"
|
||||||
quality: str = "medium"
|
quality: str = "medium"
|
||||||
|
|
||||||
|
|
||||||
@ -407,7 +407,7 @@ class StartJobIn(BaseModel):
|
|||||||
min_duration: Optional[float] = 20
|
min_duration: Optional[float] = 20
|
||||||
no_subs: bool = False
|
no_subs: bool = False
|
||||||
subtitle_style: str = "reels"
|
subtitle_style: str = "reels"
|
||||||
whisper_model: str = "small"
|
whisper_model: str = "large-v3"
|
||||||
quality: str = "medium"
|
quality: str = "medium"
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
@ -592,7 +592,7 @@ def main():
|
|||||||
ap = argparse.ArgumentParser()
|
ap = argparse.ArgumentParser()
|
||||||
ap.add_argument("video", help="Vhod video file")
|
ap.add_argument("video", help="Vhod video file")
|
||||||
ap.add_argument("--lang", default=None, help="ISO 639-1 ali 'auto' (default: auto)")
|
ap.add_argument("--lang", default=None, help="ISO 639-1 ali 'auto' (default: auto)")
|
||||||
ap.add_argument("--model", default="small", help="Whisper model")
|
ap.add_argument("--model", default="large-v3", help="Whisper model")
|
||||||
ap.add_argument("--target-duration", type=float, default=30.0)
|
ap.add_argument("--target-duration", type=float, default=30.0)
|
||||||
ap.add_argument("--max-duration", type=float, default=45.0)
|
ap.add_argument("--max-duration", type=float, default=45.0)
|
||||||
ap.add_argument("--min-duration", type=float, default=20.0)
|
ap.add_argument("--min-duration", type=float, default=20.0)
|
||||||
|
|||||||
@ -112,7 +112,7 @@ def main():
|
|||||||
help="Več klipov: '0:30-1:00,2:15-2:45'")
|
help="Več klipov: '0:30-1:00,2:15-2:45'")
|
||||||
ap.add_argument("--mode", default="track", choices=["track", "center", "blur"])
|
ap.add_argument("--mode", default="track", choices=["track", "center", "blur"])
|
||||||
ap.add_argument("--lang", default=None, help="sl, de, en, ... (privzeto auto)")
|
ap.add_argument("--lang", default=None, help="sl, de, en, ... (privzeto auto)")
|
||||||
ap.add_argument("--model", default="small",
|
ap.add_argument("--model", default="large-v3",
|
||||||
choices=["tiny", "base", "small", "medium", "large-v3"])
|
choices=["tiny", "base", "small", "medium", "large-v3"])
|
||||||
ap.add_argument("--style", default="reels", choices=["reels", "yellow", "minimal"])
|
ap.add_argument("--style", default="reels", choices=["reels", "yellow", "minimal"])
|
||||||
ap.add_argument("--no-subs", action="store_true")
|
ap.add_argument("--no-subs", action="store_true")
|
||||||
|
|||||||
@ -279,7 +279,7 @@ def main():
|
|||||||
ap.add_argument("input")
|
ap.add_argument("input")
|
||||||
ap.add_argument("output")
|
ap.add_argument("output")
|
||||||
ap.add_argument("--lang", default=None, help="Jezik (sl, de, en, ...) ali auto")
|
ap.add_argument("--lang", default=None, help="Jezik (sl, de, en, ...) ali auto")
|
||||||
ap.add_argument("--model", default="small", choices=["tiny", "base", "small", "medium", "large-v3"])
|
ap.add_argument("--model", default="large-v3", choices=["tiny", "base", "small", "medium", "large-v3"])
|
||||||
ap.add_argument("--style", default="reels", choices=list(SUBTITLE_STYLES.keys()))
|
ap.add_argument("--style", default="reels", choices=list(SUBTITLE_STYLES.keys()))
|
||||||
ap.add_argument("--keep-srt", action="store_true", help="Ohrani .srt poleg output")
|
ap.add_argument("--keep-srt", action="store_true", help="Ohrani .srt poleg output")
|
||||||
ap.add_argument("--srt", default=None, help="Že-pripravljen SRT (preskoči Whisper transkripcijo)")
|
ap.add_argument("--srt", default=None, help="Že-pripravljen SRT (preskoči Whisper transkripcijo)")
|
||||||
|
|||||||
@ -214,7 +214,7 @@
|
|||||||
|
|
||||||
<!-- Skrita polja: jezik in model sta avto. Vrednosti uporabljene v JS submit. -->
|
<!-- Skrita polja: jezik in model sta avto. Vrednosti uporabljene v JS submit. -->
|
||||||
<input type="hidden" id="lang" value="">
|
<input type="hidden" id="lang" value="">
|
||||||
<input type="hidden" id="model" value="medium">
|
<input type="hidden" id="model" value="large-v3">
|
||||||
|
|
||||||
<div style="font-size: 12px; color: var(--text-dim); margin-top: 8px;">
|
<div style="font-size: 12px; color: var(--text-dim); margin-top: 8px;">
|
||||||
🤖 Jezik: avtomatsko zaznan (Whisper, 3-sample voting) · Model: medium · LLM analiza: Claude
|
🤖 Jezik: avtomatsko zaznan (Whisper, 3-sample voting) · Model: medium · LLM analiza: Claude
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user