Add minimum values for --summin, --summax and --segmax

2024-08-13 21:20:28 +02:00 · 2024-08-13 21:20:28 +02:00 · 27ee9a7d8b
commit 27ee9a7d8b
parent a480fdcd34
2 changed files with 9 additions and 7 deletions
--- a/README.md
+++ b/README.md
@@ -38,9 +38,9 @@ audio-summarize.py -m filepath -i filepath -o filepath
 options:
  -h, --help   show this help message and exit
-  --summin n   The minimum lenght of a segment summary [10]
+  --summin n   The minimum lenght of a segment summary [10, min: 5]
-  --summax n   The maximum lenght of a segment summary [90]
+  --summax n   The maximum lenght of a segment summary [90, min: 5]
-  --segmax n   The maximum number of tokens per segment [375, max: 500]
+  --segmax n   The maximum number of tokens per segment [375, 5 - 500]
  -m filepath  The path to a whisper.cpp-compatible model file
  -i filepath  The path to the media file
  -o filepath  Where to save the output text to
--- a/audio-summarize.py
+++ b/audio-summarize.py
@@ -69,14 +69,16 @@ def summarize(chunks: List[str], summary_min: int, summary_max: int) -> str:
 if __name__ == "__main__":
    argp = ArgumentParser()
-    argp.add_argument("--summin", metavar="n", type=int, default=10, help="The minimum lenght of a segment summary [10]")
+    argp.add_argument("--summin", metavar="n", type=int, default=10, help="The minimum lenght of a segment summary [10, min: 5]")
-    argp.add_argument("--summax", metavar="n", type=int, default=90, help="The maximum lenght of a segment summary [90]")
+    argp.add_argument("--summax", metavar="n", type=int, default=90, help="The maximum lenght of a segment summary [90, min: 5]")
-    argp.add_argument("--segmax", metavar="n", type=int, default=375, help="The maximum number of tokens per segment [375, max: 500]")
+    argp.add_argument("--segmax", metavar="n", type=int, default=375, help="The maximum number of tokens per segment [375, 5 - 500]")
    argp.add_argument("-m", required=True, metavar="filepath", type=Path, help="The path to a whisper.cpp-compatible model file")
    argp.add_argument("-i", required=True, metavar="filepath", type=Path, help="The path to the media file")
    argp.add_argument("-o", required=True, metavar="filepath", type=Path, help="Where to save the output text to")
    args = argp.parse_args()
-    args.segmax = min(args.segmax, 500)
+    args.summin = max(5, args.summin)
+    args.summax = max(5, args.summax)
+    args.segmax = max(5, min(args.segmax, 500))
    # create tmpdir
    with TemporaryDirectory(suffix="as") as d:
        converted_audio_path = (Path(d) / "audio.wav").__str__()