server : backport .srt output format (#1565)

author Oleg Sidorov <redacted>

Tue, 28 Nov 2023 13:42:58 +0000 (14:42 +0100)

committer GitHub <redacted>

Tue, 28 Nov 2023 13:42:58 +0000 (15:42 +0200)
author Oleg Sidorov <redacted>
Tue, 28 Nov 2023 13:42:58 +0000 (14:42 +0100)
committer GitHub <redacted>
Tue, 28 Nov 2023 13:42:58 +0000 (15:42 +0200)
diff --git a/examples/server/server.cpp b/examples/server/server.cpp

index e9d3f88b24692451f71e1c4b7b24fcdb2b6dbed0..2d15d4cc8af6d8adc17ad82d76184f70c9a0452f 100644 (file)
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -11,6 +11,7 @@
  #include <thread>
  #include <vector>
  #include <cstring>
+#include <sstream>
  
  #if defined(_MSC_VER)
  #pragma warning(disable: 4244 4267) // possible loss of data
@@ -657,6 +658,27 @@ int main(int argc, char ** argv) {
              std::string results = output_str(ctx, params, pcmf32s);
              res.set_content(results.c_str(), "text/html");
          }
+        else if (params.response_format == srt_format)
+        {
+            std::stringstream ss;
+            const int n_segments = whisper_full_n_segments(ctx);
+            for (int i = 0; i < n_segments; ++i) {
+                const char * text = whisper_full_get_segment_text(ctx, i);
+                const int64_t t0 = whisper_full_get_segment_t0(ctx, i);
+                const int64_t t1 = whisper_full_get_segment_t1(ctx, i);
+                std::string speaker = "";
+
+                if (params.diarize && pcmf32s.size() == 2)
+                {
+                    speaker = estimate_diarization_speaker(pcmf32s, t0, t1);
+                }
+
+                ss << i + 1 + params.offset_n << "\n";
+                ss << to_timestamp(t0, true) << " --> " << to_timestamp(t1, true) << "\n";
+                ss << speaker << text << "\n\n";
+            }
+            res.set_content(ss.str(), "application/x-subrip");
+        }
          // TODO add more output formats
          else
          {
author	Oleg Sidorov <redacted>
	Tue, 28 Nov 2023 13:42:58 +0000 (14:42 +0100)
committer	GitHub <redacted>
	Tue, 28 Nov 2023 13:42:58 +0000 (15:42 +0200)