test added for transcribe.py

tyler232 · tyler232 · commit cafc4be0dba4 · 2024-10-09T15:43:39.000-05:00
diff --git a/PythonRpcServer/server.py b/PythonRpcServer/server.py
@@ -136,7 +136,7 @@ def TranscribeAudioRPC(self, request, context):
             logging.info(f"Starting transcription for file: {request.filePath}")
             transcription_result = LogWorker(
                 f"TranscribeAudioRPC({request.filePath})",
-                lambda: transcribe_audio(request.filePath)
+                lambda: transcribe_audio(request.filePath, request.testing)
             )
             logging.info(f"Transcription completed successfully for: {request.filePath}")
             return ct_pb2.JsonString(json=json.dumps(transcription_result))
diff --git a/PythonRpcServer/transcribe.py b/PythonRpcServer/transcribe.py
@@ -38,8 +38,18 @@ def convert_video_to_wav(input_filepath, offset=None):
         print("Exception during conversion:" + str(e))
         raise e
 
-def transcribe_audio(media_filepath):
+def transcribe_audio(media_filepath, testing=False):
+    if testing:
+        json_output_path = f"/PythonRpcServer/transcribe_hellohellohello.wav.json"
+        with open(json_output_path, 'r') as json_file:
+            transcription_result = json.load(json_file)
+        
+        # Print the transcription result (for testing purposes)
+        print("Transcription result:")
+        print(json.dumps(transcription_result, indent=4))
 
+        return transcription_result
+    
     if media_filepath == 'TEST-transcribe_example_result':
         result_json_file = 'transcribe_exampleffmp_result.json'
         with open(result_json_file, 'r') as json_file:
@@ -51,8 +61,10 @@ def transcribe_audio(media_filepath):
         raise FileNotFoundError(f"Media file not found: {media_filepath}")
 
     # convert video to wav if needed
+    wav_created = False  # Track if WAV was created
     if not media_filepath.endswith('.wav'):
         media_filepath, _ = convert_video_to_wav(media_filepath)
+        wav_created = True  # WAV file was created
 
 
     # Path to the output JSON file that Whisper will generate
@@ -87,26 +99,27 @@ def transcribe_audio(media_filepath):
         transcription_result = json.load(json_file)
     
     # Print the transcription result (testing purpose)
-    # print("Transcription result:")
-    # print(json.dumps(transcription_result, indent=4))
+    print("Transcription result:")
+    print(json.dumps(transcription_result, indent=4))
 
     # Delete the JSON file after reading it
     os.remove(json_output_path)
     print(f"Deleted the JSON file: {json_output_path}")
 
+    if wav_created:
+        try:
+            os.remove(media_filepath)
+            print(f"Deleted the WAV file: {media_filepath}")
+        except Exception as e:
+            print(f"Error deleting WAV file: {str(e)}")
+
     return transcription_result
 
 # Example usage
 if __name__ == '__main__':
     # Example media file path inside the container (the actual path will depend on where the file is located)
-    import sys
-    if len(sys.argv) > 1:
-        audio_filepath = sys.argv[1]
-    else:
-        audio_filepath = 'sharedVolume/recording0.wav'  # Update this path as needed
-    
-    try:
-        transcription_result = transcribe_audio(audio_filepath)
-        print("Transcription Result:", json.dumps(transcription_result, indent=4))
-    except Exception as e:
-        print(f"Error: {str(e)}")
+    json_output_path = f"/PythonRpcServer/transcribe_hellohellohello.wav.json"
+    with open(json_output_path, 'r') as json_file:
+        transcription_result = json.load(json_file)
+        
+    print("Transcription Result:", json.dumps(transcription_result, indent=4))
diff --git a/TaskEngine/Tasks/LocalTranscriptionTask.cs b/TaskEngine/Tasks/LocalTranscriptionTask.cs
@@ -98,7 +98,8 @@ protected async override Task OnConsume(string videoId, TaskParameters taskParam
                         LogId = videoId,
                         FilePath = video.Video1.VMPath,
                         Model = "en",
-                        Language = "en"
+                        Language = "en",
+                        Testing = true
                         // PhraseHints = phraseHints,
                         // CourseHints = "",
                         // OutputLanguages = "en"
diff --git a/TaskEngine/Tasks/QueueAwakerTask.cs b/TaskEngine/Tasks/QueueAwakerTask.cs
@@ -404,7 +404,7 @@ protected async override Task OnConsume(JObject jObject, TaskParameters taskPara
             else if (type == TaskType.TranscribeVideo.ToString())
             {
                 var id = jObject["videoOrMediaId"].ToString();
-
+                
 
                 GetLogger().LogInformation($"{type}:{id}");
                 var video = await _context.Videos.FindAsync(id);
diff --git a/ct.proto b/ct.proto
@@ -29,6 +29,7 @@ message TranscriptionRequest {
   string model = 2;      // Whisper model to use (e.g., 'base-en', 'tiny-en')
   string language = 3;  //  Language in audio.
   string logId = 4; 
+  bool testing = 5;
 }
 
 

Original file line number	Diff line number	Diff line change
`@@ -136,7 +136,7 @@ def TranscribeAudioRPC(self, request, context):`
`136`	`136`	`logging.info(f"Starting transcription for file: {request.filePath}")`
`137`	`137`	`transcription_result = LogWorker(`
`138`	`138`	`f"TranscribeAudioRPC({request.filePath})",`
`139`		`- lambda: transcribe_audio(request.filePath)`
	`139`	`+ lambda: transcribe_audio(request.filePath, request.testing)`
`140`	`140`	`)`
`141`	`141`	`logging.info(f"Transcription completed successfully for: {request.filePath}")`
`142`	`142`	`return ct_pb2.JsonString(json=json.dumps(transcription_result))`
Original file line number	Diff line number	Diff line change
`@@ -404,7 +404,7 @@ protected async override Task OnConsume(JObject jObject, TaskParameters taskPara`
`404`	`404`	`else if (type == TaskType.TranscribeVideo.ToString())`
`405`	`405`	`{`
`406`	`406`	`var id = jObject["videoOrMediaId"].ToString();`
`407`		`-`
	`407`	`+`
`408`	`408`
`409`	`409`	`GetLogger().LogInformation($"{type}:{id}");`
`410`	`410`	`var video = await _context.Videos.FindAsync(id);`
Original file line number	Diff line number	Diff line change
`@@ -29,6 +29,7 @@ message TranscriptionRequest {`
`29`	`29`	`string model = 2; // Whisper model to use (e.g., 'base-en', 'tiny-en')`
`30`	`30`	`string language = 3; // Language in audio.`
`31`	`31`	`string logId = 4;`
	`32`	`+ bool testing = 5;`
`32`	`33`	`}`
`33`	`34`
`34`	`35`