Update README.md

hate-alert · Jun 17, 2024 · 3dc3482 · 3dc3482
1 parent 13ece34
commit 3dc3482
Showing 1 changed file with 13 additions and 1 deletion.
diff --git a/Codes/README.md b/Codes/README.md
@@ -22,11 +22,23 @@
 # To Run the unimodal Vision Based models
 
 6.Vision+lstm_foldWise.py   
-7. 3DCNN_withFolds.py
+7.3DCNN_withFolds.py
 
 # To Run the Multimodal Model
        
 9. MultiModalFusionModelfoldWise.py
 
 # To extract all the video frames.
 frameExtract.py
+
+# Extraction of transcript
+
+The 'all__video_vosk_audioMap.p' file has to be generated using the Vosk speech recognition toolkit (https://alphacephei.com/vosk/). The file is in JSON format, as shown below:
+
+{
+  "video_name1": "transcript1",
+  "video_name2": "transcript2",
+  ...
+  "video_nameN": "transcriptN"
+}
+