Merge branch 'main' into guess_num

Mrinank-Bhowmick · web-flow · commit 0a2cbd7290e2 · 2023-10-01T19:01:22.000+05:30
diff --git a/README.md b/README.md
@@ -1333,6 +1333,13 @@
             <sub><b>Anju Chhetri</b></sub>
         </a>
     </td>
+    <td align="center">
+        <a href="https://github.com/ArifShariar">
+            <img src="https://avatars.githubusercontent.com/u/43639863?v=4" width="100;" alt="ArifShariar"/>
+            <br />
+            <sub><b>Arif Shariar Rahman</b></sub>
+        </a>
+    </td>
     <td align="center">
         <a href="https://github.com/AtharvaDeshmukh0909">
             <img src="https://avatars.githubusercontent.com/u/97836434?v=4" width="100;" alt="AtharvaDeshmukh0909"/>
@@ -1346,15 +1353,15 @@
             <br />
             <sub><b>Crack-er-jack</b></sub>
         </a>
-    </td>
+    </td></tr>
+<tr>
     <td align="center">
         <a href="https://github.com/David-hosting">
             <img src="https://avatars.githubusercontent.com/u/67858186?v=4" width="100;" alt="David-hosting"/>
             <br />
             <sub><b>David-hosting</b></sub>
         </a>
-    </td></tr>
-<tr>
+    </td>
     <td align="center">
         <a href="https://github.com/Dhandeep10">
             <img src="https://avatars.githubusercontent.com/u/106858770?v=4" width="100;" alt="Dhandeep10"/>
@@ -1389,15 +1396,15 @@
             <br />
             <sub><b>Gargi</b></sub>
         </a>
-    </td>
+    </td></tr>
+<tr>
     <td align="center">
         <a href="https://github.com/harshhes">
             <img src="https://avatars.githubusercontent.com/u/93470145?v=4" width="100;" alt="harshhes"/>
             <br />
             <sub><b>HarsH</b></sub>
         </a>
-    </td></tr>
-<tr>
+    </td>
     <td align="center">
         <a href="https://github.com/HimanshuSinghNegi">
             <img src="https://avatars.githubusercontent.com/u/72004239?v=4" width="100;" alt="HimanshuSinghNegi"/>
@@ -1432,15 +1439,15 @@
             <br />
             <sub><b>Krishna13515</b></sub>
         </a>
-    </td>
+    </td></tr>
+<tr>
     <td align="center">
         <a href="https://github.com/iamkunalpitale">
             <img src="https://avatars.githubusercontent.com/u/26413565?v=4" width="100;" alt="iamkunalpitale"/>
             <br />
             <sub><b>Kunal Pitale</b></sub>
         </a>
-    </td></tr>
-<tr>
+    </td>
     <td align="center">
         <a href="https://github.com/manav0702">
             <img src="https://avatars.githubusercontent.com/u/94554798?v=4" width="100;" alt="manav0702"/>
@@ -1475,15 +1482,15 @@
             <br />
             <sub><b>Nilay Banerjee </b></sub>
         </a>
-    </td>
+    </td></tr>
+<tr>
     <td align="center">
         <a href="https://github.com/KushalPareek">
             <img src="https://avatars.githubusercontent.com/u/105929422?v=4" width="100;" alt="KushalPareek"/>
             <br />
             <sub><b>Kushal Pareek</b></sub>
         </a>
-    </td></tr>
-<tr>
+    </td>
     <td align="center">
         <a href="https://github.com/Prajwol-Shrestha">
             <img src="https://avatars.githubusercontent.com/u/70046321?v=4" width="100;" alt="Prajwol-Shrestha"/>
@@ -1518,15 +1525,15 @@
             <br />
             <sub><b>Raashika0201</b></sub>
         </a>
-    </td>
+    </td></tr>
+<tr>
     <td align="center">
         <a href="https://github.com/Ramisky">
             <img src="https://avatars.githubusercontent.com/u/19819186?v=4" width="100;" alt="Ramisky"/>
             <br />
             <sub><b>Ramii Ahmed</b></sub>
         </a>
-    </td></tr>
-<tr>
+    </td>
     <td align="center">
         <a href="https://github.com/RishiPastor05">
             <img src="https://avatars.githubusercontent.com/u/87607061?v=4" width="100;" alt="RishiPastor05"/>
@@ -1561,15 +1568,15 @@
             <br />
             <sub><b>Shreejan Dolai</b></sub>
         </a>
-    </td>
+    </td></tr>
+<tr>
     <td align="center">
         <a href="https://github.com/shubham7668">
             <img src="https://avatars.githubusercontent.com/u/54644253?v=4" width="100;" alt="shubham7668"/>
             <br />
             <sub><b>Shubham Kumar</b></sub>
         </a>
-    </td></tr>
-<tr>
+    </td>
     <td align="center">
         <a href="https://github.com/SulimanSagindykov">
             <img src="https://avatars.githubusercontent.com/u/115887342?v=4" width="100;" alt="SulimanSagindykov"/>
@@ -1604,15 +1611,15 @@
             <br />
             <sub><b>Ylavish64</b></sub>
         </a>
-    </td>
+    </td></tr>
+<tr>
     <td align="center">
         <a href="https://github.com/yogesh78026">
             <img src="https://avatars.githubusercontent.com/u/77293859?v=4" width="100;" alt="yogesh78026"/>
             <br />
             <sub><b>Yogeshwar Kumar</b></sub>
         </a>
-    </td></tr>
-<tr>
+    </td>
     <td align="center">
         <a href="https://github.com/ambushneupane">
             <img src="https://avatars.githubusercontent.com/u/56769633?v=4" width="100;" alt="ambushneupane"/>
@@ -1631,7 +1638,7 @@
         <a href="https://github.com/asingh4451">
             <img src="https://avatars.githubusercontent.com/u/108614474?v=4" width="100;" alt="asingh4451"/>
             <br />
-            <sub><b>asingh4451</b></sub>
+            <sub><b>Asingh4451</b></sub>
         </a>
     </td>
     <td align="center">
@@ -1647,15 +1654,15 @@
             <br />
             <sub><b>Emmanuel  Ogu</b></sub>
         </a>
-    </td>
+    </td></tr>
+<tr>
     <td align="center">
         <a href="https://github.com/d-coder111">
             <img src="https://avatars.githubusercontent.com/u/82580017?v=4" width="100;" alt="d-coder111"/>
             <br />
             <sub><b>D-coder111</b></sub>
         </a>
-    </td></tr>
-<tr>
+    </td>
     <td align="center">
         <a href="https://github.com/dab07">
             <img src="https://avatars.githubusercontent.com/u/78215681?v=4" width="100;" alt="dab07"/>
@@ -1690,15 +1697,15 @@
             <br />
             <sub><b>Zainab Ibraheem</b></sub>
         </a>
-    </td>
+    </td></tr>
+<tr>
     <td align="center">
         <a href="https://github.com/mr-desilva">
             <img src="https://avatars.githubusercontent.com/u/47147935?v=4" width="100;" alt="mr-desilva"/>
             <br />
             <sub><b>Tharindu De Silva</b></sub>
         </a>
-    </td></tr>
-<tr>
+    </td>
     <td align="center">
         <a href="https://github.com/myudak">
             <img src="https://avatars.githubusercontent.com/u/69108782?v=4" width="100;" alt="myudak"/>
@@ -1733,15 +1740,15 @@
             <br />
             <sub><b>PRATYUSHA CHATURVEDI</b></sub>
         </a>
-    </td>
+    </td></tr>
+<tr>
     <td align="center">
         <a href="https://github.com/samualmartin">
             <img src="https://avatars.githubusercontent.com/u/38009832?v=4" width="100;" alt="samualmartin"/>
             <br />
             <sub><b>Samual Martin</b></sub>
         </a>
-    </td></tr>
-<tr>
+    </td>
     <td align="center">
         <a href="https://github.com/rathoreshreya">
             <img src="https://avatars.githubusercontent.com/u/109817678?v=4" width="100;" alt="rathoreshreya"/>
diff --git a/projects/Video-subtitle-generator/main.py b/projects/Video-subtitle-generator/main.py
@@ -3,27 +3,106 @@
 import whisper
 
 
-def transcribe_audio(path):
-    model = whisper.load_model("base")  # Change this to your desired model
-    print("Whisper model loaded.")
-    transcribe = model.transcribe(audio=path)
-    segments = transcribe["segments"]
+def transcribe_audio(path, output_filetype="srt", whisper_model="base"):
+    # extract the filename from the path without extension
+    filename = os.path.splitext(os.path.basename(path))[0]
+    output_filename = os.path.join("SrtFiles", f"{filename}.{output_filetype}")
+    # check if the output file exists, if it does, append a number to the filename
+    if os.path.exists(output_filename):
+        i = 1
+        while os.path.exists(output_filename):
+            output_filename = os.path.join("SrtFiles", f"{filename}({i}).{output_filetype}")
+            i += 1
+    if output_filetype == "srt":
+        # open the output file in write mode
+        with open(output_filename, "w", encoding="utf-8") as srtFile:
+            srtFile.write("")
+        model = whisper.load_model(whisper_model)
+        print("Whisper model loaded.")
+        transcribe = model.transcribe(audio=path)
+        segments = transcribe["segments"]
 
-    for segment in segments:
-        startTime = str(0) + str(timedelta(seconds=int(segment["start"]))) + ",000"
-        endTime = str(0) + str(timedelta(seconds=int(segment["end"]))) + ",000"
-        text = segment["text"]
-        segmentId = segment["id"] + 1
-        segment = f"{segmentId}\n{startTime} --> {endTime}\n{text[1:] if text[0] is ' ' else text}\n\n"
+        for segment in segments:
+            startTime = str(0) + str(timedelta(seconds=int(segment["start"]))) + ",000"
+            endTime = str(0) + str(timedelta(seconds=int(segment["end"]))) + ",000"
+            text = segment["text"]
+            segmentId = segment["id"] + 1
+            segment = f"{segmentId}\n{startTime} --> {endTime}\n{text[1:] if text[0] == ' ' else text}\n\n"
+            with open(output_filename, "a", encoding="utf-8") as srtFile:
+                srtFile.write(segment)
+        return srtFile
+    
+    elif output_filetype == "json":
+        with open(output_filename, "w", encoding="utf-8") as jsonFile:
+            jsonFile.write("{\n \"captions\": [\n")
+        model = whisper.load_model(whisper_model)  
+        print("Whisper model loaded.")
+        transcribe = model.transcribe(audio=path)
+        segments = transcribe["segments"]
+        for segment in segments:
+            startTime = timedelta(seconds=int(segment["start"]))
+            endTime = timedelta(seconds=int(segment["end"]))
+            duration = endTime - startTime  # Calculate the duration
+            startTime_str = str(0) + str(startTime) + ",000"
+            endTime_str = str(0) + str(endTime) + ",000"
+            duration_str = str(0) + str(duration) + ",000"
+            text = segment["text"]
+            segmentId = segment["id"] + 1
+            segment = f"{{\t\n\"id\": {segmentId},\n\"start\": \"{startTime_str}\",\n\"end\": \"{endTime_str}\",\n\"duration\": \"{duration_str}\",\n\"text\": \"{text[1:] if text[0] == ' ' else text}\"\n}},\n"           
+            with open(output_filename, "a", encoding="utf-8") as jsonFile:
+                jsonFile.write(segment)
+        # remove the last comma 
+        with open(output_filename, "rb+") as jsonFile:
+            jsonFile.seek(-2, os.SEEK_END)
+            jsonFile.truncate()
+        with open(output_filename, "a", encoding="utf-8") as jsonFile:
+            jsonFile.write("\n]\n}")
+        return jsonFile
+    
+    elif output_filetype == "txt":
+        with open(output_filename, "w", encoding="utf-8") as txtFile:
+            txtFile.write("")
+        model = whisper.load_model(whisper_model)
+        print("Whisper model loaded.")
+        transcribe = model.transcribe(audio=path)
+        segments = transcribe["segments"]
+        for segment in segments:
+            startTime = str(0) + str(timedelta(seconds=int(segment["start"]))) + ",000"
+            endTime = str(0) + str(timedelta(seconds=int(segment["end"]))) + ",000"
+            text = segment["text"]
+            segmentId = segment["id"] + 1
+            segment = f"{segmentId}\n{startTime} --> {endTime}\n{text[1:] if text[0] == ' ' else text}\n\n"
+            with open(output_filename, "a", encoding="utf-8") as txtFile:
+                txtFile.write(segment)
+        return txtFile
 
-        srtFilename = os.path.join("SrtFiles", f"VIDEO_FILENAME.srt")
-        with open(srtFilename, "a", encoding="utf-8") as srtFile:
-            srtFile.write(segment)
 
-    return srtFilename
+output_dir = "SrtFiles"
+# check if the output directory exists, if it does not, create it
+if not os.path.exists(output_dir):
+    os.mkdir("SrtFiles")
+path = input("Please enter the path of the audio file:")
+output_filetype = int(input("Please enter the output file type (SRT is selected by default):\n1.SRT\n2.JSON\n3.TXT\n"))
+if output_filetype == 1:
+    output_filetype = "srt"
+elif output_filetype == 2:
+    output_filetype = "json"
+elif output_filetype == 3:
+    output_filetype = "txt"
 
+whisper_model = int(input("Please enter the name of the whisper model you want to use (base is selected by default):\n1.Tiny\n2.Base\n3.Small\n4.Medium\n5.Large\n"))
+if whisper_model == 1:
+    whisper_model = "tiny"
+elif whisper_model == 2:
+    whisper_model = "base"
+elif whisper_model == 3:
+    whisper_model = "small"
+elif whisper_model == 4:
+    whisper_model = "medium"
+elif whisper_model == 5:
+    whisper_model = "large"
 
-os.mkdir("SrtFiles")
-path = input("Please enter the path of the audio file:")
-srtFilename = transcribe_audio(path)
+srtFilename = transcribe_audio(path, output_filetype, whisper_model)
+# extract srt file name from srtFilename
+srtFilename = os.path.basename(srtFilename.name)
 print(f"Your subtitles are ready. You can find them in {srtFilename}")