Commit
·
b9adb22
1
Parent(s):
b7ab8d4
New [DEV] version
Browse files- .gitignore +3 -0
- .streamlit/config.toml +4 -1
- CONTRIBUTING.md +1 -1
- LICENSE +201 -0
- README.md +12 -39
- Home.py → app.py +42 -66
- clips.csv +3 -0
- example-reddit-post.txt +0 -2
- example-video.json +0 -1
- example.env +0 -7
- main.py +16 -24
- packages.txt +1 -0
- pages/Reddit.py +0 -119
- pages/__init__.py +0 -0
- reddit-post.txt +0 -0
- reddit2json.py +0 -133
- requirements.txt +1 -1
- src/subtitle_creator.py +10 -1
- src/video_creator.py +61 -39
- src/video_downloader.py +3 -8
- src/video_prepare.py +28 -8
- utils.py +10 -26
- video.json +0 -19
.gitignore
CHANGED
@@ -162,6 +162,9 @@ cython_debug/
|
|
162 |
# media folder
|
163 |
media/*
|
164 |
|
|
|
|
|
|
|
165 |
# output folder
|
166 |
output/*
|
167 |
|
|
|
162 |
# media folder
|
163 |
media/*
|
164 |
|
165 |
+
# background folder
|
166 |
+
background/*
|
167 |
+
|
168 |
# output folder
|
169 |
output/*
|
170 |
|
.streamlit/config.toml
CHANGED
@@ -3,4 +3,7 @@ primaryColor="#BD93F9"
|
|
3 |
backgroundColor="#282A36"
|
4 |
secondaryBackgroundColor="#44475A"
|
5 |
textColor="#F8F8F2"
|
6 |
-
font="sans serif"
|
|
|
|
|
|
|
|
3 |
backgroundColor="#282A36"
|
4 |
secondaryBackgroundColor="#44475A"
|
5 |
textColor="#F8F8F2"
|
6 |
+
font="sans serif"
|
7 |
+
|
8 |
+
[client]
|
9 |
+
showSidebarNavigation = false
|
CONTRIBUTING.md
CHANGED
@@ -37,4 +37,4 @@ Our project has a code of conduct to ensure that all contributors feel welcome a
|
|
37 |
|
38 |
## Conclusion
|
39 |
|
40 |
-
We appreciate your interest in contributing to our project and look forward to your contributions. If you have any questions or need any help, please don't hesitate to reach out to us through the issue tracker or by email.
|
|
|
37 |
|
38 |
## Conclusion
|
39 |
|
40 |
+
We appreciate your interest in contributing to our project and look forward to your contributions. If you have any questions or need any help, please don't hesitate to reach out to us through the issue tracker or by email.
|
LICENSE
ADDED
@@ -0,0 +1,201 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Apache License
|
2 |
+
Version 2.0, January 2004
|
3 |
+
http://www.apache.org/licenses/
|
4 |
+
|
5 |
+
TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
|
6 |
+
|
7 |
+
1. Definitions.
|
8 |
+
|
9 |
+
"License" shall mean the terms and conditions for use, reproduction,
|
10 |
+
and distribution as defined by Sections 1 through 9 of this document.
|
11 |
+
|
12 |
+
"Licensor" shall mean the copyright owner or entity authorized by
|
13 |
+
the copyright owner that is granting the License.
|
14 |
+
|
15 |
+
"Legal Entity" shall mean the union of the acting entity and all
|
16 |
+
other entities that control, are controlled by, or are under common
|
17 |
+
control with that entity. For the purposes of this definition,
|
18 |
+
"control" means (i) the power, direct or indirect, to cause the
|
19 |
+
direction or management of such entity, whether by contract or
|
20 |
+
otherwise, or (ii) ownership of fifty percent (50%) or more of the
|
21 |
+
outstanding shares, or (iii) beneficial ownership of such entity.
|
22 |
+
|
23 |
+
"You" (or "Your") shall mean an individual or Legal Entity
|
24 |
+
exercising permissions granted by this License.
|
25 |
+
|
26 |
+
"Source" form shall mean the preferred form for making modifications,
|
27 |
+
including but not limited to software source code, documentation
|
28 |
+
source, and configuration files.
|
29 |
+
|
30 |
+
"Object" form shall mean any form resulting from mechanical
|
31 |
+
transformation or translation of a Source form, including but
|
32 |
+
not limited to compiled object code, generated documentation,
|
33 |
+
and conversions to other media types.
|
34 |
+
|
35 |
+
"Work" shall mean the work of authorship, whether in Source or
|
36 |
+
Object form, made available under the License, as indicated by a
|
37 |
+
copyright notice that is included in or attached to the work
|
38 |
+
(an example is provided in the Appendix below).
|
39 |
+
|
40 |
+
"Derivative Works" shall mean any work, whether in Source or Object
|
41 |
+
form, that is based on (or derived from) the Work and for which the
|
42 |
+
editorial revisions, annotations, elaborations, or other modifications
|
43 |
+
represent, as a whole, an original work of authorship. For the purposes
|
44 |
+
of this License, Derivative Works shall not include works that remain
|
45 |
+
separable from, or merely link (or bind by name) to the interfaces of,
|
46 |
+
the Work and Derivative Works thereof.
|
47 |
+
|
48 |
+
"Contribution" shall mean any work of authorship, including
|
49 |
+
the original version of the Work and any modifications or additions
|
50 |
+
to that Work or Derivative Works thereof, that is intentionally
|
51 |
+
submitted to Licensor for inclusion in the Work by the copyright owner
|
52 |
+
or by an individual or Legal Entity authorized to submit on behalf of
|
53 |
+
the copyright owner. For the purposes of this definition, "submitted"
|
54 |
+
means any form of electronic, verbal, or written communication sent
|
55 |
+
to the Licensor or its representatives, including but not limited to
|
56 |
+
communication on electronic mailing lists, source code control systems,
|
57 |
+
and issue tracking systems that are managed by, or on behalf of, the
|
58 |
+
Licensor for the purpose of discussing and improving the Work, but
|
59 |
+
excluding communication that is conspicuously marked or otherwise
|
60 |
+
designated in writing by the copyright owner as "Not a Contribution."
|
61 |
+
|
62 |
+
"Contributor" shall mean Licensor and any individual or Legal Entity
|
63 |
+
on behalf of whom a Contribution has been received by Licensor and
|
64 |
+
subsequently incorporated within the Work.
|
65 |
+
|
66 |
+
2. Grant of Copyright License. Subject to the terms and conditions of
|
67 |
+
this License, each Contributor hereby grants to You a perpetual,
|
68 |
+
worldwide, non-exclusive, no-charge, royalty-free, irrevocable
|
69 |
+
copyright license to reproduce, prepare Derivative Works of,
|
70 |
+
publicly display, publicly perform, sublicense, and distribute the
|
71 |
+
Work and such Derivative Works in Source or Object form.
|
72 |
+
|
73 |
+
3. Grant of Patent License. Subject to the terms and conditions of
|
74 |
+
this License, each Contributor hereby grants to You a perpetual,
|
75 |
+
worldwide, non-exclusive, no-charge, royalty-free, irrevocable
|
76 |
+
(except as stated in this section) patent license to make, have made,
|
77 |
+
use, offer to sell, sell, import, and otherwise transfer the Work,
|
78 |
+
where such license applies only to those patent claims licensable
|
79 |
+
by such Contributor that are necessarily infringed by their
|
80 |
+
Contribution(s) alone or by combination of their Contribution(s)
|
81 |
+
with the Work to which such Contribution(s) was submitted. If You
|
82 |
+
institute patent litigation against any entity (including a
|
83 |
+
cross-claim or counterclaim in a lawsuit) alleging that the Work
|
84 |
+
or a Contribution incorporated within the Work constitutes direct
|
85 |
+
or contributory patent infringement, then any patent licenses
|
86 |
+
granted to You under this License for that Work shall terminate
|
87 |
+
as of the date such litigation is filed.
|
88 |
+
|
89 |
+
4. Redistribution. You may reproduce and distribute copies of the
|
90 |
+
Work or Derivative Works thereof in any medium, with or without
|
91 |
+
modifications, and in Source or Object form, provided that You
|
92 |
+
meet the following conditions:
|
93 |
+
|
94 |
+
(a) You must give any other recipients of the Work or
|
95 |
+
Derivative Works a copy of this License; and
|
96 |
+
|
97 |
+
(b) You must cause any modified files to carry prominent notices
|
98 |
+
stating that You changed the files; and
|
99 |
+
|
100 |
+
(c) You must retain, in the Source form of any Derivative Works
|
101 |
+
that You distribute, all copyright, patent, trademark, and
|
102 |
+
attribution notices from the Source form of the Work,
|
103 |
+
excluding those notices that do not pertain to any part of
|
104 |
+
the Derivative Works; and
|
105 |
+
|
106 |
+
(d) If the Work includes a "NOTICE" text file as part of its
|
107 |
+
distribution, then any Derivative Works that You distribute must
|
108 |
+
include a readable copy of the attribution notices contained
|
109 |
+
within such NOTICE file, excluding those notices that do not
|
110 |
+
pertain to any part of the Derivative Works, in at least one
|
111 |
+
of the following places: within a NOTICE text file distributed
|
112 |
+
as part of the Derivative Works; within the Source form or
|
113 |
+
documentation, if provided along with the Derivative Works; or,
|
114 |
+
within a display generated by the Derivative Works, if and
|
115 |
+
wherever such third-party notices normally appear. The contents
|
116 |
+
of the NOTICE file are for informational purposes only and
|
117 |
+
do not modify the License. You may add Your own attribution
|
118 |
+
notices within Derivative Works that You distribute, alongside
|
119 |
+
or as an addendum to the NOTICE text from the Work, provided
|
120 |
+
that such additional attribution notices cannot be construed
|
121 |
+
as modifying the License.
|
122 |
+
|
123 |
+
You may add Your own copyright statement to Your modifications and
|
124 |
+
may provide additional or different license terms and conditions
|
125 |
+
for use, reproduction, or distribution of Your modifications, or
|
126 |
+
for any such Derivative Works as a whole, provided Your use,
|
127 |
+
reproduction, and distribution of the Work otherwise complies with
|
128 |
+
the conditions stated in this License.
|
129 |
+
|
130 |
+
5. Submission of Contributions. Unless You explicitly state otherwise,
|
131 |
+
any Contribution intentionally submitted for inclusion in the Work
|
132 |
+
by You to the Licensor shall be under the terms and conditions of
|
133 |
+
this License, without any additional terms or conditions.
|
134 |
+
Notwithstanding the above, nothing herein shall supersede or modify
|
135 |
+
the terms of any separate license agreement you may have executed
|
136 |
+
with Licensor regarding such Contributions.
|
137 |
+
|
138 |
+
6. Trademarks. This License does not grant permission to use the trade
|
139 |
+
names, trademarks, service marks, or product names of the Licensor,
|
140 |
+
except as required for reasonable and customary use in describing the
|
141 |
+
origin of the Work and reproducing the content of the NOTICE file.
|
142 |
+
|
143 |
+
7. Disclaimer of Warranty. Unless required by applicable law or
|
144 |
+
agreed to in writing, Licensor provides the Work (and each
|
145 |
+
Contributor provides its Contributions) on an "AS IS" BASIS,
|
146 |
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
|
147 |
+
implied, including, without limitation, any warranties or conditions
|
148 |
+
of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
|
149 |
+
PARTICULAR PURPOSE. You are solely responsible for determining the
|
150 |
+
appropriateness of using or redistributing the Work and assume any
|
151 |
+
risks associated with Your exercise of permissions under this License.
|
152 |
+
|
153 |
+
8. Limitation of Liability. In no event and under no legal theory,
|
154 |
+
whether in tort (including negligence), contract, or otherwise,
|
155 |
+
unless required by applicable law (such as deliberate and grossly
|
156 |
+
negligent acts) or agreed to in writing, shall any Contributor be
|
157 |
+
liable to You for damages, including any direct, indirect, special,
|
158 |
+
incidental, or consequential damages of any character arising as a
|
159 |
+
result of this License or out of the use or inability to use the
|
160 |
+
Work (including but not limited to damages for loss of goodwill,
|
161 |
+
work stoppage, computer failure or malfunction, or any and all
|
162 |
+
other commercial damages or losses), even if such Contributor
|
163 |
+
has been advised of the possibility of such damages.
|
164 |
+
|
165 |
+
9. Accepting Warranty or Additional Liability. While redistributing
|
166 |
+
the Work or Derivative Works thereof, You may choose to offer,
|
167 |
+
and charge a fee for, acceptance of support, warranty, indemnity,
|
168 |
+
or other liability obligations and/or rights consistent with this
|
169 |
+
License. However, in accepting such obligations, You may act only
|
170 |
+
on Your own behalf and on Your sole responsibility, not on behalf
|
171 |
+
of any other Contributor, and only if You agree to indemnify,
|
172 |
+
defend, and hold each Contributor harmless for any liability
|
173 |
+
incurred by, or claims asserted against, such Contributor by reason
|
174 |
+
of your accepting any such warranty or additional liability.
|
175 |
+
|
176 |
+
END OF TERMS AND CONDITIONS
|
177 |
+
|
178 |
+
APPENDIX: How to apply the Apache License to your work.
|
179 |
+
|
180 |
+
To apply the Apache License to your work, attach the following
|
181 |
+
boilerplate notice, with the fields enclosed by brackets "[]"
|
182 |
+
replaced with your own identifying information. (Don't include
|
183 |
+
the brackets!) The text should be enclosed in the appropriate
|
184 |
+
comment syntax for the file format. We also recommend that a
|
185 |
+
file or class name and description of purpose be included on the
|
186 |
+
same "printed page" as the copyright notice for easier
|
187 |
+
identification within third-party archives.
|
188 |
+
|
189 |
+
Copyright [2023] [Matteo Fasulo]
|
190 |
+
|
191 |
+
Licensed under the Apache License, Version 2.0 (the "License");
|
192 |
+
you may not use this file except in compliance with the License.
|
193 |
+
You may obtain a copy of the License at
|
194 |
+
|
195 |
+
http://www.apache.org/licenses/LICENSE-2.0
|
196 |
+
|
197 |
+
Unless required by applicable law or agreed to in writing, software
|
198 |
+
distributed under the License is distributed on an "AS IS" BASIS,
|
199 |
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
200 |
+
See the License for the specific language governing permissions and
|
201 |
+
limitations under the License.
|
README.md
CHANGED
@@ -1,15 +1,3 @@
|
|
1 |
-
---
|
2 |
-
title: Whisper TikTok Demo
|
3 |
-
emoji: 📚
|
4 |
-
colorFrom: yellow
|
5 |
-
colorTo: purple
|
6 |
-
sdk: streamlit
|
7 |
-
sdk_version: 1.36.0
|
8 |
-
app_file: Home.py
|
9 |
-
pinned: false
|
10 |
-
license: apache-2.0
|
11 |
-
---
|
12 |
-
|
13 |
# Introducing Whisper-TikTok 🤖🎥
|
14 |
|
15 |
## Star History
|
@@ -48,17 +36,13 @@ Discover Whisper-TikTok, an innovative AI-powered tool that leverages the prowes
|
|
48 |
|
49 |
## How it Works
|
50 |
|
51 |
-
Employing Whisper-TikTok is a breeze: simply modify the [
|
52 |
|
53 |
- `series`: The name of the series.
|
54 |
- `part`: The part number of the video.
|
55 |
- `text`: The text to be spoken in the video.
|
56 |
-
- `outro`: The outro text to be spoken in the video.
|
57 |
- `tags`: The tags to be used for the video.
|
58 |
-
|
59 |
-
Summarizing the program's functionality:
|
60 |
-
|
61 |
-
> Furnished with a structured JSON dataset containing details such as the **series name**, **video part number**, **video text** and **outro text**, the program orchestrates the synthesis of a video incorporating the provided text and outro. Subsequently, the generated video is stored within the designated `output` folder.
|
62 |
|
63 |
<details>
|
64 |
<summary>Details</summary>
|
@@ -80,8 +64,8 @@ The program conducts the **sequence of actions** outlined below:
|
|
80 |
|
81 |
## Web App (Online)
|
82 |
|
83 |
-
There is a Web App hosted thanks to Streamlit which is public available, just click on the link that will take you directly to the Web App.
|
84 |
-
> https://
|
85 |
|
86 |
## Local Installation
|
87 |
|
@@ -127,14 +111,14 @@ choco install ffmpeg
|
|
127 |
scoop install ffmpeg
|
128 |
```
|
129 |
|
130 |
-
>Please note that for optimal performance, it's advisable to have a GPU when using the OpenAI Whisper model for
|
131 |
|
132 |
## Web-UI (Local)
|
133 |
|
134 |
To run the Web-UI locally, execute the following command within your terminal:
|
135 |
|
136 |
```bash
|
137 |
-
streamlit run app.py
|
138 |
```
|
139 |
|
140 |
## Command-Line
|
@@ -196,7 +180,7 @@ python main.py --url https://www.youtube.com/watch?v=dQw4w9WgXcQ --tts en-US-Jen
|
|
196 |
|
197 |
- Modify the font color of the subtitles:
|
198 |
|
199 |
-
```
|
200 |
python main.py --sub_format b --font_color #FFF000 --tts en-US-JennyNeural
|
201 |
```
|
202 |
|
@@ -214,36 +198,25 @@ edge-tts --list-voices
|
|
214 |
|
215 |
## Additional Resources
|
216 |
|
217 |
-
###
|
218 |
-
> Contributed by [@duozokker](<https://github.com/duozokker>)
|
219 |
-
|
220 |
-
**reddit2json** is a Python script that transforms Reddit post URLs into a JSON file, streamlining the process of creating video.json files. This tool not only converts Reddit links but also offers functionalities such as translating Reddit post content using DeepL and modifying content through custom OpenAI GPT calls.
|
221 |
-
|
222 |
-
#### reddit2json: Directly Convert Reddit Links to JSON
|
223 |
-
|
224 |
-
reddit2json is designed to process a list of Reddit post URLs, converting them into a JSON format that can be used directly for video creation. This tool enhances the video creation process by providing a faster and more efficient way to generate video.json files.
|
225 |
-
|
226 |
-
[Here is the detailed README for reddit2json](https://github.com/duozokker/reddit2json/blob/main/README.md) which includes instructions for installation, setting up the .env file, example calls, and more.
|
227 |
-
|
228 |
-
## Code of Conduct
|
229 |
|
230 |
Please review our [Code of Conduct](./CODE_OF_CONDUCT.md) before contributing to Whisper-TikTok.
|
231 |
|
232 |
-
|
233 |
|
234 |
We welcome contributions from the community! Please see our [Contributing Guidelines](./CONTRIBUTING.md) for more information.
|
235 |
|
236 |
-
|
237 |
|
238 |
- Integration with the OpenAI API to generate more advanced responses.
|
239 |
- Generate content by extracting it from reddit <https://github.com/MatteoFasulo/Whisper-TikTok/issues/22>
|
240 |
|
241 |
-
|
242 |
|
243 |
- We'd like to give a huge thanks to [@rany2](https://www.github.com/rany2) for their [edge-tts](https://github.com/rany2/edge-tts) package, which made it possible to use the Microsoft Edge Cloud TTS API with Whisper-TikTok.
|
244 |
- We also acknowledge the contributions of the Whisper model by [@OpenAI](https://github.com/openai/whisper) for robust speech recognition via large-scale weak supervision
|
245 |
- Also [@jianfch](https://github.com/jianfch/stable-ts) for the stable-ts package, which made it possible to use the OpenAI Whisper model with Whisper-TikTok in a stable manner with font color and subtitle format options.
|
246 |
|
247 |
-
|
248 |
|
249 |
Whisper-TikTok is licensed under the [Apache License, Version 2.0](https://github.com/MatteoFasulo/Whisper-TikTok/blob/main/LICENSE).
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
# Introducing Whisper-TikTok 🤖🎥
|
2 |
|
3 |
## Star History
|
|
|
36 |
|
37 |
## How it Works
|
38 |
|
39 |
+
Employing Whisper-TikTok is a breeze: simply modify the [clips.csv](clips.csv). The CSV file contains the following attributes:
|
40 |
|
41 |
- `series`: The name of the series.
|
42 |
- `part`: The part number of the video.
|
43 |
- `text`: The text to be spoken in the video.
|
|
|
44 |
- `tags`: The tags to be used for the video.
|
45 |
+
- `outro`: The outro text to be spoken in the video.
|
|
|
|
|
|
|
46 |
|
47 |
<details>
|
48 |
<summary>Details</summary>
|
|
|
64 |
|
65 |
## Web App (Online)
|
66 |
|
67 |
+
There is a Web App hosted thanks to Streamlit which is public available in HuggingFace, just click on the link that will take you directly to the Web App.
|
68 |
+
> https://huggingface.co/spaces/MatteoFasulo/Whisper-TikTok-Demo
|
69 |
|
70 |
## Local Installation
|
71 |
|
|
|
111 |
scoop install ffmpeg
|
112 |
```
|
113 |
|
114 |
+
> Please note that for optimal performance, it's advisable to have a GPU when using the OpenAI Whisper model for Automatic Speech Recognition (ASR). However, the program will also work without a GPU, but it will run more slowly.
|
115 |
|
116 |
## Web-UI (Local)
|
117 |
|
118 |
To run the Web-UI locally, execute the following command within your terminal:
|
119 |
|
120 |
```bash
|
121 |
+
streamlit run app.py
|
122 |
```
|
123 |
|
124 |
## Command-Line
|
|
|
180 |
|
181 |
- Modify the font color of the subtitles:
|
182 |
|
183 |
+
```bash
|
184 |
python main.py --sub_format b --font_color #FFF000 --tts en-US-JennyNeural
|
185 |
```
|
186 |
|
|
|
198 |
|
199 |
## Additional Resources
|
200 |
|
201 |
+
### Code of Conduct
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
202 |
|
203 |
Please review our [Code of Conduct](./CODE_OF_CONDUCT.md) before contributing to Whisper-TikTok.
|
204 |
|
205 |
+
### Contributing
|
206 |
|
207 |
We welcome contributions from the community! Please see our [Contributing Guidelines](./CONTRIBUTING.md) for more information.
|
208 |
|
209 |
+
### Upcoming Features
|
210 |
|
211 |
- Integration with the OpenAI API to generate more advanced responses.
|
212 |
- Generate content by extracting it from reddit <https://github.com/MatteoFasulo/Whisper-TikTok/issues/22>
|
213 |
|
214 |
+
### Acknowledgments
|
215 |
|
216 |
- We'd like to give a huge thanks to [@rany2](https://www.github.com/rany2) for their [edge-tts](https://github.com/rany2/edge-tts) package, which made it possible to use the Microsoft Edge Cloud TTS API with Whisper-TikTok.
|
217 |
- We also acknowledge the contributions of the Whisper model by [@OpenAI](https://github.com/openai/whisper) for robust speech recognition via large-scale weak supervision
|
218 |
- Also [@jianfch](https://github.com/jianfch/stable-ts) for the stable-ts package, which made it possible to use the OpenAI Whisper model with Whisper-TikTok in a stable manner with font color and subtitle format options.
|
219 |
|
220 |
+
### License
|
221 |
|
222 |
Whisper-TikTok is licensed under the [Apache License, Version 2.0](https://github.com/MatteoFasulo/Whisper-TikTok/blob/main/LICENSE).
|
Home.py → app.py
RENAMED
@@ -1,6 +1,5 @@
|
|
1 |
-
import os
|
2 |
import sys
|
3 |
-
import
|
4 |
from pathlib import Path
|
5 |
import asyncio
|
6 |
import platform
|
@@ -10,12 +9,11 @@ import edge_tts
|
|
10 |
import streamlit as st
|
11 |
import pandas as pd
|
12 |
|
13 |
-
from src.video_creator import
|
14 |
from utils import rgb_to_bgr
|
15 |
|
16 |
result = None
|
17 |
|
18 |
-
|
19 |
async def generate_video(
|
20 |
model,
|
21 |
tts_voice,
|
@@ -27,9 +25,8 @@ async def generate_video(
|
|
27 |
non_english,
|
28 |
upload_tiktok,
|
29 |
verbose,
|
30 |
-
video_json,
|
31 |
-
background_tab,
|
32 |
video_num,
|
|
|
33 |
max_words,
|
34 |
*args,
|
35 |
**kwargs):
|
@@ -49,18 +46,18 @@ async def generate_video(
|
|
49 |
max_words=max_words
|
50 |
)
|
51 |
|
52 |
-
async def
|
53 |
with st.status("Generating video...", expanded=False) as status:
|
54 |
-
video_creator =
|
55 |
|
56 |
status.update(label="Downloading video...")
|
57 |
-
video_creator.
|
58 |
|
59 |
status.update(label="Loading model...")
|
60 |
video_creator.load_model()
|
61 |
|
62 |
status.update(label="Creating text...")
|
63 |
-
video_creator.
|
64 |
|
65 |
status.update(label="Generating audio...")
|
66 |
await video_creator.text_to_speech()
|
@@ -73,6 +70,7 @@ async def generate_video(
|
|
73 |
|
74 |
status.update(label="Integrating subtitles...")
|
75 |
video_creator.integrate_subtitles()
|
|
|
76 |
|
77 |
if upload_tiktok:
|
78 |
status.update(label="Uploading to TikTok...")
|
@@ -82,43 +80,24 @@ async def generate_video(
|
|
82 |
state="complete", expanded=False)
|
83 |
return str(video_creator.mp4_final_video)
|
84 |
|
85 |
-
|
86 |
-
|
87 |
-
results = await asyncio.gather(*tasks)
|
88 |
-
|
89 |
-
if len(results) == 1:
|
90 |
-
return results[0]
|
91 |
|
|
|
|
|
92 |
else:
|
93 |
-
return
|
94 |
-
|
95 |
|
96 |
@st.cache_data
|
97 |
-
def
|
98 |
-
return pd.
|
99 |
|
100 |
|
101 |
@st.cache_data
|
102 |
-
def
|
103 |
-
|
104 |
-
|
105 |
-
|
106 |
-
|
107 |
-
# raise an error if the dataframe has no rows (at least one is required)
|
108 |
-
if df.shape[0] == 0:
|
109 |
-
st.error("You must add at least one video to the JSON")
|
110 |
-
return
|
111 |
-
|
112 |
-
# Save the JSON string to a file
|
113 |
-
with open('video.json', 'w', encoding='UTF-8') as f:
|
114 |
-
f.write(json_str)
|
115 |
-
|
116 |
-
st.success("JSON saved successfully!")
|
117 |
-
|
118 |
-
except ValueError as e:
|
119 |
-
st.error("You must fill all the fields in the JSON")
|
120 |
-
except Exception as e:
|
121 |
-
st.error(f"Error saving JSON: {e}")
|
122 |
|
123 |
|
124 |
# Streamlit Config
|
@@ -148,12 +127,12 @@ async def main():
|
|
148 |
st.title("🏆 Whisper-TikTok 🚀")
|
149 |
st.write("Create a TikTok video with text-to-speech of Microsoft Edge's TTS and subtitles of Whisper model.")
|
150 |
|
151 |
-
st.subheader("
|
152 |
-
st.write("ℹ️ The
|
153 |
-
edited_df = st.data_editor(
|
154 |
num_rows="dynamic")
|
155 |
-
st.button("Save
|
156 |
-
edited_df,), help="Save the
|
157 |
|
158 |
st.divider()
|
159 |
|
@@ -164,15 +143,14 @@ async def main():
|
|
164 |
with st.expander("ℹ️ How to use"):
|
165 |
st.write(
|
166 |
"""
|
167 |
-
1. Choose the
|
168 |
2. Choose the model to use for the subtitles.
|
169 |
3. Choose the voice to use for the text-to-speech.
|
170 |
-
4. Choose the background video to use for the
|
171 |
5. Choose the position of the subtitles.
|
172 |
6. Choose the font, font color, and font size for the subtitles.
|
173 |
-
7.
|
174 |
-
8. Check the "
|
175 |
-
9. Check the "Upload to TikTok" checkbox if you want to upload the video to TikTok using the TikTok session cookie. For this step it is required to have a TikTok account and to be logged in on your browser. Then the required cookies.txt file can be generated using this guide
|
176 |
""")
|
177 |
|
178 |
LEFT, RIGHT = st.columns(2)
|
@@ -233,9 +211,7 @@ async def main():
|
|
233 |
|
234 |
st.subheader("Video settings")
|
235 |
|
236 |
-
st.write("
|
237 |
-
with open('video.json', encoding='utf-8') as fh:
|
238 |
-
video_json = st.json(json.load(fh), expanded=False)
|
239 |
|
240 |
# Get the list of files in "background"
|
241 |
folder_path = Path("background").absolute()
|
@@ -244,26 +220,26 @@ async def main():
|
|
244 |
|
245 |
# Create a Dropdown with the list of files
|
246 |
background_tab = st.selectbox(
|
247 |
-
"Your Backgrounds", files, index=0, help="The background video to use for the
|
248 |
|
249 |
-
# Choose which
|
250 |
-
|
|
|
251 |
|
252 |
-
|
253 |
-
|
254 |
-
|
255 |
-
|
256 |
-
|
257 |
-
|
258 |
-
)
|
259 |
|
260 |
-
if st.button("Generate
|
261 |
if not video_num:
|
262 |
-
st.error("You must select at least one
|
263 |
return
|
264 |
global result
|
265 |
result = await generate_video(model, tts_voice, sub_position, font, font_color, font_size,
|
266 |
-
url, non_english, upload_tiktok, verbose,
|
267 |
|
268 |
with RIGHT:
|
269 |
if result:
|
|
|
|
|
1 |
import sys
|
2 |
+
import csv
|
3 |
from pathlib import Path
|
4 |
import asyncio
|
5 |
import platform
|
|
|
9 |
import streamlit as st
|
10 |
import pandas as pd
|
11 |
|
12 |
+
from src.video_creator import ClipMaker
|
13 |
from utils import rgb_to_bgr
|
14 |
|
15 |
result = None
|
16 |
|
|
|
17 |
async def generate_video(
|
18 |
model,
|
19 |
tts_voice,
|
|
|
25 |
non_english,
|
26 |
upload_tiktok,
|
27 |
verbose,
|
|
|
|
|
28 |
video_num,
|
29 |
+
background_tab,
|
30 |
max_words,
|
31 |
*args,
|
32 |
**kwargs):
|
|
|
46 |
max_words=max_words
|
47 |
)
|
48 |
|
49 |
+
async def get_clip(clip, args):
|
50 |
with st.status("Generating video...", expanded=False) as status:
|
51 |
+
video_creator = ClipMaker(clip=clip, args=args)
|
52 |
|
53 |
status.update(label="Downloading video...")
|
54 |
+
video_creator.download_background_video()
|
55 |
|
56 |
status.update(label="Loading model...")
|
57 |
video_creator.load_model()
|
58 |
|
59 |
status.update(label="Creating text...")
|
60 |
+
video_creator.merge_clip_text()
|
61 |
|
62 |
status.update(label="Generating audio...")
|
63 |
await video_creator.text_to_speech()
|
|
|
70 |
|
71 |
status.update(label="Integrating subtitles...")
|
72 |
video_creator.integrate_subtitles()
|
73 |
+
print('HERE x3')
|
74 |
|
75 |
if upload_tiktok:
|
76 |
status.update(label="Uploading to TikTok...")
|
|
|
80 |
state="complete", expanded=False)
|
81 |
return str(video_creator.mp4_final_video)
|
82 |
|
83 |
+
task = [get_clip(clip, args) for clip in video_num]
|
84 |
+
result = await asyncio.gather(*task)
|
|
|
|
|
|
|
|
|
85 |
|
86 |
+
if len(result) == 1:
|
87 |
+
return result[0]
|
88 |
else:
|
89 |
+
return result[-1] # Return the last video generated if multiple videos are generated
|
|
|
90 |
|
91 |
@st.cache_data
|
92 |
+
def csv_to_df(csv_file):
|
93 |
+
return pd.read_csv(csv_file, sep='|', encoding='utf-8')
|
94 |
|
95 |
|
96 |
@st.cache_data
|
97 |
+
def df_to_csv(df):
|
98 |
+
# Save the edited dataframe to the CSV file
|
99 |
+
df.to_csv("clips.csv", index=False, sep='|')
|
100 |
+
return df
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
101 |
|
102 |
|
103 |
# Streamlit Config
|
|
|
127 |
st.title("🏆 Whisper-TikTok 🚀")
|
128 |
st.write("Create a TikTok video with text-to-speech of Microsoft Edge's TTS and subtitles of Whisper model.")
|
129 |
|
130 |
+
st.subheader("Clip Editor", help="Here you can edit the CSV file with the clips data. Copy-and-paste is supported and compatible with Google Sheets, Excel, and others. You can do bulk-editing by dragging the handle on a cell (similar to Excel)!")
|
131 |
+
st.write("ℹ️ The CSV file is saved automatically when you click the button below. Every time you edit the CSV file, you must click the button to save the changes otherwise they will be lost.")
|
132 |
+
edited_df = st.data_editor(csv_to_df("clips.csv"),
|
133 |
num_rows="dynamic")
|
134 |
+
st.button("Save CSV", on_click=df_to_csv, args=(
|
135 |
+
edited_df,), help="Save the CSV file with the clips")
|
136 |
|
137 |
st.divider()
|
138 |
|
|
|
143 |
with st.expander("ℹ️ How to use"):
|
144 |
st.write(
|
145 |
"""
|
146 |
+
1. Choose the clip to generate using the dropdown menu.
|
147 |
2. Choose the model to use for the subtitles.
|
148 |
3. Choose the voice to use for the text-to-speech.
|
149 |
+
4. Choose the background video to use for the clip.
|
150 |
5. Choose the position of the subtitles.
|
151 |
6. Choose the font, font color, and font size for the subtitles.
|
152 |
+
7. Check the "Non-english" checkbox if you want to generate a clip in a non-english language.
|
153 |
+
8. Check the "Upload to TikTok" checkbox if you want to upload the clip to TikTok using the TikTok session cookie. For this step it is required to have a TikTok account and to be logged in on your browser. Then the required cookies.txt file can be generated using the guide specified in the README. The cookies.txt file must be placed in the root folder of the project.
|
|
|
154 |
""")
|
155 |
|
156 |
LEFT, RIGHT = st.columns(2)
|
|
|
211 |
|
212 |
st.subheader("Video settings")
|
213 |
|
214 |
+
st.write("CSV file with the clips")
|
|
|
|
|
215 |
|
216 |
# Get the list of files in "background"
|
217 |
folder_path = Path("background").absolute()
|
|
|
220 |
|
221 |
# Create a Dropdown with the list of files
|
222 |
background_tab = st.selectbox(
|
223 |
+
"Your Backgrounds", files, index=0, help="The background video to use for the clip")
|
224 |
|
225 |
+
# Choose which clip to generate the video for
|
226 |
+
with open('clips.csv', 'r', encoding='utf-8') as csvfile:
|
227 |
+
clips = csv.DictReader(csvfile, delimiter='|')
|
228 |
|
229 |
+
video_num = st.multiselect(
|
230 |
+
"Video",
|
231 |
+
options=clips,
|
232 |
+
format_func=lambda video: f"{video['series']} - {video['part']}",
|
233 |
+
help="The clip to generate. If you want to generate multiple clips, select them as a multiselect."
|
234 |
+
)
|
|
|
235 |
|
236 |
+
if st.button("Generate Clip"):
|
237 |
if not video_num:
|
238 |
+
st.error("You must select at least one clip to generate")
|
239 |
return
|
240 |
global result
|
241 |
result = await generate_video(model, tts_voice, sub_position, font, font_color, font_size,
|
242 |
+
url, non_english, upload_tiktok, verbose, video_num, background_tab, max_words)
|
243 |
|
244 |
with RIGHT:
|
245 |
if result:
|
clips.csv
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
series|part|text|tags|outro
|
2 |
+
Crazy facts that you did not know|4|The first person to survive going over Niagara Falls in a barrel was a 63-year-old school teacher|[survive, Niagara Falls, facts]|I hope you enjoyed this video. If you did, please give it a thumbs up and subscribe to my channel. I will see you in the next video.
|
3 |
+
Crazy facts that you did not know|6|Did you know that the shortest war in history lasted only 38 minutes? It was between Britain and Zanzibar in 1896|[shortest war, history, 38 minutes, Britain, Zanzibar]|I hope you enjoyed this video. If you did, please give it a thumbs up and subscribe to my channel. I will see you in the next video.
|
example-reddit-post.txt
DELETED
@@ -1,2 +0,0 @@
|
|
1 |
-
https://www.reddit.com/r/stories/comments/1afvvvu/my_fiance_had_a_special_name_for_me_when_he_first/
|
2 |
-
https://www.reddit.com/r/stories/comments/1afzk7v/i_think_my_mom_cheated/
|
|
|
|
|
|
example-video.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
[{"series": "Geständnis eines pensionierten FBI-Agenten", "part": "", "outro": "", "text": "Ich habe früher in einer medizinischen Abteilung eines Krankenhauses im Nordwesten gearbeitet. Die Patienten wurden endoskopischen Untersuchungen unterzogen, für die sie sediert wurden. Bei diesem Fall hatten wir einen älteren Herrn als Patienten, während wir auf den Arzt warteten, unterhielten wir uns freundlich, nichts Ungewöhnliches. Als der Arzt herein kam, fragte er uns sofort, ob der Patient uns von seiner Vergangenheit erzählt hätte. Ich begann damit, die medizinischen Gründe aufzuzählen, warum er das Verfahren hatte, aber der Arzt unterbrach mich und sagte: \"Nein, seine bisherige Arbeit als verdeckter FBI-Mob-Agent.\" Natürlich war meine Reaktion: \"Ohhhhh nein... das muss interessant gewesen sein, mit diesen Mafiagangstern umzugehen.\" Die Antwort des Patienten hat mich bis heute verfolgt. Seine genauen Worte waren:.\"Diese Jungs waren nicht so schlimm wie diese verdammten Politiker.\".Dann erzählte er eine Geschichte davon, wie er Leiter der Sicherheit bei einer \"Kongressveranstaltung\" in den 80er Jahren war. Er sagte, ein anderer Agent habe ihm das Telefon gereicht und gesagt, \"ein Kongressabgeordneter\" wolle mit ihm sprechen..Das Gespräch verlief folgendermaßen:.Kongressabgeordneter: Gibt es dort Frauen?.Agent: Ich weiß nicht, was Sie meinen... aber ja, es sind Frauen hier..Kongressabgeordneter: Wenn ich ankomme, möchte ich eine in mein Zimmer geschickt bekommen... \"NICHT ÄLTER ALS 13\"..Direkt nachdem er das gesagt hatte, gab der Anästhesist ihm die Medikamente, und er verlor das Bewusstsein. Wir standen alle einfach da in Stille, während er das Verfahren durchlief... was zum Teufel hat er uns gerade erzählt?.EDIT: Offenbar bleiben Leute an der Verwendung des Begriffs \"Informant\" hängen... also habe ich ihn entfernt. Für Klarheit, die ich für selbstverständlich hielt.. dieser alte Mann war kein \"Mafia-Informant\" im Sinne eines Mob-Spitzels. 
Er war ein pensionierter FBI-Agent, der undercover mit der Mafia gearbeitet hat. Zu einer völlig anderen Zeit behauptete er, von einem Kongressabgeordneten nach eine-jährigen Mädchen gefragt worden zu sein. Dieser Mann hatte keinen Grund zu lügen... er hat es nicht einmal erwähnt, der Chirurg hat es..EDIT 2:.Die Geschichte ist zu 100% wahr, so wie sie passiert ist..Könnte der alte Mann lügen, ja natürlich. Glaube ich, dass er gelogen hat, NEIN!.Die Untersuchung war eine EGD \"obere Endoskopie\"..Der Eingriff wurde von einem Chirurgen zur postoperativen Überwachung durchgeführt, nicht von einem Gastroenterologen..Ihr Nörgler müsst verstehen, dass es elitäre Pädophilenringe gibt und sie schon seit langer Zeit existieren..Diejenigen, die dies als eine Unterstützung für eine politische Weltanschauung betrachten, liegen falsch. Ich habe keine politische Zugehörigkeit..Für all diejenigen, die behaupten \"Das FBI ist nicht für Sicherheit verantwortlich und arbeitet nicht mit dem Kongress zusammen.\" Ihr nehmt an, dass ihr wisst, in welcher Funktion dieser Mann während seiner gesamten Karriere gearbeitet hat??.https://de.wikipedia.org/wiki/FBI_Police.\"Aufgaben und Verantwortlichkeiten\".\"Die FBI-Polizei kann gelegentlich bei bedeutenden nationalen Sicherheitsveranstaltungen eingesetzt werden, wie Präsidenteneinführungen, dem Super Bowl, Konferenzen von weltweiten Führern sowie großen politischen Parteikonferenzen.\""}]
|
|
|
|
example.env
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
REDDIT_USER_AGENT=
|
2 |
-
REDDIT_CLIENT_ID=
|
3 |
-
REDDIT_CLIENT_SECRET=
|
4 |
-
|
5 |
-
DEEPL_AUTH_KEY=
|
6 |
-
|
7 |
-
OPENAI_API_KEY=
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
main.py
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
# utils.py
|
2 |
import asyncio
|
3 |
-
import
|
4 |
import platform
|
5 |
from dotenv import find_dotenv, load_dotenv
|
6 |
from utils import *
|
@@ -8,24 +8,18 @@ from utils import *
|
|
8 |
# msg.py
|
9 |
import msg
|
10 |
|
11 |
-
# logger.py
|
12 |
-
from src.logger import setup_logger
|
13 |
-
|
14 |
# arg_parser.py
|
15 |
from src.arg_parser import parse_args
|
16 |
|
17 |
# video_creator.py
|
18 |
-
from src.video_creator import
|
19 |
|
20 |
# Default directory
|
21 |
HOME = Path.cwd()
|
22 |
|
23 |
-
#
|
24 |
-
|
25 |
-
|
26 |
-
# JSON video file
|
27 |
-
video_json_path = HOME / 'video.json'
|
28 |
-
jsonData = json.loads(video_json_path.read_text(encoding='utf-8'))
|
29 |
|
30 |
|
31 |
#######################
|
@@ -33,25 +27,23 @@ jsonData = json.loads(video_json_path.read_text(encoding='utf-8'))
|
|
33 |
#######################
|
34 |
|
35 |
|
36 |
-
async def main() -> bool:
|
37 |
console.clear() # Clear terminal
|
38 |
|
39 |
args = await parse_args()
|
40 |
-
videos = jsonData
|
41 |
|
42 |
-
for video in
|
43 |
-
logger.debug('Creating video')
|
44 |
with console.status(msg.STATUS) as status:
|
45 |
-
load_dotenv(find_dotenv()) # Optional
|
46 |
|
47 |
-
|
48 |
-
|
49 |
-
|
|
|
50 |
|
51 |
-
video_creator =
|
52 |
-
video_creator.
|
53 |
video_creator.load_model()
|
54 |
-
video_creator.
|
55 |
await video_creator.text_to_speech()
|
56 |
video_creator.generate_transcription()
|
57 |
video_creator.select_background()
|
@@ -60,7 +52,7 @@ async def main() -> bool:
|
|
60 |
video_creator.upload_to_tiktok()
|
61 |
|
62 |
console.log(f'{msg.DONE} {str(video_creator.mp4_final_video)}')
|
63 |
-
return
|
64 |
|
65 |
|
66 |
if __name__ == "__main__":
|
@@ -70,7 +62,7 @@ if __name__ == "__main__":
|
|
70 |
|
71 |
loop = asyncio.get_event_loop()
|
72 |
|
73 |
-
loop.run_until_complete(main())
|
74 |
|
75 |
loop.close()
|
76 |
|
|
|
1 |
# utils.py
|
2 |
import asyncio
|
3 |
+
import csv
|
4 |
import platform
|
5 |
from dotenv import find_dotenv, load_dotenv
|
6 |
from utils import *
|
|
|
8 |
# msg.py
|
9 |
import msg
|
10 |
|
|
|
|
|
|
|
11 |
# arg_parser.py
|
12 |
from src.arg_parser import parse_args
|
13 |
|
14 |
# video_creator.py
|
15 |
+
from src.video_creator import ClipMaker
|
16 |
|
17 |
# Default directory
|
18 |
HOME = Path.cwd()
|
19 |
|
20 |
+
# List of clips to generate
|
21 |
+
video_csv = HOME / 'clips.csv'
|
22 |
+
video_data = csv.DictReader(open(video_csv, 'r', encoding='utf-8'), delimiter='|')
|
|
|
|
|
|
|
23 |
|
24 |
|
25 |
#######################
|
|
|
27 |
#######################
|
28 |
|
29 |
|
30 |
+
async def main(video_list) -> bool:
|
31 |
console.clear() # Clear terminal
|
32 |
|
33 |
args = await parse_args()
|
|
|
34 |
|
35 |
+
for video in video_list:
|
|
|
36 |
with console.status(msg.STATUS) as status:
|
|
|
37 |
|
38 |
+
# Load env vars (if any)
|
39 |
+
load_dotenv(find_dotenv())
|
40 |
+
|
41 |
+
console.log(f"{msg.OK}Finish loading environment variables")
|
42 |
|
43 |
+
video_creator = ClipMaker(video, args)
|
44 |
+
video_creator.download_background_video()
|
45 |
video_creator.load_model()
|
46 |
+
video_creator.merge_clip_text()
|
47 |
await video_creator.text_to_speech()
|
48 |
video_creator.generate_transcription()
|
49 |
video_creator.select_background()
|
|
|
52 |
video_creator.upload_to_tiktok()
|
53 |
|
54 |
console.log(f'{msg.DONE} {str(video_creator.mp4_final_video)}')
|
55 |
+
return True
|
56 |
|
57 |
|
58 |
if __name__ == "__main__":
|
|
|
62 |
|
63 |
loop = asyncio.get_event_loop()
|
64 |
|
65 |
+
loop.run_until_complete(main(video_list=video_data))
|
66 |
|
67 |
loop.close()
|
68 |
|
packages.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
ffmpeg
|
pages/Reddit.py
DELETED
@@ -1,119 +0,0 @@
|
|
1 |
-
from pathlib import Path
|
2 |
-
import random
|
3 |
-
import streamlit as st
|
4 |
-
|
5 |
-
import praw
|
6 |
-
|
7 |
-
HOME = Path(__name__).parent.absolute()
|
8 |
-
|
9 |
-
|
10 |
-
@st.cache_data
|
11 |
-
def create_instance(*args, **kwargs):
|
12 |
-
reddit = praw.Reddit(
|
13 |
-
client_id=kwargs.get('client_id'),
|
14 |
-
client_secret=kwargs.get('client_secret'),
|
15 |
-
user_agent=kwargs.get('user_agent'),
|
16 |
-
)
|
17 |
-
|
18 |
-
subreddit = get_subreddit(reddit=reddit, subreddit=kwargs.get(
|
19 |
-
'subreddit'), nsfw=kwargs.get('nsfw'))
|
20 |
-
submission = get_random_submission(subreddit=subreddit)
|
21 |
-
st.session_state['submission'] = submission
|
22 |
-
return True
|
23 |
-
|
24 |
-
|
25 |
-
def get_subreddit(*args, **kwargs):
|
26 |
-
reddit = kwargs.get('reddit')
|
27 |
-
subreddit = reddit.subreddit(kwargs.get('subreddit'))
|
28 |
-
nsfw = kwargs.get('nsfw')
|
29 |
-
try:
|
30 |
-
st.text(f"Subreddit: {subreddit.display_name}")
|
31 |
-
except Exception as exception:
|
32 |
-
st.exception(exception=exception)
|
33 |
-
|
34 |
-
if subreddit.over18 and not nsfw:
|
35 |
-
st.error(
|
36 |
-
body='subreddit has NSFW contents but you did not select to scrape them')
|
37 |
-
return subreddit
|
38 |
-
|
39 |
-
|
40 |
-
def get_random_submission(*args, **kwargs):
|
41 |
-
subreddit = kwargs.get('subreddit')
|
42 |
-
submissions = [submission for submission in subreddit.hot(limit=10)]
|
43 |
-
return random.choice(submissions)
|
44 |
-
|
45 |
-
|
46 |
-
# Streamlit Config
|
47 |
-
st.set_page_config(
|
48 |
-
page_title="Whisper-TikTok",
|
49 |
-
page_icon="💬",
|
50 |
-
layout="wide",
|
51 |
-
initial_sidebar_state="expanded",
|
52 |
-
menu_items={
|
53 |
-
'Get Help': 'https://github.com/MatteoFasulo/Whisper-TikTok',
|
54 |
-
'Report a bug': "https://github.com/MatteoFasulo/Whisper-TikTok/issues",
|
55 |
-
'About':
|
56 |
-
"""
|
57 |
-
# Whisper-TikTok
|
58 |
-
Whisper-TikTok is an innovative AI-powered tool that leverages the prowess of Edge TTS, OpenAI-Whisper, and FFMPEG to craft captivating TikTok videos also with a web application interface!
|
59 |
-
|
60 |
-
Mantainer: https://github.com/MatteoFasulo
|
61 |
-
|
62 |
-
If you find a bug or if you just have questions about the project feel free to reach me at https://github.com/MatteoFasulo/Whisper-TikTok
|
63 |
-
Any contribution to this project is welcome to improve the quality of work!
|
64 |
-
"""
|
65 |
-
}
|
66 |
-
)
|
67 |
-
|
68 |
-
with st.sidebar:
|
69 |
-
with st.expander("ℹ️ How to use"):
|
70 |
-
st.write(
|
71 |
-
"""
|
72 |
-
Before starting you will need to create a new [Reddit API App](https://www.reddit.com/prefs/apps) by selecting `script` (personal use).
|
73 |
-
Then, after putting the App name, http://localhost as `reddit uri` and `about url`, you have just to insert those values in this dashboard to use the Reddit API for scraping any subreddit.
|
74 |
-
""")
|
75 |
-
client_id = st.text_input(label='Reddit Client ID')
|
76 |
-
client_secret = st.text_input(
|
77 |
-
label='Reddit Client Secret', type='password')
|
78 |
-
user_agent = st.text_input(label='Reddit User Agent')
|
79 |
-
|
80 |
-
|
81 |
-
st.title("🏆 Whisper-TikTok 🚀")
|
82 |
-
st.subheader('Reddit section')
|
83 |
-
st.write("""
|
84 |
-
This section allows you to generate videos from subreddits.""")
|
85 |
-
|
86 |
-
st.divider()
|
87 |
-
|
88 |
-
LEFT, RIGHT = st.columns(2)
|
89 |
-
|
90 |
-
with LEFT:
|
91 |
-
num_videos = st.number_input(label='How many videos do you want to generate?',
|
92 |
-
min_value=1, max_value=10, value=1, step=1)
|
93 |
-
|
94 |
-
subreddit = st.text_input(
|
95 |
-
label='What Subreddit do you want to use', placeholder='AskReddit')
|
96 |
-
|
97 |
-
nsfw = st.checkbox(label='NSFW content?', value=False)
|
98 |
-
|
99 |
-
max_chars = st.slider(label='Maximum number of characters per line',
|
100 |
-
min_value=10, max_value=50, value=38, step=1)
|
101 |
-
|
102 |
-
max_words = st.number_input(label='Maximum number of words per line', min_value=1,
|
103 |
-
max_value=5, value=2, step=1)
|
104 |
-
|
105 |
-
result = st.button('Get subreddit')
|
106 |
-
|
107 |
-
with RIGHT:
|
108 |
-
if result:
|
109 |
-
create_instance(client_id=client_id, client_secret=client_secret,
|
110 |
-
user_agent=user_agent, subreddit=subreddit, nsfw=nsfw)
|
111 |
-
submission = st.session_state['submission']
|
112 |
-
title = submission.title
|
113 |
-
submission.comment_sort = "new"
|
114 |
-
top_level_comments = list(submission.comments)
|
115 |
-
max_comments = 10
|
116 |
-
st.subheader(title)
|
117 |
-
for comment in top_level_comments[:max_comments]:
|
118 |
-
st.text(comment.body)
|
119 |
-
st.divider()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
pages/__init__.py
DELETED
File without changes
|
reddit-post.txt
DELETED
File without changes
|
reddit2json.py
DELETED
@@ -1,133 +0,0 @@
|
|
1 |
-
import praw
|
2 |
-
import requests
|
3 |
-
import json
|
4 |
-
import os
|
5 |
-
import re
|
6 |
-
from tqdm import tqdm
|
7 |
-
|
8 |
-
from openai import OpenAI
|
9 |
-
from dotenv import load_dotenv
|
10 |
-
import argparse
|
11 |
-
|
12 |
-
|
13 |
-
load_dotenv() # take environment variables from .env.
|
14 |
-
|
15 |
-
|
16 |
-
# Parse command-line arguments
|
17 |
-
parser = argparse.ArgumentParser(description='Process Reddit posts.')
|
18 |
-
parser.add_argument('--method', type=str, default='chat', choices=['translate', 'chat'],
|
19 |
-
help='Method to use for processing text. "translate" uses Deepl, "chat" uses GPT-3.5 Turbo.')
|
20 |
-
parser.add_argument('--lang', type=str, default='EN',
|
21 |
-
help='Target language for translation. Only used if method is "translate".')
|
22 |
-
args = parser.parse_args()
|
23 |
-
|
24 |
-
|
25 |
-
client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
|
26 |
-
|
27 |
-
|
28 |
-
def chat_with_gpt3(prompt):
|
29 |
-
completion = client.chat.completions.create(
|
30 |
-
model="gpt-3.5-turbo",
|
31 |
-
messages=[
|
32 |
-
{"role": "system", "content": f"You are an assistant that meaningfully translates English Reddit post texts into Language:{args.lang} and optimizes them for text-to-speech. The following is a Reddit post that you should translate and optimize for text-to-speech"},
|
33 |
-
{"role": "user", "content": prompt}
|
34 |
-
]
|
35 |
-
)
|
36 |
-
# Extract the content attribute
|
37 |
-
return completion.choices[0].message.content
|
38 |
-
|
39 |
-
|
40 |
-
def get_reddit_post(url):
|
41 |
-
reddit = praw.Reddit(
|
42 |
-
client_id=os.getenv("REDDIT_CLIENT_ID"),
|
43 |
-
client_secret=os.getenv("REDDIT_CLIENT_SECRET"),
|
44 |
-
user_agent=os.getenv("REDDIT_USER_AGENT"),
|
45 |
-
)
|
46 |
-
post = reddit.submission(url=url)
|
47 |
-
return post.title, post.selftext
|
48 |
-
|
49 |
-
|
50 |
-
def translate_to_german(text):
|
51 |
-
# url = "https://api.deepl.com/v2/translate"
|
52 |
-
url = "https://api-free.deepl.com/v2/translate"
|
53 |
-
data = {
|
54 |
-
"auth_key": os.getenv("DEEPL_AUTH_KEY"),
|
55 |
-
"text": text,
|
56 |
-
"target_lang": args.lang,
|
57 |
-
}
|
58 |
-
response = requests.post(url, data=data)
|
59 |
-
response_json = response.json()
|
60 |
-
return response_json['translations'][0]['text']
|
61 |
-
|
62 |
-
|
63 |
-
def process_text(title, text):
|
64 |
-
if args.method == 'translate':
|
65 |
-
title = translate_to_german(title)
|
66 |
-
text = translate_to_german(text)
|
67 |
-
elif args.method == 'chat':
|
68 |
-
title = chat_with_gpt3(
|
69 |
-
f"Translate the following title into Language: {args.lang} and adjust it so that it is optimized for a lecture by a text-to-speech program. Also remove all parentheses such as (29m) or (M23) or (M25) etc. Also remove all edits from the Reddit post so only the pure text remains:" + "\n\n" + "title" + "\n\n" + "Revised title:")
|
70 |
-
text = chat_with_gpt3(
|
71 |
-
f"Translate the following text into Language: {args.lang} and adjust it so that it is optimized for a lecture by a text-to-speech program. Also remove all parentheses such as (29m) or (M23) or (M25) or (19) etc. Also remove all edits from the Reddit post so only the pure text remains. Break off the text at the most exciting point to keep the readers very curious:" + "\n\n" + "text" + "\n\n" + "Revised text:")
|
72 |
-
return title, text
|
73 |
-
|
74 |
-
|
75 |
-
def modify_json(title_text, part_text, outro_text, main_text):
|
76 |
-
data = []
|
77 |
-
for i in range(len(title_text)):
|
78 |
-
data.append({
|
79 |
-
"series": title_text[i],
|
80 |
-
"part": part_text[i],
|
81 |
-
"outro": outro_text[i],
|
82 |
-
"text": main_text[i]
|
83 |
-
})
|
84 |
-
|
85 |
-
with open('./video.json', 'w', encoding='utf-8') as f:
|
86 |
-
json.dump(data, f, ensure_ascii=False)
|
87 |
-
|
88 |
-
|
89 |
-
def read_file_line_by_line(file_path):
|
90 |
-
with open(file_path, 'r') as file:
|
91 |
-
for line in file:
|
92 |
-
yield line
|
93 |
-
|
94 |
-
|
95 |
-
title_text = []
|
96 |
-
main_text = []
|
97 |
-
|
98 |
-
# Convert generator to list to get length
|
99 |
-
lines = list(read_file_line_by_line('./reddit-post.txt'))
|
100 |
-
|
101 |
-
for line in tqdm(lines, desc="Processing Reddit posts", unit="post"):
|
102 |
-
title, text = get_reddit_post(line)
|
103 |
-
title, text = process_text(title, text)
|
104 |
-
|
105 |
-
title = title.replace('\n\n', '.') # replace '\n\n' with ' ' in title
|
106 |
-
text = text.replace('\n\n', '.') # replace '\n\n' with ' ' in text
|
107 |
-
|
108 |
-
title = title.replace('​', '') # replace , with '' in title
|
109 |
-
text = text.replace('​', '') # replace , with '' in text
|
110 |
-
|
111 |
-
# remove gender and age indications from title and text
|
112 |
-
title = re.sub(r'\(?\d+\s*[mwMW]\)?', '', title)
|
113 |
-
text = re.sub(r'\(?\d+\s*[mwMW]\)?', '', text)
|
114 |
-
|
115 |
-
# remove gender and age indications where M/W is written before the number
|
116 |
-
title = re.sub(r'\(?\s*[mwMW]\s*\d+\)?', '', title)
|
117 |
-
text = re.sub(r'\(?\s*[mwMW]\s*\d+\)?', '', text)
|
118 |
-
|
119 |
-
# remove characters not allowed in a Windows filename from title
|
120 |
-
title = re.sub(r'[<>:"/\\|?*,]', '', title)
|
121 |
-
|
122 |
-
text = text.replace('Edit:', '')
|
123 |
-
text = text.replace('edit:', '')
|
124 |
-
|
125 |
-
title_text.append(title)
|
126 |
-
main_text.append(text)
|
127 |
-
|
128 |
-
# Initialize part_text and outro_text after the loop
|
129 |
-
part_text = [""] * len(title_text)
|
130 |
-
outro_text = [""] * len(title_text)
|
131 |
-
|
132 |
-
|
133 |
-
modify_json(title_text, part_text, outro_text, main_text)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
requirements.txt
CHANGED
@@ -14,4 +14,4 @@ tiktok-uploader
|
|
14 |
streamlit
|
15 |
praw
|
16 |
requests
|
17 |
-
openai
|
|
|
14 |
streamlit
|
15 |
praw
|
16 |
requests
|
17 |
+
openai
|
src/subtitle_creator.py
CHANGED
@@ -3,16 +3,22 @@ from pathlib import Path
|
|
3 |
import torch
|
4 |
|
5 |
|
6 |
-
def srt_create(whisper_model, path: str, series: str, part: int,
|
|
|
|
|
|
|
7 |
series = series.replace(' ', '_')
|
8 |
|
|
|
9 |
srt_path = f"{path}{os.sep}{series}{os.sep}"
|
10 |
srt_filename = f"{srt_path}{series}_{part}.srt"
|
11 |
ass_filename = f"{srt_path}{series}_{part}.ass"
|
12 |
|
|
|
13 |
absolute_srt_path = Path(srt_filename).absolute()
|
14 |
absolute_ass_path = Path(ass_filename).absolute()
|
15 |
|
|
|
16 |
word_dict = {
|
17 |
'Fontname': kwargs.get('font', 'Arial'),
|
18 |
'Alignment': kwargs.get('sub_position', 5),
|
@@ -25,13 +31,16 @@ def srt_create(whisper_model, path: str, series: str, part: int, text: str, file
|
|
25 |
'MarginR': '0',
|
26 |
}
|
27 |
|
|
|
28 |
transcribe = whisper_model.transcribe(
|
29 |
filename, regroup=True, fp16=torch.cuda.is_available())
|
30 |
|
|
|
31 |
transcribe.split_by_gap(0.5).split_by_length(kwargs.get(
|
32 |
'max_characters')).merge_by_gap(0.15, max_words=kwargs.get('max_words'))
|
33 |
|
34 |
transcribe.to_srt_vtt(str(absolute_srt_path), word_level=True)
|
35 |
transcribe.to_ass(str(absolute_ass_path), word_level=True,
|
36 |
highlight_color=kwargs.get('font_color'), **word_dict)
|
|
|
37 |
return ass_filename
|
|
|
3 |
import torch
|
4 |
|
5 |
|
6 |
+
def srt_create(whisper_model, path: str, series: str, part: int, filename: str, **kwargs) -> str:
|
7 |
+
# Transcribe using Whisper model
|
8 |
+
|
9 |
+
# Replace whitespaces with underscores for series name
|
10 |
series = series.replace(' ', '_')
|
11 |
|
12 |
+
# Retrieve the folder path of srt and ass files
|
13 |
srt_path = f"{path}{os.sep}{series}{os.sep}"
|
14 |
srt_filename = f"{srt_path}{series}_{part}.srt"
|
15 |
ass_filename = f"{srt_path}{series}_{part}.ass"
|
16 |
|
17 |
+
# Get the absolute path
|
18 |
absolute_srt_path = Path(srt_filename).absolute()
|
19 |
absolute_ass_path = Path(ass_filename).absolute()
|
20 |
|
21 |
+
# Subtitle style dict
|
22 |
word_dict = {
|
23 |
'Fontname': kwargs.get('font', 'Arial'),
|
24 |
'Alignment': kwargs.get('sub_position', 5),
|
|
|
31 |
'MarginR': '0',
|
32 |
}
|
33 |
|
34 |
+
# Transcribe the .mp3 file using Whisper
|
35 |
transcribe = whisper_model.transcribe(
|
36 |
filename, regroup=True, fp16=torch.cuda.is_available())
|
37 |
|
38 |
+
# Adjustments to the style
|
39 |
transcribe.split_by_gap(0.5).split_by_length(kwargs.get(
|
40 |
'max_characters')).merge_by_gap(0.15, max_words=kwargs.get('max_words'))
|
41 |
|
42 |
transcribe.to_srt_vtt(str(absolute_srt_path), word_level=True)
|
43 |
transcribe.to_ass(str(absolute_ass_path), word_level=True,
|
44 |
highlight_color=kwargs.get('font_color'), **word_dict)
|
45 |
+
|
46 |
return ass_filename
|
src/video_creator.py
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
-
import json
|
2 |
from pathlib import Path
|
3 |
|
4 |
import stable_whisper as whisper
|
5 |
-
|
|
|
6 |
from .subtitle_creator import srt_create
|
7 |
from .text_to_speech import tts
|
8 |
from .tiktok import upload_tiktok
|
@@ -11,85 +11,107 @@ from .video_downloader import download_video as youtube_download
|
|
11 |
from utils import *
|
12 |
|
13 |
HOME = Path.cwd()
|
14 |
-
logger = setup_logger()
|
15 |
media_folder = HOME / 'media'
|
16 |
|
17 |
|
18 |
-
class
|
19 |
-
def __init__(self,
|
|
|
20 |
self.args = args
|
21 |
-
self.video = video
|
22 |
|
23 |
-
|
24 |
-
self.
|
25 |
-
self.
|
26 |
-
self.
|
27 |
-
self.
|
|
|
|
|
|
|
28 |
self.path = Path(media_folder).absolute()
|
29 |
|
30 |
-
def
|
|
|
31 |
youtube_download(url=self.args.url, folder=folder)
|
32 |
-
|
33 |
-
|
34 |
-
|
35 |
|
36 |
def load_model(self):
|
|
|
37 |
model = self.args.model
|
|
|
38 |
if self.args.model != "large" and not self.args.non_english:
|
39 |
model = self.args.model + ".en"
|
|
|
40 |
whisper_model = whisper.load_model(model)
|
41 |
|
|
|
42 |
self.model = whisper_model
|
43 |
return whisper_model
|
44 |
|
45 |
-
def
|
46 |
-
|
|
|
|
|
|
|
47 |
series = self.series.replace(' ', '_')
|
48 |
filename = f"{self.path}{os.sep}{series}{os.sep}{series}_{self.part}.mp3"
|
49 |
|
|
|
50 |
Path(f"{self.path}{os.sep}{series}").mkdir(parents=True, exist_ok=True)
|
51 |
|
|
|
52 |
self.req_text = req_text
|
53 |
self.mp3_file = filename
|
54 |
return req_text, filename
|
55 |
|
56 |
-
async def text_to_speech(self):
|
|
|
57 |
await tts(self.req_text, outfile=self.mp3_file, voice=self.args.tts, args=self.args)
|
|
|
58 |
|
59 |
-
def generate_transcription(self):
|
|
|
60 |
ass_filename = srt_create(self.model,
|
61 |
-
self.path, self.series, self.part, self.
|
|
|
|
|
62 |
ass_filename = Path(ass_filename).absolute()
|
63 |
|
|
|
64 |
self.ass_file = ass_filename
|
65 |
return ass_filename
|
66 |
|
67 |
-
def select_background(self):
|
|
|
68 |
try:
|
69 |
-
# Background video selected with WebUI
|
70 |
-
|
71 |
-
|
72 |
-
|
73 |
-
|
74 |
-
|
75 |
-
except AttributeError:
|
76 |
-
|
77 |
-
|
78 |
-
|
79 |
-
|
80 |
-
|
|
|
|
|
81 |
self.mp4_background = background_mp4
|
82 |
return background_mp4
|
83 |
|
84 |
-
def integrate_subtitles(self):
|
85 |
-
|
86 |
-
|
87 |
final_video = Path(final_video).absolute()
|
88 |
|
|
|
89 |
self.mp4_final_video = final_video
|
90 |
return final_video
|
91 |
|
92 |
-
def upload_to_tiktok(self):
|
93 |
-
|
94 |
-
|
95 |
return uploaded
|
|
|
|
|
1 |
from pathlib import Path
|
2 |
|
3 |
import stable_whisper as whisper
|
4 |
+
|
5 |
+
# Local imports
|
6 |
from .subtitle_creator import srt_create
|
7 |
from .text_to_speech import tts
|
8 |
from .tiktok import upload_tiktok
|
|
|
11 |
from utils import *
|
12 |
|
13 |
HOME = Path.cwd()
|
|
|
14 |
media_folder = HOME / 'media'
|
15 |
|
16 |
|
17 |
+
class ClipMaker:
|
18 |
+
def __init__(self, clip: dict, args):
|
19 |
+
self.clip = clip
|
20 |
self.args = args
|
|
|
21 |
|
22 |
+
# Fetch clip data or set default values
|
23 |
+
self.series = clip.get('series', 'Crazy facts that you did not know')
|
24 |
+
self.part = clip.get('part', '1')
|
25 |
+
self.text = clip.get('text', 'The first person to survive going over Niagara Falls in a barrel was a 63-year-old school teacher')
|
26 |
+
self.tags = clip.get('tags', ['survive', 'Niagara Falls', 'facts'])
|
27 |
+
self.outro = clip.get('outro', 'I hope you enjoyed this video. If you did, please give it a thumbs up and subscribe to my channel. I will see you in the next video.')
|
28 |
+
|
29 |
+
# Set media folder path
|
30 |
self.path = Path(media_folder).absolute()
|
31 |
|
32 |
+
def download_background_video(self, folder='background') -> None:
|
33 |
+
# Download background video for the clip
|
34 |
youtube_download(url=self.args.url, folder=folder)
|
35 |
+
|
36 |
+
console.log(f"{msg.OK}Video downloaded from {self.args.url} to {folder}")
|
37 |
+
return None
|
38 |
|
39 |
def load_model(self):
|
40 |
+
# Load Whisper model
|
41 |
model = self.args.model
|
42 |
+
|
43 |
if self.args.model != "large" and not self.args.non_english:
|
44 |
model = self.args.model + ".en"
|
45 |
+
|
46 |
whisper_model = whisper.load_model(model)
|
47 |
|
48 |
+
# Set model to class attribute
|
49 |
self.model = whisper_model
|
50 |
return whisper_model
|
51 |
|
52 |
+
def merge_clip_text(self) -> tuple:
|
53 |
+
# Merge clip series, part, text and outro to create a single text for the clip
|
54 |
+
req_text = f"{self.series} - Part {self.part}.\n{self.text}\n{self.outro}" # TODO: allow user to customize this
|
55 |
+
|
56 |
+
# Remove whitespaces from series name and create a folder for the series
|
57 |
series = self.series.replace(' ', '_')
|
58 |
filename = f"{self.path}{os.sep}{series}{os.sep}{series}_{self.part}.mp3"
|
59 |
|
60 |
+
# Create series folder if it does not exist
|
61 |
Path(f"{self.path}{os.sep}{series}").mkdir(parents=True, exist_ok=True)
|
62 |
|
63 |
+
# Set class attributes for text and mp3 (audio) file
|
64 |
self.req_text = req_text
|
65 |
self.mp3_file = filename
|
66 |
return req_text, filename
|
67 |
|
68 |
+
async def text_to_speech(self) -> None:
|
69 |
+
# Convert text to speech using the selected TTS voice
|
70 |
await tts(self.req_text, outfile=self.mp3_file, voice=self.args.tts, args=self.args)
|
71 |
+
return None
|
72 |
|
73 |
+
def generate_transcription(self) -> Path:
|
74 |
+
# Generate subtitles for the clip using the Whisper model
|
75 |
ass_filename = srt_create(self.model,
|
76 |
+
self.path, self.series, self.part, self.mp3_file, **vars(self.args))
|
77 |
+
|
78 |
+
# Get the absolute path of .ass file
|
79 |
ass_filename = Path(ass_filename).absolute()
|
80 |
|
81 |
+
# Set class attribute for .ass style file of subtitles
|
82 |
self.ass_file = ass_filename
|
83 |
return ass_filename
|
84 |
|
85 |
+
def select_background(self, random: bool = True) -> Path:
|
86 |
+
# Select which background video to use for the clip
|
87 |
try:
|
88 |
+
# Background video selected with WebUI for Streamlit
|
89 |
+
# Add to the path the parent folder (background)
|
90 |
+
background_file = self.args.mp4_background
|
91 |
+
background_mp4 = Path(HOME / 'background' / background_file) # Concat path
|
92 |
+
background_mp4 = background_mp4.absolute()
|
93 |
+
|
94 |
+
except AttributeError: # Local CLI execution
|
95 |
+
if random:
|
96 |
+
background_mp4 = random_background()
|
97 |
+
|
98 |
+
else: # TODO: allow the user to select which background video to use
|
99 |
+
pass
|
100 |
+
|
101 |
+
# Set class attribute for mp4 background file
|
102 |
self.mp4_background = background_mp4
|
103 |
return background_mp4
|
104 |
|
105 |
+
def integrate_subtitles(self) -> Path:
|
106 |
+
# Use FFMPEG to integrate subtitles into background video and trim everything with fixed length of the audio file
|
107 |
+
final_video = prepare_background(str(self.mp4_background), filename_mp3=self.mp3_file, filename_srt=str(self.ass_file), verbose=self.args.verbose)
|
108 |
final_video = Path(final_video).absolute()
|
109 |
|
110 |
+
# Set class attribute for mp4 final clip file
|
111 |
self.mp4_final_video = final_video
|
112 |
return final_video
|
113 |
|
114 |
+
def upload_to_tiktok(self) -> bool: # TODO: check if still working with Cookie
|
115 |
+
# Automatic upload on TikTok
|
116 |
+
uploaded = upload_tiktok(str(self.mp4_final_video), title=f"{self.series} - {self.part}", tags=self.tags, headless=not self.args.verbose)
|
117 |
return uploaded
|
src/video_downloader.py
CHANGED
@@ -1,13 +1,10 @@
|
|
1 |
import subprocess
|
2 |
from pathlib import Path
|
3 |
|
4 |
-
import msg
|
5 |
-
from utils import KeepDir
|
6 |
-
|
7 |
HOME = Path.cwd()
|
8 |
|
9 |
|
10 |
-
def download_video(url: str, folder: str = 'background'):
|
11 |
"""
|
12 |
Downloads a video from the given URL and saves it to the specified folder.
|
13 |
|
@@ -19,7 +16,5 @@ def download_video(url: str, folder: str = 'background'):
|
|
19 |
if not directory.exists():
|
20 |
directory.mkdir()
|
21 |
|
22 |
-
|
23 |
-
|
24 |
-
subprocess.run(['yt-dlp', '-f bestvideo[ext=mp4]',
|
25 |
-
'--restrict-filenames', url], check=True)
|
|
|
1 |
import subprocess
|
2 |
from pathlib import Path
|
3 |
|
|
|
|
|
|
|
4 |
HOME = Path.cwd()
|
5 |
|
6 |
|
7 |
+
def download_video(url: str, folder: str = 'background') -> None:
|
8 |
"""
|
9 |
Downloads a video from the given URL and saves it to the specified folder.
|
10 |
|
|
|
16 |
if not directory.exists():
|
17 |
directory.mkdir()
|
18 |
|
19 |
+
subprocess.run(['yt-dlp', '-f bestvideo[ext=mp4]', '--restrict-filenames', '--windows-filenames', f'-P {directory}', url], check=True)
|
20 |
+
return None
|
|
|
|
src/video_prepare.py
CHANGED
@@ -9,31 +9,49 @@ HOME = Path.cwd()
|
|
9 |
|
10 |
|
11 |
def prepare_background(background_mp4: str, filename_mp3: str, filename_srt: str, verbose: bool = False) -> str:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
video_info = get_info(background_mp4, kind='video')
|
13 |
video_duration = int(round(video_info.get('duration'), 0))
|
14 |
|
15 |
audio_info = get_info(filename_mp3, kind='audio')
|
16 |
audio_duration = int(round(audio_info.get('duration'), 0))
|
17 |
|
|
|
18 |
ss = random.randint(0, (video_duration-audio_duration))
|
|
|
|
|
19 |
audio_duration = convert_time(audio_duration)
|
20 |
if ss < 0:
|
21 |
ss = 0
|
22 |
|
23 |
-
|
24 |
-
srt_filename = filename_srt.name
|
25 |
-
srt_path = filename_srt.parent.absolute()
|
26 |
-
|
27 |
directory = HOME / 'output'
|
28 |
if not directory.exists():
|
29 |
directory.mkdir()
|
30 |
|
|
|
31 |
outfile = f"{HOME}{os.sep}output{os.sep}output_{ss}.mp4"
|
32 |
|
33 |
if verbose:
|
34 |
rich_print(
|
35 |
f"{filename_srt = }\n{background_mp4 = }\n{filename_mp3 = }\n", style='bold green')
|
36 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
37 |
args = [
|
38 |
"ffmpeg",
|
39 |
"-ss", str(ss),
|
@@ -42,7 +60,7 @@ def prepare_background(background_mp4: str, filename_mp3: str, filename_srt: str
|
|
42 |
"-i", filename_mp3,
|
43 |
"-map", "0:v",
|
44 |
"-map", "1:a",
|
45 |
-
"-vf", f"crop=ih/16*9:ih, scale=w=1080:h=1920:flags=lanczos, ass='{srt_filename}'",
|
46 |
"-c:v", "libx264",
|
47 |
"-crf", "23",
|
48 |
"-c:a", "aac",
|
@@ -55,8 +73,10 @@ def prepare_background(background_mp4: str, filename_mp3: str, filename_srt: str
|
|
55 |
if verbose:
|
56 |
rich_print('[i] FFMPEG Command:\n'+' '.join(args)+'\n', style='yellow')
|
57 |
|
58 |
-
|
59 |
-
|
60 |
-
|
|
|
|
|
61 |
|
62 |
return outfile
|
|
|
9 |
|
10 |
|
11 |
def prepare_background(background_mp4: str, filename_mp3: str, filename_srt: str, verbose: bool = False) -> str:
|
12 |
+
|
13 |
+
# Check if the input files are strings
|
14 |
+
assert isinstance(background_mp4, str)
|
15 |
+
assert isinstance(filename_srt, str)
|
16 |
+
assert isinstance(filename_mp3, str)
|
17 |
+
|
18 |
+
# Get the duration of the video and audio files
|
19 |
video_info = get_info(background_mp4, kind='video')
|
20 |
video_duration = int(round(video_info.get('duration'), 0))
|
21 |
|
22 |
audio_info = get_info(filename_mp3, kind='audio')
|
23 |
audio_duration = int(round(audio_info.get('duration'), 0))
|
24 |
|
25 |
+
# Randomly select a start time for the audio file
|
26 |
ss = random.randint(0, (video_duration-audio_duration))
|
27 |
+
|
28 |
+
# Convert the time to HH:MM:SS format
|
29 |
audio_duration = convert_time(audio_duration)
|
30 |
if ss < 0:
|
31 |
ss = 0
|
32 |
|
33 |
+
# Create the output directory if it does not exist
|
|
|
|
|
|
|
34 |
directory = HOME / 'output'
|
35 |
if not directory.exists():
|
36 |
directory.mkdir()
|
37 |
|
38 |
+
# Set the output file path
|
39 |
outfile = f"{HOME}{os.sep}output{os.sep}output_{ss}.mp4"
|
40 |
|
41 |
if verbose:
|
42 |
rich_print(
|
43 |
f"{filename_srt = }\n{background_mp4 = }\n{filename_mp3 = }\n", style='bold green')
|
44 |
|
45 |
+
# Switch inside the subtitle file directory
|
46 |
+
old_dir = os.getcwd()
|
47 |
+
os.chdir(Path(filename_srt).parent)
|
48 |
+
|
49 |
+
# Extract only the filename from the path
|
50 |
+
# This is to avoid any issues with the path (see https://stackoverflow.com/questions/71597897/unable-to-parse-option-value-xxx-srt-as-image-size-in-ffmpeg)
|
51 |
+
# First we switch inside the directory of the subtitle file and then we execute the FFMPEG command with the filename only (not the full path)
|
52 |
+
filename_srt_name = Path(filename_srt).name
|
53 |
+
|
54 |
+
# FFMPEG Command
|
55 |
args = [
|
56 |
"ffmpeg",
|
57 |
"-ss", str(ss),
|
|
|
60 |
"-i", filename_mp3,
|
61 |
"-map", "0:v",
|
62 |
"-map", "1:a",
|
63 |
+
"-vf", f"crop=ih/16*9:ih, scale=w=1080:h=1920:flags=lanczos, gblur=sigma=2, ass='{filename_srt_name}'",
|
64 |
"-c:v", "libx264",
|
65 |
"-crf", "23",
|
66 |
"-c:a", "aac",
|
|
|
73 |
if verbose:
|
74 |
rich_print('[i] FFMPEG Command:\n'+' '.join(args)+'\n', style='yellow')
|
75 |
|
76 |
+
# Execute the FFMPEG command
|
77 |
+
subprocess.run(args, check=True)
|
78 |
+
|
79 |
+
# Go back to old dir
|
80 |
+
os.chdir(old_dir)
|
81 |
|
82 |
return outfile
|
utils.py
CHANGED
@@ -1,4 +1,3 @@
|
|
1 |
-
import datetime
|
2 |
import os
|
3 |
from pathlib import Path
|
4 |
import random
|
@@ -8,32 +7,15 @@ import ffmpeg
|
|
8 |
from rich.console import Console
|
9 |
|
10 |
import msg
|
11 |
-
from src.logger import setup_logger
|
12 |
-
|
13 |
|
14 |
console = Console()
|
15 |
-
logger = setup_logger()
|
16 |
-
|
17 |
-
|
18 |
-
class KeepDir:
    """
    Context manager that remembers the working directory at construction
    time and restores it when the ``with`` block exits.
    """

    def __init__(self):
        # Snapshot the directory we must return to on exit.
        self.original_dir = os.getcwd()

    def __enter__(self):
        # Nothing to acquire; expose the manager itself so callers
        # can invoke ``chdir`` on it inside the ``with`` block.
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        # Always jump back to the remembered directory, even on error.
        os.chdir(self.original_dir)

    def chdir(self, path):
        """Change the current working directory to *path*."""
        os.chdir(path)
|
30 |
|
31 |
|
32 |
def rich_print(text, style: str = ""):
|
33 |
console.print(text, style=style)
|
34 |
|
35 |
|
36 |
-
def random_background(folder: str = "background") -> str:
|
37 |
"""
|
38 |
Returns the filename of a random file in the specified folder.
|
39 |
|
@@ -41,18 +23,21 @@ def random_background(folder: str = "background") -> str:
|
|
41 |
folder(str): The folder containing the files.
|
42 |
|
43 |
Returns:
|
44 |
-
|
45 |
"""
|
|
|
46 |
directory = Path(folder).absolute()
|
|
|
|
|
47 |
if not directory.exists():
|
48 |
directory.mkdir()
|
49 |
|
50 |
-
|
51 |
-
|
52 |
-
files = os.listdir(".")
|
53 |
-
random_file = random.choice(files)
|
54 |
-
return Path(random_file).absolute()
|
55 |
|
|
|
|
|
|
|
56 |
|
57 |
def get_info(filename: str, kind: str):
|
58 |
global probe
|
@@ -61,7 +46,6 @@ def get_info(filename: str, kind: str):
|
|
61 |
probe = ffmpeg.probe(filename)
|
62 |
except ffmpeg.Error as e:
|
63 |
console.log(f"{msg.ERROR}{e.stderr}")
|
64 |
-
logger.exception(e.stderr)
|
65 |
sys.exit(1)
|
66 |
|
67 |
if kind == 'video':
|
|
|
|
|
1 |
import os
|
2 |
from pathlib import Path
|
3 |
import random
|
|
|
7 |
from rich.console import Console
|
8 |
|
9 |
import msg
|
|
|
|
|
10 |
|
11 |
console = Console()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
|
13 |
|
14 |
def rich_print(text, style: str = "") -> None:
    """Print *text* to the module-level Rich console, applying *style*."""
    console.print(text, style=style)
|
16 |
|
17 |
|
18 |
+
def random_background(folder: str = "background") -> Path:
    """
    Return the absolute path of a randomly chosen file in *folder*.

    Args:
        folder (str): The folder containing the background files.

    Returns:
        Path: The absolute path of the randomly selected file.

    Raises:
        FileNotFoundError: If the folder contains no files.
    """
    # Get the absolute path of the folder
    directory = Path(folder).absolute()

    # Create the folder if it does not exist
    if not directory.exists():
        directory.mkdir()

    # Guard against an empty folder: random.choice would otherwise fail
    # with an opaque IndexError instead of a clear, actionable message.
    entries = os.listdir(directory)
    if not entries:
        raise FileNotFoundError(f"No background files found in '{directory}'")

    # Select a random background video for the clip inside the folder
    # and return its absolute path (folder path + file name).
    return directory / random.choice(entries)
|
41 |
|
42 |
def get_info(filename: str, kind: str):
|
43 |
global probe
|
|
|
46 |
probe = ffmpeg.probe(filename)
|
47 |
except ffmpeg.Error as e:
|
48 |
console.log(f"{msg.ERROR}{e.stderr}")
|
|
|
49 |
sys.exit(1)
|
50 |
|
51 |
if kind == 'video':
|
video.json
DELETED
@@ -1,19 +0,0 @@
|
|
1 |
-
[
|
2 |
-
{
|
3 |
-
"series": "Crazy facts that you did not know",
|
4 |
-
"part": "4",
|
5 |
-
"outro": "Follow us for more",
|
6 |
-
"text": "Sku",
|
7 |
-
"tags": [
|
8 |
-
"chess",
|
9 |
-
"facts",
|
10 |
-
"crazy"
|
11 |
-
]
|
12 |
-
},
|
13 |
-
{
|
14 |
-
"series": "Crazy facts that you did not know",
|
15 |
-
"part": "5",
|
16 |
-
"outro": "Follow us for more",
|
17 |
-
"text": "Test"
|
18 |
-
}
|
19 |
-
]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|