Updated with code

This commit is contained in:
DataAnts-AI
2025-01-28 17:00:03 -05:00
parent 2b37a68c56
commit 3c44257d8a
8 changed files with 180 additions and 0 deletions

4
.gitignore vendored Normal file
View File

@ -0,0 +1,4 @@
__pycache__/
*.pyc
.env
.DS_Store

25
README.md Normal file
View File

@ -0,0 +1,25 @@
# OBS Recording Transcriber
Process OBS recordings with AI-based transcription and summarization.
## Features
- AI transcription using Whisper.
- Summarization using Hugging Face Transformers.
- File selection, resource validation, and error handling.
## Installation
1. Clone the repo.
git clone https://github.com/yourusername/OBS_Recording_Transcriber.git
cd OBS_Recording_Transcriber
2. Install dependencies:
pip install -r requirements.txt
Notes:
Ensure that the versions align with the features you use and your system compatibility.
torch version should match the capabilities of your hardware (e.g., CUDA support for GPUs).
Whisper is published on PyPI as the openai-whisper package; install it with pip install openai-whisper (or from OpenAI's GitHub repository) if a plain "whisper" install fails.
If you encounter any issues regarding compatibility, versions may need adjustments.
3. Run the app:
   streamlit run app.py

58
app.py Normal file
View File

@ -0,0 +1,58 @@
import streamlit as st
from utils.audio_processing import extract_audio
from utils.transcription import transcribe_audio
from utils.summarization import summarize_text
from utils.validation import validate_environment
from pathlib import Path
def main():
    """Streamlit entry point: pick an OBS recording, transcribe and summarize it.

    Flow: choose a base folder -> validate environment -> pick an .mp4 ->
    extract its audio track -> transcribe + summarize -> show/download results.
    """
    st.title("🎥 OBS Recording Transcriber")
    st.caption("Process your OBS recordings with AI transcription and summarization")

    # Allow the user to select a base folder
    st.sidebar.header("Folder Selection")
    base_folder = st.sidebar.text_input(
        "Enter the base folder path:",
        value=str(Path.home())
    )
    base_path = Path(base_folder)

    # Validate environment before doing any expensive work
    env_errors = validate_environment(base_path)
    if env_errors:
        st.error("## Environment Issues")
        for error in env_errors:
            st.markdown(f"- {error}")
        return

    # File selection
    recordings = list(base_path.glob("*.mp4"))
    if not recordings:
        st.warning(f"📂 No recordings found in the folder: {base_folder}!")
        return
    selected_file = st.selectbox("Choose a recording", recordings)

    if st.button("🚀 Start Processing"):
        try:
            # FIX: extract_audio was imported but never called — the raw .mp4
            # was handed straight to the transcriber. Extract the audio track
            # first, as utils.audio_processing is designed to do.
            with st.spinner("Extracting audio..."):
                audio_path = extract_audio(selected_file)
            with st.spinner("Transcribing and summarizing..."):
                transcript, summary = transcribe_audio(audio_path)
            if transcript:
                st.subheader("🖍 Summary")
                st.write(summary)
                st.subheader("📜 Full Transcript")
                with st.expander("View transcript content"):
                    st.text(transcript)
                st.download_button(
                    label="💾 Download Transcript",
                    data=transcript,
                    # selected_file is already a Path — no need to re-wrap it
                    file_name=f"{selected_file.stem}_transcript.txt",
                    mime="text/plain"
                )
            else:
                st.error("❌ Failed to process recording")
        except Exception as e:
            st.error(f"An error occurred: {e}")
            st.write(e)  # This will show the traceback in the Streamlit app

if __name__ == "__main__":
    main()

5
requirements.txt Normal file
View File

@ -0,0 +1,5 @@
streamlit==1.26.0
moviepy==1.0.3
openai-whisper
transformers==4.21.1
torch>=1.7.0

12
utils/audio_processing.py Normal file
View File

@ -0,0 +1,12 @@
from moviepy.editor import AudioFileClip
from pathlib import Path
def extract_audio(video_path: Path):
    """Pull the audio track out of *video_path* into a sibling WAV file.

    Returns the path of the written ``<stem>_audio.wav`` file.
    Raises RuntimeError when moviepy cannot read or write the clip.
    """
    target = video_path.parent / f"{video_path.stem}_audio.wav"
    try:
        clip = AudioFileClip(str(video_path))
        # verbose/logger silenced so moviepy doesn't spam the Streamlit log
        clip.write_audiofile(str(target), verbose=False, logger=None)
        return target
    except Exception as e:
        raise RuntimeError(f"Audio extraction failed: {e}")

8
utils/summarization.py Normal file
View File

@ -0,0 +1,8 @@
from transformers import pipeline
SUMMARY_MODEL = "Falconsai/text_summarization"
def summarize_text(text):
    """Return a short summary of *text* via a Hugging Face summarization pipeline."""
    summarizer = pipeline("summarization", model=SUMMARY_MODEL)
    outputs = summarizer(text, max_length=150, min_length=30, do_sample=False)
    first = outputs[0]
    return first["summary_text"]

60
utils/transcription.py Normal file
View File

@ -0,0 +1,60 @@
import whisper
from pathlib import Path
from transformers import pipeline, AutoTokenizer
WHISPER_MODEL = "base"
SUMMARIZATION_MODEL = "t5-base"
def transcribe_audio(audio_path: Path):
    """Transcribe *audio_path* with Whisper and return (transcript, summary)."""
    whisper_model = whisper.load_model(WHISPER_MODEL)
    transcription = whisper_model.transcribe(str(audio_path))
    text = transcription["text"]
    return text, summarize_text(text)
def summarize_text(text):
    """Summarize *text* with a T5 pipeline, chunking inputs that exceed the window.

    Texts longer than ``max_tokens`` are split into word-aligned chunks (see
    ``chunk_text``); each chunk is summarized independently and the partial
    summaries are joined with spaces.

    FIXES: reuse the pipeline's own tokenizer instead of loading a second
    AutoTokenizer for the same checkpoint, and count tokens from the plain
    ``input_ids`` list instead of allocating a torch tensor just for ``len``.
    """
    summarization_pipeline = pipeline("summarization", model=SUMMARIZATION_MODEL)
    # The pipeline already carries the matching tokenizer — no second load.
    tokenizer = summarization_pipeline.tokenizer
    max_tokens = 512  # T5's usual encoder window
    num_tokens = len(tokenizer(text)["input_ids"])
    if num_tokens > max_tokens:
        summaries = []
        for chunk in chunk_text(text, max_tokens):
            # "summarize: " is the T5 task prefix expected by the checkpoint.
            summary_output = summarization_pipeline(
                "summarize: " + chunk, max_length=150, min_length=30, do_sample=False
            )
            summaries.append(summary_output[0]['summary_text'])
        overall_summary = " ".join(summaries)
    else:
        overall_summary = summarization_pipeline(
            "summarize: " + text, max_length=150, min_length=30, do_sample=False
        )[0]['summary_text']
    return overall_summary
def chunk_text(text, max_tokens):
    """Split *text* into whitespace-word chunks of at most *max_tokens* tokens each.

    Returns a list of strings; words are never split across chunks.

    FIXES over the original:
    - the tokenizer is loaded once per call, not consulted with a fresh torch
      tensor for every single word;
    - special tokens are excluded explicitly (``add_special_tokens=False``)
      instead of the approximate ``- 2`` correction, which over-subtracted for
      T5 (it appends a single EOS token);
    - a word that alone exceeds ``max_tokens`` no longer flushes an empty
      ``''`` chunk into the result.
    """
    tokenizer = AutoTokenizer.from_pretrained(SUMMARIZATION_MODEL)
    chunks = []
    current_chunk = []
    current_length = 0
    for word in text.split():
        word_tokens = len(tokenizer(word, add_special_tokens=False)["input_ids"])
        # Flush the running chunk only when it is non-empty and adding this
        # word would overflow the budget.
        if current_chunk and current_length + word_tokens > max_tokens:
            chunks.append(' '.join(current_chunk))
            current_chunk = []
            current_length = 0
        current_chunk.append(word)
        current_length += word_tokens
    if current_chunk:
        chunks.append(' '.join(current_chunk))
    return chunks

8
utils/validation.py Normal file
View File

@ -0,0 +1,8 @@
from pathlib import Path
def validate_environment(obs_path: Path):
    """Check prerequisites for processing; return human-readable error strings.

    An empty list means the environment is usable.
    """
    if obs_path.exists():
        return []
    return [f"OBS directory not found: {obs_path}"]