dtkne committed on
Commit
506f1dd
·
verified ·
1 Parent(s): 4c8f8ee

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -3,10 +3,10 @@ import os
3
  from moviepy.editor import VideoFileClip
4
  from transformers import pipeline
5
 
6
- # Load ASR (Speech-to-Text) pipeline
7
  asr = pipeline(task="automatic-speech-recognition", model="distil-whisper/distil-small.en")
8
 
9
- # Load Summarization model
10
  summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
11
 
12
  def transcribe_and_summarize(video_file):
@@ -23,11 +23,11 @@ def transcribe_and_summarize(video_file):
23
  transcription_result = asr(audio_path, return_timestamps=True)
24
  transcribed_text = " ".join([segment['text'] for segment in transcription_result['chunks']])
25
 
26
- # Summarize if long enough
27
  if len(transcribed_text.split()) < 50:
28
  summarized_text = "Text too short to summarize."
29
  else:
30
- summary_result = summarizer(transcribed_text, max_length=100, min_length=30, do_sample=False)
31
  summarized_text = summary_result[0]['summary_text']
32
 
33
  return transcribed_text, summarized_text
 
3
  from moviepy.editor import VideoFileClip
4
  from transformers import pipeline
5
 
6
+ # ASR (Speech-to-Text) pipeline
7
  asr = pipeline(task="automatic-speech-recognition", model="distil-whisper/distil-small.en")
8
 
9
+ # Summarization model
10
  summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
11
 
12
  def transcribe_and_summarize(video_file):
 
23
  transcription_result = asr(audio_path, return_timestamps=True)
24
  transcribed_text = " ".join([segment['text'] for segment in transcription_result['chunks']])
25
 
26
+ # Summarize
27
  if len(transcribed_text.split()) < 50:
28
  summarized_text = "Text too short to summarize."
29
  else:
30
+ summary_result = summarizer(transcribed_text, max_length=500, min_length=30, do_sample=False)
31
  summarized_text = summary_result[0]['summary_text']
32
 
33
  return transcribed_text, summarized_text