File size: 1,799 Bytes
5fb0891 427e7ec 5fb0891 427e7ec 5fb0891 427e7ec 5fb0891 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 |
import whisper
import os
import pandas as pd
import plotly_express as px
import nltk
import plotly.graph_objects as go
from optimum.onnxruntime import ORTModelForSequenceClassification
from transformers import pipeline, AutoTokenizer, AutoModelForSequenceClassification, AutoModelForTokenClassification
from sentence_transformers import SentenceTransformer, CrossEncoder, util
import streamlit as st
import en_core_web_lg
nltk.download('punkt')
from nltk import sent_tokenize
# Token is read from the process environment; it is None when the variable is unset.
auth_token = os.getenv("auth_token")

# Sidebar: page heading followed by the transcription-model picker.
st.sidebar.header("Home")
asr_model_options = ["tiny.en", "base.en", "small.en"]
asr_model_name = st.sidebar.selectbox(
    "Transcription model",
    options=asr_model_options,
    key="sbox",
)

# Main page: title, Twitter follow badge, then a short usage hint.
st.markdown("## Interview analyzer")
twitter_link = (
    "\n"
    "[![](https://img.shields.io/twitter/follow/nickmuchi?label=@nickmuchi&style=social)]"
    "(https://twitter.com/nickmuchi)"
    "\n"
)
st.markdown(twitter_link)

# NOTE(review): the leading "๐" looks like a mis-decoded emoji; confirm the
# intended character against the original file before changing it.
st.markdown(
    "\n**๐ Enter a YouTube Earnings Call URL below and navigate to the sidebar tabs**\n"
)
# Seed session-state entries only when they are absent, so values already
# stored in the session are left untouched.
# NOTE(review): "sbox" is also the key of the transcription-model selectbox,
# so Streamlit has presumably registered it already; confirm whether this
# first guard can ever fire.
if "sbox" not in st.session_state:
    st.session_state["sbox"] = asr_model_name

# Both of these entries start out as an empty string.
for state_key in ("earnings_passages", "sen_df"):
    if state_key not in st.session_state:
        st.session_state[state_key] = ""
# URL entry box, pre-filled with a sample video link.
url_input = st.text_input(
    label="Enter YouTube URL, example below is McDonalds Earnings Call Q1 2023",
    value="https://www.youtube.com/watch?v=4p6o5kkZYyA",
)

# Ensure the "url" entry exists, then store the current box contents in it
# on every run of the script.
if "url" not in st.session_state:
    st.session_state["url"] = ""
st.session_state["url"] = url_input
# Centered red "OR" heading shown between the URL box and the uploader;
# unsafe_allow_html is required for the inline-styled <h3> to render.
st.markdown(
    "<h3 style='text-align: center; color: red;'>OR</h3>",
    unsafe_allow_html=True,
)

# Alternative input: an uploaded file restricted to the listed extensions.
upload_wav = st.file_uploader(
    "Upload a .wav/.mp3/.mp4 audio file ",
    key="upload",
    type=[".wav", ".mp3", ".mp4"],
)
|