"""Streamlit front end for the Multimodal ERC project.

The page asks for a video file and its transcript, passes both (together
with the model paths) to the inference routine, and shows the returned
emotion.
"""

import streamlit as st

import hf_inference

# Placeholder shown in the transcript box; inference is skipped until the
# user replaces it with a real transcript.
DEFAULT_TRANSCRIPT = '''That's obligatory.'''

# TODO(review): these three paths were referenced but never defined in the
# original script -- replace the placeholders with the real model locations.
text_model_path = "path/to/text_model"
video_model_path = "path/to/video_model"
audio_model_path = "path/to/audio_model"

# Dictionary of model paths handed to the inference call.
models_dict = {
    'text_model_path': text_model_path,
    'video_model_path': video_model_path,
    'audio_model_path': audio_model_path,
}

st.title("Multimodal ERC project")

uploaded_file = st.file_uploader("Choose a video")
input_text = st.text_area("Please, write transcript", DEFAULT_TRANSCRIPT)

# Boolean `and` is required here: the bitwise `&` binds tighter than the
# comparisons and would evaluate `None & input_text`, raising TypeError.
if uploaded_file is not None and input_text != DEFAULT_TRANSCRIPT:
    # Send the video and the text to inference and receive the emotion output.
    # NOTE(review): assumes `hf_inference` exposes `infer_multimodal_model`;
    # the original called it unqualified without importing it -- confirm.
    output_emotion = hf_inference.infer_multimodal_model(
        input_text, uploaded_file, models_dict
    )
    st.write(f"We think that's {output_emotion}")