Spaces:

Sabbah13
/

text_transcribation_diarization_and_summarization

Paused

text_transcribation_diarization_and_summarization

File size: 3,603 Bytes

ee531be
 
8fb0be5
ee531be
 
 
 
 
 
d74e638
ee531be
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8fb0be5
ee531be
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8fb0be5
ee531be
 
 
8fb0be5
ee531be
 
 
 
 
8fb0be5
ee531be
 
 
 
 
 
8fb0be5
ee531be
 
8fb0be5
ee531be
 
 
8fb0be5
ee531be
 
 
17e6aa5
ee531be

import requests
import base64
import os
import json
import streamlit as st
from speechlib import Transcriptor

def transcribe_audio(file, log_folder, language, modelSize, ACCESS_TOKEN, voices_folder, quantization):
    transcriptor = Transcriptor(file, log_folder, language, modelSize, ACCESS_TOKEN, voices_folder, quantization)
    return transcriptor.whisper()
    
def transform_transcript(transcript):
    result = []
    for segment in transcript:
        start_time, end_time, text, speaker = segment
        result.append(f"{speaker} ({start_time:.1f} : {end_time:.1f}) : {text}")
    return '\n'.join(result)
    
st.title('Audio Transcription App')

ACCESS_TOKEN = st.secrets["HF_TOKEN"]

uploaded_file = st.file_uploader("Загрузите аудиофайл", type=["mp4", "wav", "m4a"])

if uploaded_file is not None:
    file_extension = uploaded_file.name.split(".")[-1]  # Получаем расширение файла
    temp_file_path = f"temp_file.{file_extension}"  # Создаем временное имя файла с правильным расширением
    
    with open(temp_file_path, "wb") as f:
        f.write(uploaded_file.getbuffer())
        
    log_folder = "logs"
    language = "ru"
    modelSize = os.getenv('WHISPER_MODEL_SIZE')
    voices_folder = ""
    quantization = False
    
    with st.spinner('Транскрибируем...'):
        result = transcribe_audio(temp_file_path, log_folder, language, modelSize, ACCESS_TOKEN, voices_folder, quantization)
        
    st.write("Результат транскрибации:")
    transcript = transform_transcript(result)
    st.text(transcript)
    
    with st.spinner('Резюмируем...'):
        username = st.secrets["GIGA_USERNAME"]
        password = st.secrets["GIGA_SECRET"]
        
        # Получаем строку с базовой авторизацией в формате Base64
        auth_str = f'{username}:{password}'
        auth_bytes = auth_str.encode('utf-8')
        auth_base64 = base64.b64encode(auth_bytes).decode('utf-8')
        url = os.getenv('GIGA_AUTH_URL')
        
        headers = {
            'Authorization': f'Basic {auth_base64}',  # вставляем базовую авторизацию
            'RqUID': os.getenv('GIGA_rquid'),
            'Content-Type': 'application/x-www-form-urlencoded',
            'Accept': 'application/json'
        }
        
        data = {
            'scope': os.getenv('GIGA_SCOPE')
        }
        
        response = requests.post(url, headers=headers, data=data, verify=False)
        access_token = response.json()['access_token']
        print('Got access token')
        
        url_completion = os.getenv('GIGA_COMPLETION_URL')
        
        data_copm = json.dumps({
          "model": os.getenv('GIGA_MODEL'),
          "messages": [
            {
              "role": "user",
              "content": os.getenv('GIGA_BASE_PROMPT') + transcript
            }
          ],
          "stream": False,
          "max_tokens": int(os.getenv('GIGA_MAX_TOKENS')),
        })
        
        headers_comp = {
          'Content-Type': 'application/json',
          'Accept': 'application/json',
          'Authorization': 'Bearer ' + access_token
        }
        
        response = requests.post(url_completion, headers=headers_comp, data=data_copm, verify=False)
        response_data = response.json()
        answer_from_llm = response_data['choices'][0]['message']['content']
        
    st.write("Результат резюмирования:")
    st.text(answer_from_llm)