Spaces:

Sven33
/

SATE

Sleeping

File size: 2,358 Bytes

67d6834

import os
import json
import base64
import requests

def wav_to_base64_url(wav_path):
    with open(wav_path, "rb") as f:
        b64_audio = base64.b64encode(f.read()).decode()
    return f"data:audio/wav;base64,{b64_audio}"

def is_api_available(api_url):
    try:
        response = requests.get(api_url)
        return response.status_code < 500
    except Exception as e:
        print("[Error] Cannot reach API:", e)
        return False

def annotate_mispronunciation(session_id, api_url="http://localhost:8080", base_dir="session_data"):
    json_path = os.path.join(base_dir, session_id, f"{session_id}_transcriptionCW.json")
    if not os.path.exists(json_path):
        print(f"[Error] File not found: {json_path}")
        return

    if not is_api_available(api_url):
        print(f"[Error] API not available at {api_url}")
        return

    with open(json_path, "r", encoding="utf-8") as f:
        data = json.load(f)

    segments = data.get("segments", [])
    for segment in segments:
        start = segment["start"]
        end = segment["end"]
        speaker = segment["speaker"]
        filename = f"{session_id}-{start:.2f}-{end:.2f}-{speaker}.wav"
        filepath = os.path.join(base_dir, session_id, filename)
        if not os.path.exists(filepath):
            print(f"[Warning] Audio file missing: {filename}")
            continue

        audio_url = wav_to_base64_url(filepath)
        try:
            resp = requests.post(
                f"{api_url}/vocallens/api/analyze",
                headers={"Content-Type": "application/json"},
                data=json.dumps([audio_url])
            )
            if resp.status_code == 200:
                result = resp.json()
                segment["mispronunciation"] = result.get("ce", "")
            else:
                print(f"[Warning] API error {resp.status_code} for {filename}")
                segment["mispronunciation"] = ""
        except Exception as e:
            print(f"[Error] Exception during API call for {filename}:", e)
            segment["mispronunciation"] = ""

    with open(json_path, "w", encoding="utf-8") as f:
        json.dump(data, f, indent=4, ensure_ascii=False)
    
    print(f"Session {session_id} mispronunciation annotation done: {json_path}")
    return data

if __name__ == "__main__":
    annotate_mispronunciation("000030")