Spaces:

Sven33
/

SATE

Sleeping

SATE / mispronunciation.py

Shuwei Hou

init

67d6834 2 months ago

2.36 kB

	import os
	import json
	import base64
	import requests

	def wav_to_base64_url(wav_path):
	with open(wav_path, "rb") as f:
	b64_audio = base64.b64encode(f.read()).decode()
	return f"data:audio/wav;base64,{b64_audio}"

	def is_api_available(api_url):
	try:
	response = requests.get(api_url)
	return response.status_code < 500
	except Exception as e:
	print("[Error] Cannot reach API:", e)
	return False

	def annotate_mispronunciation(session_id, api_url="http://localhost:8080", base_dir="session_data"):
	json_path = os.path.join(base_dir, session_id, f"{session_id}_transcriptionCW.json")
	if not os.path.exists(json_path):
	print(f"[Error] File not found: {json_path}")
	return

	if not is_api_available(api_url):
	print(f"[Error] API not available at {api_url}")
	return

	with open(json_path, "r", encoding="utf-8") as f:
	data = json.load(f)

	segments = data.get("segments", [])
	for segment in segments:
	start = segment["start"]
	end = segment["end"]
	speaker = segment["speaker"]
	filename = f"{session_id}-{start:.2f}-{end:.2f}-{speaker}.wav"
	filepath = os.path.join(base_dir, session_id, filename)
	if not os.path.exists(filepath):
	print(f"[Warning] Audio file missing: {filename}")
	continue

	audio_url = wav_to_base64_url(filepath)
	try:
	resp = requests.post(
	f"{api_url}/vocallens/api/analyze",
	headers={"Content-Type": "application/json"},
	data=json.dumps([audio_url])
	)
	if resp.status_code == 200:
	result = resp.json()
	segment["mispronunciation"] = result.get("ce", "")
	else:
	print(f"[Warning] API error {resp.status_code} for {filename}")
	segment["mispronunciation"] = ""
	except Exception as e:
	print(f"[Error] Exception during API call for {filename}:", e)
	segment["mispronunciation"] = ""

	with open(json_path, "w", encoding="utf-8") as f:
	json.dump(data, f, indent=4, ensure_ascii=False)

	print(f"Session {session_id} mispronunciation annotation done: {json_path}")
	return data

	if __name__ == "__main__":
	annotate_mispronunciation("000030")