smxxxxxxx committed on
Commit
f12944f
·
verified ·
1 Parent(s): 00c470c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +13 -6
app.py CHANGED
@@ -43,12 +43,19 @@ def convert_audio_to_wav(audio_file):
43
  return None
44
 
45
  def evaluate_asr_accuracy(transcription, reference):
46
- """Calculate WER and CER metrics"""
47
- transformation = jiwer.Compose([
48
- jiwer.ToLowerCase(), jiwer.RemovePunctuation(), jiwer.RemoveMultipleSpaces()
49
- ])
50
- wer = jiwer.wer(reference, transcription, truth_transform=transformation, hypothesis_transform=transformation)
51
- return 1 - wer, 1 - jiwer.cer(reference, transcription, truth_transform=transformation)
 
 
 
 
 
 
 
52
 
53
  # Cached dataset loading with audio decoding
54
  @st.cache_data(show_spinner=False)
 
43
  return None
44
 
45
  def evaluate_asr_accuracy(transcription, reference):
46
+ """Simplified evaluation with direct string processing"""
47
+ # 简单预处理
48
+ ref_processed = reference.lower().strip()
49
+ hyp_processed = transcription.lower().strip()
50
+
51
+ if not ref_processed: # 参考文本为空
52
+ return 0.0, 0.0
53
+
54
+ # 计算WER和CER
55
+ wer = jiwer.wer(ref_processed, hyp_processed)
56
+ cer = jiwer.cer(ref_processed, hyp_processed)
57
+
58
+ return 1 - wer, 1 - cer
59
 
60
  # Cached dataset loading with audio decoding
61
  @st.cache_data(show_spinner=False)