Skip to content

Commit

Permalink
Merge pull request #29 from opensource-spraakherkenning-nl/add-bn-nl-variations
Browse files Browse the repository at this point in the history

Add variations from top 20 confusion pairs
  • Loading branch information
greenw0lf authored Nov 20, 2023
2 parents 665acda + 526ffd1 commit 54196eb
Show file tree
Hide file tree
Showing 2 changed files with 11 additions and 5 deletions.
2 changes: 0 additions & 2 deletions ASR_NL_benchmark/interface.py
Original file line number Diff line number Diff line change
Expand Up @@ -22,8 +22,6 @@ def upload_page():
kind = request.form.get('kind')
skip_ref_norm = request.form.get('skip-ref-norm')
skip_hyp_norm = request.form.get('skip-hyp-norm')
print(skip_hyp_norm)
print(skip_ref_norm)
global benchmarking
benchmarking = pipeline.Pipeline(hyp, 'ctm', ref, 'stm', kind, skip_ref_norm, skip_hyp_norm)
Thread(target=benchmarking.main).start()
Expand Down
14 changes: 11 additions & 3 deletions ASR_NL_benchmark/variations.glm
Original file line number Diff line number Diff line change
Expand Up @@ -13,8 +13,6 @@ z'n => zijn / [ ] __ [ ]
'k => ik / [ ] __ [ ]
'r => er / [ ] __ [ ]
'ns => eens / [ ] __ [ ]
ie => hij / [ ] __ [ ]
da's => dat is / [ ] __ [ ]
d'ruit => eruit / [ ] __ [ ]
restaurant- => restaurant / [ ] __ [ ]
jeugd- => jeugd / [ ] __ [ ]
Expand Down Expand Up @@ -59,7 +57,6 @@ tewerk => te werk / [ ] __ [ ]
[concept-] => [{ concept- / concept }] / [ ] __ [ ]
[NAVO-] => [{ NAVO- / NAVO }] / [ ] __ [ ]
[uh] => [{ uh / %HESITATION }] / [ ] __ [ ]
[BNR-nieuwsradio] => [{ BNR-nieuwsradio / BNR nieuwsradio }] / [ ] __ [ ]
;;
;; BN-VL
[Darfour] => [{ Darfour / Darfur }] / [ ] __ [ ]
Expand Down Expand Up @@ -90,3 +87,14 @@ tewerk => te werk / [ ] __ [ ]
[marktonderzoekbureau] => [{ marktonderzoekbureau / marktonderzoeksbureau }] / [ ] __ [ ]
[Noordwestkust] => [{ Noordwestkust / Noord-Westkust }] / [ ] __ [ ]
[carnavalvierders] => [{ carnavalvierders / carnavalsvierders }] / [ ] __ [ ]

;; Whisper evaluation on N-Best
;; BN-NL
ie => hij / [ ] __ [ ]
da's => dat is / [ ] __ [ ]
[BNR-nieuwsradio] => [{ BNR-nieuwsradio / BNR nieuwsradio }] / [ ] __ [ ]
[Moszkowicz] => [{ Moszkowicz / Moskovic }] / [ ] __ [ ]
[Kooi] => [{ Kooi / Kooij }] / [ ] __ [ ]
[Araújo] => [{ Araújo / Araujo }] / [ ] __ [ ]
[Bagdad] => [{ Bagdad / Baghdad }] / [ ] __ [ ]
[Holleeder] => [{ Holleeder / Holleder }] / [ ] __ [ ]

0 comments on commit 54196eb

Please sign in to comment.