blob: 211793e89f1f26bde5a68f29db56697454d5c799 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
|
#!/bin/bash
#
# Rebuild the blather language files from the sentence corpus.
#
# Uploads ~/.config/blather/sentences.corpus to the lmtool web form, scrapes
# the base URL of the generated files out of the response, downloads the
# matching .dic and .lm files, and installs them as
# ~/.config/blather/language/dic and ~/.config/blather/language/lm.
#
# Requires: curl, grep, sed, mktemp.
# Exit status: 0 on success, non-zero (with a message on stderr) on failure.

set -euo pipefail

blatherdir=~/.config/blather
sourcefile=$blatherdir/sentences.corpus
langdir=$blatherdir/language
lmtoolurl=http://www.speech.cs.cmu.edu/cgi-bin/tools/lmtool/run

# Print a message to stderr and abort.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

[[ -r "$sourcefile" ]] || die "corpus file not readable: $sourcefile"
mkdir -p -- "$langdir" || die "cannot create $langdir"

# Upload the corpus file and find the resulting dictionary file url.
# NOTE(review): the scrape assumes the response contains a "base name" line
# followed by a line holding an http link to a TAR-prefixed .tgz archive;
# confirm against the live service if this step starts failing.
# -f makes curl fail on HTTP errors instead of handing an error page to grep;
# pipefail makes a failed upload or an unmatched grep abort here.
baseurl=$(
  curl -f -L -F corpus=@"$sourcefile" -F formtype=simple "$lmtoolurl" \
    | grep -A 1 "base name" \
    | grep http \
    | sed -e 's/^.*="//' -e 's/\.tgz.*$//' -e 's/TAR//'
) || die "could not obtain the result URL from $lmtoolurl"

# Keep only the first match so a multi-line result cannot turn into several
# curl arguments.
baseurl=${baseurl%%$'\n'*}
[[ "$baseurl" == http* ]] || die "unexpected result URL: '$baseurl'"

# Download into a private scratch directory so stale *.dic / *.lm files from
# earlier runs can never be picked up, and so an interrupted download does not
# clobber the currently installed files. The trap removes it on any exit path.
workdir=$(mktemp -d "$blatherdir/lmtool.XXXXXX") || die "mktemp failed"
trap 'rm -rf -- "$workdir"' EXIT

# Download the .dic and .lm files.
curl -f -o "$workdir/dic" "${baseurl}.dic" || die "download failed: ${baseurl}.dic"
curl -f -o "$workdir/lm" "${baseurl}.lm" || die "download failed: ${baseurl}.lm"

# Move them to the right name/place only after both downloads succeeded.
mv -- "$workdir/dic" "$langdir/dic"
mv -- "$workdir/lm" "$langdir/lm"
|