#!/bin/bash
#
# Rebuild the blather language files from the commands file.
#
# Steps:
#   1. Reduce ~/.config/blather/commands to a corpus: blank lines and lines
#      starting with '#' are dropped, and on every remaining line everything
#      from the first ':' to the end of the line is removed. The result is
#      written to ~/.config/blather/sentences.corpus.
#   2. Upload the corpus to the lmtool URL below and extract the base URL of
#      the generated files from the response.
#   3. Download <base>.dic and <base>.lm and install them as
#      ~/.config/blather/language/dic and ~/.config/blather/language/lm.
#
# Requires: curl, grep, sed, mktemp.
# Exit status: 0 on success, non-zero (with a message on stderr) otherwise.

set -euo pipefail

# Print a message to stderr and abort.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

blatherdir=~/.config/blather
sentences=$blatherdir/sentences.corpus
sourcefile=$blatherdir/commands
langdir=$blatherdir/language
lmtoolurl=http://www.speech.cs.cmu.edu/cgi-bin/tools/lmtool/run

[[ -d "$blatherdir" ]] || die "missing directory: $blatherdir"
[[ -r "$sourcefile" ]] || die "cannot read commands file: $sourcefile"
mkdir -p -- "$langdir" || die "cannot create $langdir"

# Downloads land in a private scratch directory first, so a failed or partial
# transfer never replaces the installed files and stray *.dic / *.lm files
# from earlier runs cannot be picked up by accident. It lives under
# $blatherdir so the final mv stays on the same filesystem.
workdir=$(mktemp -d "$blatherdir/lmupdate.XXXXXX") || die "mktemp failed"
trap 'rm -rf -- "$workdir"' EXIT

# Build the corpus: keep only the text before the first ':' of each
# non-blank, non-comment line.
sed -e '/^$/d' -e '/^#/d' -e 's/:.*$//' "$sourcefile" > "$sentences" \
  || die "cannot write corpus file: $sentences"

# Upload the corpus file and find the resulting dictionary file URL.
# From the response, take the line containing "base name" plus the line after
# it, keep the one(s) mentioning http, then strip everything up to the last
# '="', everything from '.tgz' onward, and the first literal 'TAR'.
# With pipefail, a failed upload or a response without a match ends up here.
base_url=$(
  curl -f -L -F corpus=@"$sentences" -F formtype=simple "$lmtoolurl" \
    | grep -A 1 'base name' \
    | grep http \
    | sed -e 's/^.*="//' -e 's/\.tgz.*$//' -e 's/TAR//'
) || die "upload failed or no result URL found in the response from $lmtoolurl"

# Only one base URL is expected; ignore anything after the first line.
base_url=${base_url%%$'\n'*}
[[ -n "$base_url" ]] || die "empty result URL in the response from $lmtoolurl"

# Download the .dic and .lm files. -f makes curl fail on an HTTP error
# instead of saving the error page as if it were the requested file.
curl -f -o "$workdir/dic" "${base_url}.dic" \
  || die "failed to download ${base_url}.dic"
curl -f -o "$workdir/lm" "${base_url}.lm" \
  || die "failed to download ${base_url}.lm"

# Move them to the right name/place.
mv -- "$workdir/dic" "$langdir/dic"
mv -- "$workdir/lm" "$langdir/lm"