1234567891011121314151617181920212223242526272829303132 |
- #!/bin/bash
-
- blatherdir=~/.config/kaylee
- blatherdatadir=~/.local/share/kaylee
- blathercachedir=~/.cache/kaylee
- sentences=$blatherdatadir/sentences.corpus
- sourcefile=$blatherdir/commands.conf
- tempfile=$blathercachedir/url.txt
- lmtoolurl=http://www.speech.cs.cmu.edu/cgi-bin/tools/lmtool/run
-
- cd $blatherdir
-
- sed -f - $sourcefile > $sentences <<EOFcommands
- /^$/d
- /^#/d
- s/\:.*$//
- EOFcommands
-
- # upload corpus file, find the resulting dictionary file url
- curl -L -F corpus=@"$sentences" -F formtype=simple $lmtoolurl \
- |grep -A 1 "base name" |grep http \
- | sed -e 's/^.*\="//' | sed -e 's/\.tgz.*$//' | sed -e 's/TAR//' > $tempfile
-
- # download the .dic and .lm files
- curl -C - -O $(cat $tempfile).dic
- curl -C - -O $(cat $tempfile).lm
-
- # mv em to the right name/place
- mv *.dic $blatherdatadir/dic
- mv *.lm $blatherdatadir/lm
-
- rm $tempfile
|