about | summary | refs | log | tree | commit | diff | stats
path: root/get_embeddings.sh
diff options
context:
space:
mode:
Diffstat (limited to 'get_embeddings.sh')
-rwxr-xr-x get_embeddings.sh 10
1 files changed, 5 insertions, 5 deletions
diff --git a/get_embeddings.sh b/get_embeddings.sh
index dde7839..aba2078 100755
--- a/get_embeddings.sh
+++ b/get_embeddings.sh
@@ -37,10 +37,10 @@ wget -nc -q https://dl.fbaipublicfiles.com/fasttext/vectors-crawl/cc.sl.300.vec.
 
 echo "Extracting embeddings"
 
-for LANG in sq bg el it ro sl; do
-  gunzip "${EMBS}/cc.${LANG}.300.vec.gz"
-  mv "${EMBS}/cc.${LANG}.300.vec.gz" "${EMBS}/${LANG}.1M.vec"
+for lang_code in sq bg el it ro sl; do
+  gunzip "${EMBS}/cc.${lang_code}.300.vec.gz"
+  mv "${EMBS}/cc.${lang_code}.300.vec" "${EMBS}/${lang_code}.1M.vec"
 done
 
-unzip -ofq "${EMBS}/crawl-300d-2M.vec.zip" -d "${EMBS}"
-mv "${EMBS}/crawl-300d-2M.vec" "${EMBS}/en.vec"
+unzip -q "${EMBS}/crawl-300d-2M.vec.zip" -d "${EMBS}"
+mv "${EMBS}/crawl-300d-2M.vec" "${EMBS}/en.1M.vec"