diff options
-rwxr-xr-x | get_embeddings.sh | 2 |
1 file changed, 1 insertion, 1 deletion
diff --git a/get_embeddings.sh b/get_embeddings.sh
index be354a6..b53d493 100755
--- a/get_embeddings.sh
+++ b/get_embeddings.sh
@@ -49,5 +49,5 @@ rm -f "${EMBS}/crawl-300d-2M.vec.zip" | |||
49 | # truncate to top 500k tokens for efficiency | 49 | # truncate to top 500k tokens for efficiency |
50 | for lang_code in bg en el it ro sl sq; do | 50 | for lang_code in bg en el it ro sl sq; do |
51 | sed -in '1,500001!d' "${EMBS}/${lang_code}.vec" | 51 | sed -in '1,500001!d' "${EMBS}/${lang_code}.vec" |
52 | sed -in '1 s/^.*$/500000 300/' "${EMBS}/${lang_code}.vec" | 52 | sed -i '1 s/^.*$/500000 300/' "${EMBS}/${lang_code}.vec" |
53 | done | 53 | done |