forked from facebookarchive/NAMAS
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathprep_torch_data.sh
executable file
·33 lines (21 loc) · 1.33 KB
/
prep_torch_data.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
#!/bin/bash
#
# Prepare the Torch-format data used by the summarization scripts.
#
# Usage:
#   ABS=/path/to/repo prep_torch_data.sh DATA_DIR
#
# Arguments:
#   DATA_DIR  Directory holding the text inputs read below:
#             train.article.dict, train.title.dict,
#             train.article.txt, train.title.txt,
#             valid.article.filter.txt, valid.title.filter.txt.
#
# Environment:
#   ABS       Repository root; $ABS/summary must contain build_dict.lua and
#             build.lua. Required.
#   LUA_PATH  Optional; "$ABS/?.lua" is appended to it and exported.
#
# Output:
#   Everything is written under DATA_DIR/processed.
#
# Exit status:
#   2 on a usage error, non-zero as soon as any step fails, 0 otherwise.

# Abort on the first failing command or unset variable so that a failed
# dictionary build is not followed by misleading downstream errors.
set -euo pipefail

if [[ $# -lt 1 || -z "${1:-}" ]]; then
  printf 'Usage: ABS=/path/to/repo %s DATA_DIR\n' "${0##*/}" >&2
  exit 2
fi

# Without ABS, SCRIPTS would silently resolve to "/summary".
: "${ABS:?ABS must be set to the repository root (the directory containing summary/)}"

readonly WINDOW=5
readonly DATA_DIR=$1
readonly OUT_DIR="$DATA_DIR/processed"
readonly SCRIPTS="$ABS/summary"

# ${LUA_PATH:-} keeps the resulting value identical to the previous behaviour
# while staying safe under `set -u` when LUA_PATH is not set by the caller.
export LUA_PATH="${LUA_PATH:-};$ABS/?.lua"

#######################################
# Run build.lua for one data split, using the train dictionaries.
# Globals:   SCRIPTS, DATA_DIR, OUT_DIR, WINDOW (read)
# Arguments: $1 - split directory name under OUT_DIR (e.g. "train")
#            $2 - title input file name inside DATA_DIR
#            $3 - article input file name inside DATA_DIR
# Returns:   exit status of `th`
#######################################
build_matrices() {
  local split=$1
  local title_file=$2
  local article_file=$3

  th "$SCRIPTS/build.lua" \
    -inArticleDictionary "$OUT_DIR/train.article.dict.torch" \
    -inTitleDictionary "$OUT_DIR/train.title.dict.torch" \
    -inTitleFile "$DATA_DIR/$title_file" \
    -outTitleDirectory "$OUT_DIR/$split/title/" \
    -inArticleFile "$DATA_DIR/$article_file" \
    -outArticleDirectory "$OUT_DIR/$split/article/" \
    -window "$WINDOW"
}

mkdir -p -- "$OUT_DIR"

# Run build_dict.lua once per text dictionary (-inf input, -outf output).
th "$SCRIPTS/build_dict.lua" \
  -inf "$DATA_DIR/train.article.dict" \
  -outf "$OUT_DIR/train.article.dict.torch"
th "$SCRIPTS/build_dict.lua" \
  -inf "$DATA_DIR/train.title.dict" \
  -outf "$OUT_DIR/train.title.dict.torch"

echo "-- Creating data directories."
mkdir -p -- \
  "$OUT_DIR/train/title" \
  "$OUT_DIR/train/article" \
  "$OUT_DIR/valid.filter/title" \
  "$OUT_DIR/valid.filter/article"

# Place a copy of each dictionary next to the training output as "dict".
cp -- "$OUT_DIR/train.title.dict.torch" "$OUT_DIR/train/title/dict"
cp -- "$OUT_DIR/train.article.dict.torch" "$OUT_DIR/train/article/dict"

echo "-- Build the matrices"
# Share the dictionary: both splits are built against the train dictionaries.
build_matrices valid.filter valid.title.filter.txt valid.article.filter.txt
build_matrices train train.title.txt train.article.txt