Commit 24f10e5f140af81440f88d2f89ca084ee72e5958

Authored by Cristina Muntean
1 parent d08f9507

changes to scripts to sync with params and formatting

scripts/aggregate-wc-with-edge.sh
... ... @@ -9,6 +9,7 @@ OPTION="blacklist"
9 9 OUTPUT_DIR=/data/muntean/edge-features-10-cities-november #all-vs-chicago-blacklist.tsv
10 10 FILENAME=$2
11 11 OUTPUT_NAME=`basename $FILENAME | cut -d'.' -f1` #takes the name of the city and aggregate type e.g. "seattle_3of3"
  12 +MIN_FREQ=1
12 13  
13   -echo $COMMAND --o $OPTION --c $CITY --out $OUTPUT_DIR/all-without-$OUTPUT_NAME-blacklist.tsv $FILENAME
14   -$COMMAND --o $OPTION --c $CITY --out $OUTPUT_DIR/all-without-$OUTPUT_NAME-blacklist.tsv $FILENAME
  14 +echo $COMMAND --o $OPTION --c $CITY --minfreq $MIN_FREQ --out $OUTPUT_DIR/all-without-$OUTPUT_NAME-blacklist.tsv $FILENAME
  15 +$COMMAND --o $OPTION --c $CITY --minfreq $MIN_FREQ --out $OUTPUT_DIR/all-without-$OUTPUT_NAME-blacklist.tsv $FILENAME
... ...
scripts/sort-on-feat-aggregates.sh
... ... @@ -23,8 +23,8 @@ COLUMN=4
23 23 for LINE in `ls $INPUT_DIR/*`
24 24 do
25 25 #echo $LINE
26   - OUTPUT_NAME=`basename $LINE | cut -d'.' -f1`
27   - #echo $OUTPUT_NAME
28   - sort -t$'\t' -n -r -k$COLUMN $LINE > $INPUT_DIR/${OUTPUT_NAME}-sorted-col-${COLUMN}.tsv
  26 + OUTPUT_NAME=`basename $LINE | cut -d'.' -f1`
  27 + #echo $OUTPUT_NAME
  28 + sort -t$'\t' -n -r -k$COLUMN $LINE > $INPUT_DIR/${OUTPUT_NAME}-sorted-col-${COLUMN}.tsv
29 29 done
30 30 exit 0
... ...
scripts/sort-on-feat.sh
... ... @@ -20,11 +20,11 @@ CORES=16
20 20 INPUT_DIR=/data/muntean/edge-features-10-cities-november
21 21 COLUMN=4
22 22  
23   -for LINE in `ls $INPUT_DIR/*`
  23 +for LINE in `ls $INPUT_DIR/all-without-boston_20151101*`
24 24 do
25 25 #echo $LINE
26   - OUTPUT_NAME=`basename $LINE | cut -d'.' -f1`
27   - #echo $OUTPUT_NAME
28   - sort -t$'\t' -n -r -k$COLUMN $LINE > $INPUT_DIR/${OUTPUT_NAME}-sorted-col-${COLUMN}.tsv
  26 + OUTPUT_NAME=`basename $LINE | cut -d'.' -f1`
  27 + #echo $OUTPUT_NAME
  28 + sort -t$'\t' -n -r -k$COLUMN $LINE > $INPUT_DIR/${OUTPUT_NAME}-sorted-col-${COLUMN}.tsv
29 29 done
30 30 exit 0
... ...