many improvements to the code to get it building from a dry run
[redirect-tools] / example / 01-extract_redirects_wrapper.sh
index e953c6182cf35878ba1bdc01266e5363c7d261c8..be882ca0bc5e3ce883edda05270c16f77295e4fc 100755 (executable)
@@ -9,4 +9,4 @@ INPUT_FILE=$(find ${DATA_DIR}/wp-enwiki-xml -name '*7z' | sed -n ${RUN}p)
 OUTPUT_FILE="${DATA_DIR}/wp-enwiki-redir/wp_edits_redir_${INDEX}.tsv.bz2"
 
 # print material out
-7za x -so "${INPUT_FILE}" | /usr/local/bin/python2.7 ${CUR_DIR}/extract_redirects.py | bzip2 -c - > ${OUTPUT_FILE}
+7za x -so "${INPUT_FILE}" | /usr/local/bin/python2.7 ${CUR_DIR}/01-extract_redirects.py | bzip2 -c - > ${OUTPUT_FILE}

Benjamin Mako Hill || Want to submit a patch?