#!/bin/bash
#
# Convert every Word document matching tmp/*.docx into hard-wrapped Markdown,
# written to nostarch/<name>.md so it can be compared with the existing files.
#
# Usage: run from the directory that contains tmp/, tools/ and nostarch/.
# Requires: unzip, xsltproc, fold, sed.

# pipefail: without it a failing xsltproc would be hidden by sed's exit
# status and a truncated .md file would be left behind with exit code 0.
set -euo pipefail

#######################################
# Convert a single .docx file to Markdown.
# Arguments: $1 - path to the .docx file (expected to be tmp/<name>.docx)
# Outputs:   extracts the archive into tmp/<name>/ and writes
#            nostarch/<name>.md
# Returns:   non-zero if extraction or any stage of the conversion fails
#######################################
convert_docx() {
  local docx=$1
  local filename

  # Strip the directory and the .docx suffix so the bare name can be reused
  # for both the extraction directory and the output file.
  filename=${docx##*/}
  filename=${filename%.docx}

  # Make a directory to put the XML in.
  mkdir -p "tmp/$filename"

  # Unzip the docx to get at the XML (-o: overwrite earlier extractions
  # without prompting).
  unzip -o "tmp/$filename.docx" -d "tmp/$filename"

  # Convert to Markdown with XSL, hard wrap at 80 chars at word boundaries,
  # then remove trailing whitespace and save in the nostarch dir for
  # comparison.
  xsltproc tools/docx-to-md.xsl "tmp/$filename/word/document.xml" \
    | fold -w 80 -s \
    | sed -e 's/ *$//' > "nostarch/$filename.md"
}

#######################################
# Convert all the docx files in the tmp dir.
# Arguments: none
# Returns:   0 when every file converted (or when there were none)
#######################################
main() {
  local docx

  # Glob directly instead of parsing `ls` through xargs, which word-splits
  # names and interprets quotes/backslashes in them.
  for docx in tmp/*.docx; do
    # An unmatched glob stays as the literal pattern; skip it.
    [[ -e "$docx" ]] || continue
    convert_docx "$docx"
  done
}

main "$@"