summaryrefslogtreecommitdiffstats
path: root/src/doc/book/tools/doc-to-md.sh
blob: 8c802a71fa52f5817ded67914310b7ee00e78fdf (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
#!/bin/bash
#
# Convert every `tmp/<name>.docx` into `nostarch/<name>.md`.
#
# For each document this script:
#   1. resets `nostarch/<name>.md` to the "do not edit" warning,
#   2. unzips the docx into `tmp/<name>/`,
#   3. runs the extracted `word/document.xml` through `tools/docx-to-md.xsl`,
#   4. hard-wraps the result at 80 columns, strips trailing spaces and appends
#      it to `nostarch/<name>.md`.
#
# All paths are relative, so run it from the directory that contains `tmp/`,
# `nostarch/` and `tools/`. Needs `unzip`, `xsltproc`, `fold` and `sed`.

# pipefail matters here: without it a failing `xsltproc` is hidden by the exit
# status of the final `sed`, and the script would carry on (and exit 0) with a
# markdown file that contains nothing but the warning header.
set -euo pipefail

# Let the glob below expand to nothing when there are no docx files, so the
# loop simply does not run instead of seeing the literal pattern.
shopt -s nullglob

# Only docx files directly inside `tmp` are considered: everything below reads
# `tmp/<name>.docx`, and the extracted `tmp/<name>/` trees from earlier runs
# must not be searched for further documents.
for docx in tmp/*.docx; do
    # Extract just the filename (no directory, no extension) so we can reuse
    # it easily.
    filename=${docx##*/}
    filename=${filename%.docx}

    # Truncate the `nostarch` dir file and put the "no editing" warning back.
    # The quoted delimiter keeps the backticks around `/src/` literal.
    cat <<'EOF' > "nostarch/$filename.md"
<!-- DO NOT EDIT THIS FILE.

This file is periodically generated from the content in the `/src/`
directory, so all fixes need to be made in `/src/`.
-->
EOF

    # Make a directory to put the XML in.
    mkdir -p "tmp/$filename"
    # Unzip the docx to get at the XML (-o: overwrite files from earlier runs
    # without prompting).
    unzip -o "tmp/$filename.docx" -d "tmp/$filename"

    # Convert to markdown with XSL.
    xsltproc tools/docx-to-md.xsl "tmp/$filename/word/document.xml" |
        # Hard wrap at 80 chars at word boundaries.
        fold -w 80 -s |
        # Remove trailing whitespace and append to the file in the `nostarch`
        # dir for comparison.
        sed -e 's/ *$//' >> "nostarch/$filename.md"
done