unoffice

Reclaim text from office documents
git clone https://logand.com/git/unoffice.git/
Log | Files | Refs | README

commit 192ff85d55f9006475cdacdbebd1a7e2cfd683a9
parent 81f916b9299dd8434e765fc230d0e177cae72bdd
Author: Tomas Hlavaty <tom@logand.com>
Date:   Tue,  2 Jul 2019 07:53:46 +0200

added unabw

Diffstat:
A unabw | 10 ++++++++++
1 file changed, 10 insertions(+), 0 deletions(-)

diff --git a/unabw b/unabw
@@ -0,0 +1,10 @@
+#!/usr/bin/env bash
+set -euo pipefail
+sed 's/<p[^<\/]*>/\n/g' "$1" \
+  | sed 's/<[^<]*>//g' \
+  | sed 's/&lt;/</g' \
+  | sed 's/&gt;/>/g' \
+  | sed "s/&apos;/'/g" \
+  | sed 's/&quot;/"/g' \
+  | sed 's/&amp;/&/g' \
+  | cat -s