summaryrefslogtreecommitdiff
path: root/rc/bin/doc2txt
blob: f01147ebc06fffb7de8028bc1c53b12e8b606261 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
#!/bin/rc
# doc2txt: write the text of a Microsoft Word document to standard output.
#
# usage: doc2txt [file.doc]
#
# With no argument the document is read from standard input and spooled
# into /tmp first, because aux/olefs is given a file name to work on.
# Exit status: 'usage' for a bad argument count, 'word' when aux/olefs
# fails, 'worddoc' when the mounted tree has no WordDocument file.

# Work in a private copy of the environment and name space, so the
# variables, function and mount set up below stay local to this script.
rfork en

# Spool file used only when reading standard input.
tmp=/tmp/doc2txt.$pid

# bail message status
# Print message on standard error, remove the spool file and exit with
# the given status.  rm -f keeps quiet when no spool file was created.
fn bail {
	echo $1 >[1=2]
	rm -f $tmp
	exit $2
}

if(! ~ $#* 0 1) {
	echo 'usage: doc2txt [file.doc]' >[1=2]
	exit usage
}

# Pick the input: the named file, or a spooled copy of standard input.
if(~ $#* 1)
	file=$1
if not {
	cat >$tmp
	file=$tmp
}

aux/olefs $file || bail 'doc2txt: couldn''t mount word document' word

# The file tested here is the one fed to aux/mswordstrings below; without
# it the input is reported as some other kind of msoffice document.
test -f /mnt/doc/WordDocument || bail 'doc2txt: is an msoffice doc but not a word document' worddoc

# Pull the strings out, convert them from the microsoft character set to
# utf, fill the lines, and collapse adjacent duplicate lines.
aux/mswordstrings /mnt/doc/WordDocument | tcs -f microsoft -t utf | fmt | uniq

unmount /mnt/doc
rm -f $tmp