summary refs log tree commit diff
path: root/Makefile
diff options
context:
space:
mode:
author Nick White <git@njw.me.uk> 2013-05-26 21:52:41 +0100
committer Nick White <git@njw.me.uk> 2013-05-26 21:52:41 +0100
commit 5d0c5974e2655a6f66153bffb67c9346c2c4a589 (patch)
tree 5f0f2d773dda4bb5f7078c0971cc92cf5c46000d /Makefile
parent b0055fe870a04fbd8eaef669c1ccfb0febfe8bc3 (diff)
download oed2dict-5d0c5974e2655a6f66153bffb67c9346c2c4a589.tar.bz2
oed2dict-5d0c5974e2655a6f66153bffb67c9346c2c4a589.zip
Correct e tag removal, correct headword separation
Diffstat (limited to 'Makefile')
-rw-r--r-- Makefile 5
1 files changed, 3 insertions, 2 deletions
diff --git a/Makefile b/Makefile
index 10c4fb3..cfb4484 100644
--- a/Makefile
+++ b/Makefile
@@ -11,9 +11,10 @@ all: oed.jargon oed.dict.dz
.htm.jargon:
iconv -f ISO-8859-1 -t UTF-8 < "$<" \
+ | sed 's/\r//g' \
| awk -f htmtojargon.awk \
- | sed -f separateheadmeta.sed \
| sed -f symbols.sed \
+ | perl -p removeetags.pl \
| sed -f xmlcleanup.sed \
| sed -f xmlcleanup2.sed \
> "$@"
@@ -28,7 +29,7 @@ oed.dict: oed.jargon
cat $< \
| dictfmt -j --utf8 \
--columns 0 --headword-separator ',' \
- --index-data-separator ';' \
+ --index-data-separator " " \
-u http://njw.me.uk/oed \
-s "Oxford English Dictionary, 2nd Edition" \
oed