diff options
author | Nick White <git@njw.me.uk> | 2013-05-26 21:52:41 +0100 |
---|---|---|
committer | Nick White <git@njw.me.uk> | 2013-05-26 21:52:41 +0100 |
commit | 5d0c5974e2655a6f66153bffb67c9346c2c4a589 (patch) | |
tree | 5f0f2d773dda4bb5f7078c0971cc92cf5c46000d /Makefile | |
parent | b0055fe870a04fbd8eaef669c1ccfb0febfe8bc3 (diff) | |
download | oed2dict-5d0c5974e2655a6f66153bffb67c9346c2c4a589.tar.bz2 oed2dict-5d0c5974e2655a6f66153bffb67c9346c2c4a589.zip |
Correct e tag removal, correct headword separation
Diffstat (limited to 'Makefile')
-rw-r--r-- | Makefile | 5 |
1 files changed, 3 insertions, 2 deletions
@@ -11,9 +11,10 @@ all: oed.jargon oed.dict.dz
 
 .htm.jargon:
 	iconv -f ISO-8859-1 -t UTF-8 < "$<" \
+	| sed 's/\r//g' \
 	| awk -f htmtojargon.awk \
-	| sed -f separateheadmeta.sed \
 	| sed -f symbols.sed \
+	| perl -p removeetags.pl \
 	| sed -f xmlcleanup.sed \
 	| sed -f xmlcleanup2.sed \
 	> "$@"
@@ -28,7 +29,7 @@ oed.dict: oed.jargon
 	cat $< \
 	| dictfmt -j --utf8 \
 	--columns 0 --headword-separator ',' \
-	--index-data-separator ';' \
+	--index-data-separator " " \
 	-u http://njw.me.uk/oed \
 	-s "Oxford English Dictionary, 2nd Edition" \
 	oed