summary | refs | log | tree | commit | diff
path: root/xmlcleanup2.sed
diff options
context:
space:
mode:
author Nick White <git@njw.me.uk> 2013-05-26 21:52:41 +0100
committer Nick White <git@njw.me.uk> 2013-05-26 21:52:41 +0100
commit 5d0c5974e2655a6f66153bffb67c9346c2c4a589 (patch)
tree 5f0f2d773dda4bb5f7078c0971cc92cf5c46000d /xmlcleanup2.sed
parent b0055fe870a04fbd8eaef669c1ccfb0febfe8bc3 (diff)
download oed2dict-5d0c5974e2655a6f66153bffb67c9346c2c4a589.tar.bz2
oed2dict-5d0c5974e2655a6f66153bffb67c9346c2c4a589.zip
Correct e tag removal, correct headword separation
Diffstat (limited to 'xmlcleanup2.sed')
-rw-r--r-- xmlcleanup2.sed 6
1 file changed, 0 insertions, 6 deletions
diff --git a/xmlcleanup2.sed b/xmlcleanup2.sed
index 5352a92..56e66b0 100644
--- a/xmlcleanup2.sed
+++ b/xmlcleanup2.sed
@@ -1,12 +1,6 @@
#!/bin/sed -f
# sed rules that must run after the main set
-# <e> tags seem to duplicate <v> tags for some quotes
-# NOTE this assumes e tags only come at end of lines
-s/<e>.*$//g
-# TODO: make this work instead of the above
-#s/<e>.*?<\/e>//g
-
# any xml tags not processed can just go away
s/<[^>]*>//g
# any xml character entities not processed can just go away