#!/bin/sed -f
# Post-processing sed rules: these must run after the main rule set.
# The shebang stays alone on the first line so that sed is handed only
# the -f option and the path of this script.

# <e> elements appear to duplicate other tagged text for some quotes, so
# drop everything from the first <e> to the end of the line.
# NOTE: this assumes <e> elements only occur at the end of a line; any text
# that follows a closing </e> on the same line is removed as well.
# No g flag is needed: the match is anchored at end of line, so it can
# happen at most once per line.
s/<e>.*$//

# TODO: remove just the element instead of the rest of the line.  The naive
# form below does not work: sed regular expressions have no non-greedy
# quantifier, so ".*?" is not a lazy match.
#s/<e>.*?<\/e>//g

# Any XML tags not processed by now can just go away.
s/<[^>]*>//g

# Any XML entity references (&name; &#NNN; &#xHH;) not processed by now can
# just go away.  Only entity-name characters are accepted between "&" and
# ";" so that a bare "&" in running text does not swallow everything up to
# the next ";".
s/&[#[:alnum:]_.:-]*;//g