# Print every molecule_idref attribute value found in xmlfile, one per line.
#   -n  iterate over the input line by line without auto-printing
#   -l  chomp each input line and terminate each print with a newline
# The pattern captures the run of non-quote characters that follows
# molecule_idref=" ; the /g match in a while loop visits each occurrence
# on the current line in turn.
perl -lne 'print $1 while /molecule_idref="([^"]+)/g' xmlfile