Category: | Web Stuff |
Author/Contact Info | Briac 'Oeufmayo' Pilpré |
Description: | The python guys (they can't be all bad, after all :) have created a DTD called XML Bookmark Exchange Language which "is a rich interchange
format for "bookmark" data as used by most Internet browsers."
As I wanted to play with the XML::Writer module and clean up my bookmark files, I ended up whipping up this code. Have fun!
Update 2001-11-13: Complete rewrite of the adr2xbel script. It follows a bit more closely the python script found in the PyXML library demos. |
#!/usr/bin/perl -w
use strict;
use XML::Writer;
# Small utility to parse Opera bookmark files.
# Originally written in Python by Lars Marius Garshol
# perl version - Briac Pilpré
my $version = <>;
die "Doesn't seem to be a Opera Hotlist\n" if $version !~ /^Opera/;
chomp( $version );
my $xml = new XML::Writer(DATA_MODE=>1, DATA_INDENT=>1);
$xml->xmlDecl();
$xml->doctype(
'xbel',
'+//IDN python.org//DTD XML Bookmark Exchange Language 1.0//EN/
+/XML',
'xbel.dtd');
$xml->startTag('xbel');
$xml->dataElement('desc', $version);
while (<>){
next unless /\S/;
chomp;
if ( $_ eq '#FOLDER' || $_ eq '#URL' ){
my $node = $_;
my $line;
{
local $/ = ""; # Paragraph mode
$line = <>;
}
if ($node eq '#FOLDER'){
my $name = $1 if $line =~ /NAME=(.*)/;
my $created = $1 if $line =~ /CREATED=(.*)/;
$xml->startTag('folder');
$xml->dataElement('title', $name);
}
elsif ($node eq '#URL') {
my $name = $1 if $line =~ /NAME=(.*)/;
my $created = $1 if $line =~ /CREATED=(.*)/;
my $order = $1 if $line =~ /ORDER=(.*)/;
my $visited = $1 if $line =~ /VISITED=(.*)/;
my $url = $1 if $line =~ /URL=(.*)/;
$xml->startTag('bookmark', href => $url,
added => $created, visited => $visited);
$xml->dataElement('title', $name);
$xml->endTag('bookmark');
}
}
elsif ( $_ eq '-'){
$xml->endTag('folder');
}
}
$xml->endTag('xbel');
Bonus: Added Bonus the xbel2adr script! __END__
#!/usr/bin/perl -w
use strict;
use XML::Parser;
die "usage: $0 opera.xbel\n" if !$ARGV[0];
my $parser = new XML::Parser(Handlers => {
Start=>\&start, End=>\&end, Char=>\&char,
});
my%equiv=(title=>'NAME', desc=>'DESCRIPTION');
my $flag = '';
$parser->parsefile($ARGV[0]);
sub char {
my ($p, $txt) = @_; return if $txt =~ /^\s*$/;
chomp($txt);
print $txt . "\n" if exists($equiv{$flag});
}
sub start {
my ($p, $e, %a) = @_; $flag = $e;
if ($e eq 'folder'){ print "\n#FOLDER\n" }
elsif ($e eq 'bookmark'){print "\n#URL\n\tURL=" . $a{'href'} if $a
+{'href'}}
else {print "\n\t" . $equiv{$e} . "=" if exists $equiv{$e} }
}
sub end {undef $flag}
Previous version: __END__ #!/usr/bin/perl -w # # adr2xbel : Convert Opera Bookmarks file to xbel # (XML Bookmark Exchange Language) # OeufMayo - 23 apr 2001 use strict; use XML::Writer; use IO; die "usage: $0 opera.adr\n" if !$ARGV[0]; my $output = new IO::File("> $ARGV[0].xbel.xml") or die $!; my $writer = new XML::Writer(OUTPUT => $output, DATA_MODE => 1, DATA_INDENT => 4) or die $!; $writer->xmlDecl('iso-8859-1', 'no'); $writer->doctype( 'xbel', undef, 'http://www.python.org/topics/xml/dtds/xbel-1.0.dtd'); $writer->startTag('xbel'); $writer->dataElement('title', 'Opera Hotlist version 2.0'); $/ = ""; while (<>){ chomp; my @chunk = split(/\n\t/, $_); while ($chunk[0] =~ s/^(-\n)//){ # Folder end $writer->endTag('folder') if $chunk[0]; } if ($chunk[0] =~ /^#FOLDER/){ # Folder beginning shift @chunk; my %attrs = &getAttlist(@chunk); $writer->startTag("folder"); for ('title', 'desc'){ $writer->dataElement($_, $attrs{$_}); } } elsif ($chunk[0] =~ /^#URL/){ # URL Tag shift @chunk; my %attrs = &getAttlist(@chunk); $writer->startTag("bookmark", 'href' => $attrs{href} ); for ('title', 'desc'){ $writer->dataElement($_, $attrs{$_}); } $writer->endTag("bookmark"); } } $writer->endTag('xbel'); $writer->end; ######################### sub getAttlist { my %attrs; my %tr = ( URL=>'href', DESCRIPTION=>'desc', NAME=>'title', ); foreach $_ (@_){ m/^([^=]+)=(.*)$/; my ($key, $value) = ($1, $2); next unless ( $key eq 'URL' || $key eq 'DESCRIPTION' || $key eq 'NAME' ); $key = $tr{$key}; $attrs{$key} = $value; } return %attrs; } |
|
---|
Replies are listed 'Best First'. | |
---|---|
Re: Opera Bookmarks to XBEL
by Anonymous Monk on Apr 25, 2003 at 16:53 UTC | |
by Anonymous Monk on May 26, 2004 at 11:53 UTC |
Back to
Code Catacombs