What about using an FSA-based parser?
#!/usr/bin/perl
use strict;
use warnings;
use Text::Diff;
BEGIN {
    # Default number of spaces added per nesting level.  The enclosing block
    # is a BEGIN block so that this value is already assigned no matter
    # where in the file indenter() is first called from.
    my $INDENT_STEP = 4;

    # indenter($expr [, $step])
    #
    # Pretty-prints a parenthesised prefix-notation filter expression such as
    # "(&(a=1)(!(b=2)))", putting every token on its own line.
    #
    # Parameters:
    #   $expr - the expression text; undef is treated as an empty string.
    #   $step - optional number of spaces per nesting level
    #           (defaults to $INDENT_STEP).
    #
    # Returns the formatted text; every emitted token is followed by "\n".
    #
    # Three kinds of token are recognised, each optionally preceded by
    # whitespace:
    #   "(&", "(|", "(!"  - opens a combinator; following tokens are indented
    #                       one level deeper
    #   "(name=value)"    - a single test, printed at the current level
    #   ")"               - closes a combinator; printed one level shallower
    #
    # Scanning stops at the first position where none of these match, and
    # whatever follows that position is not included in the result.
    sub indenter {
        my ($expr, $step) = @_;

        return '' unless defined $expr;
        $step = $INDENT_STEP unless defined $step;

        my $indent = 0;
        my $result = '';

        # Always start scanning at the beginning of the string.
        pos($expr) = undef;

        while (1) {
            # \G with /g resumes where the previous match ended; /c keeps
            # pos() unchanged on a failed match so that the next alternative
            # is tried at the very same offset.
            if ($expr =~ m{\G \s* ( \( [&|!] )}smxcg) {
                # Combinator: print it, then indent what follows.
                my $token = $1;
                $result .= (' ' x $indent) . "$token\n";
                $indent += $step;
            }
            elsif ($expr =~ m{\G \s* ( \( [^)=]+ = [^)]+ \) )}smxcg) {
                # Test: print it at the current level.
                my $token = $1;
                $result .= (' ' x $indent) . "$token\n";
            }
            elsif ($expr =~ m{\G \s* ( \) )}smxcg) {
                # End of combinator: decrease the indent, then print.
                my $token = $1;
                $indent -= $step;

                # An unbalanced ")" must not push the indent below zero: a
                # negative repeat count warns and would mis-indent every
                # token that follows.
                $indent = 0 if $indent < 0;
                $result .= (' ' x $indent) . "$token\n";
            }
            else {
                last;
            }
        }

        return $result;
    }
}
# Self-test: format a sample filter with indenter() and compare the result
# against the expected layout.
#
# The input is assembled from short pieces so that no line-wrap markers or
# newlines end up inside the expression itself.
my $expr = join q{},
    q{(&(&(&(& (mailnickname=*) (| },
    q{(&(objectCategory=person)(objectClass=user)},
    q{(!(homeMDB=*))(!(msExchHomeServerName=*)))},
    q{(&(objectCategory=person)(objectClass=user)},
    q{(|(homeMDB=*)(msExchHomeServerName=*)))},
    q{(&(objectCategory=person)(objectClass=contact))},
    q{(objectCategory=group)(objectCategory=publicFolder)},
    q{(objectCategory=msExchDynamicDistributionList) )))},
    q{(objectCategory=contact)(proxyAddresses=smtp:*example.com)))};

# Expected output: one token per line, four spaces per nesting level.  The
# leading whitespace is significant because the comparison below is exact.
my $expected=<<'END_EXPECTED';
(&
    (&
        (&
            (&
                (mailnickname=*)
                (|
                    (&
                        (objectCategory=person)
                        (objectClass=user)
                        (!
                            (homeMDB=*)
                        )
                        (!
                            (msExchHomeServerName=*)
                        )
                    )
                    (&
                        (objectCategory=person)
                        (objectClass=user)
                        (|
                            (homeMDB=*)
                            (msExchHomeServerName=*)
                        )
                    )
                    (&
                        (objectCategory=person)
                        (objectClass=contact)
                    )
                    (objectCategory=group)
                    (objectCategory=publicFolder)
                    (objectCategory=msExchDynamicDistributionList)
                )
            )
        )
        (objectCategory=contact)
        (proxyAddresses=smtp:*example.com)
    )
)
END_EXPECTED

my $ret = indenter($expr);
print "ok\n" if $ret eq $expected;

# Print a unified diff of actual vs. expected output.
print diff \$ret, \$expected, {
    STYLE => 'Unified',
};
-
Are you posting in the right place? Check out Where do I post X? to know for sure.
-
Posts may use any of the Perl Monks Approved HTML tags. Currently these include the following:
<code> <a> <b> <big>
<blockquote> <br /> <dd>
<dl> <dt> <em> <font>
<h1> <h2> <h3> <h4>
<h5> <h6> <hr /> <i>
<li> <nbsp> <ol> <p>
<small> <strike> <strong>
<sub> <sup> <table>
<td> <th> <tr> <tt>
<u> <ul>
-
Snippets of code should be wrapped in
<code> tags not
<pre> tags. In fact, <pre>
tags should generally be avoided. If they must
be used, extreme care should be
taken to ensure that their contents do not
have long lines (<70 chars), in order to prevent
horizontal scrolling (and possible janitor
intervention).
-
Want more info? How to link
or How to display code and escape characters
are good places to start.
|